{"current_steps": 5, "total_steps": 67140, "loss": 7.196, "lr": 2.978850163836759e-08, "epoch": 0.0007447125409591898, "percentage": 0.01, "elapsed_time": "0:00:01", "remaining_time": "6:42:41", "throughput": 1653.81, "total_tokens": 2976} {"current_steps": 10, "total_steps": 67140, "loss": 7.2587, "lr": 6.702412868632709e-08, "epoch": 0.0014894250819183796, "percentage": 0.01, "elapsed_time": "0:00:02", "remaining_time": "5:28:53", "throughput": 2013.89, "total_tokens": 5920} {"current_steps": 15, "total_steps": 67140, "loss": 6.546, "lr": 1.0425975573428657e-07, "epoch": 0.002234137622877569, "percentage": 0.02, "elapsed_time": "0:00:04", "remaining_time": "5:04:45", "throughput": 2161.42, "total_tokens": 8832} {"current_steps": 20, "total_steps": 67140, "loss": 6.6276, "lr": 1.4149538278224606e-07, "epoch": 0.002978850163836759, "percentage": 0.03, "elapsed_time": "0:00:05", "remaining_time": "4:51:31", "throughput": 2234.86, "total_tokens": 11648} {"current_steps": 25, "total_steps": 67140, "loss": 6.5739, "lr": 1.7873100983020555e-07, "epoch": 0.0037235627047959487, "percentage": 0.04, "elapsed_time": "0:00:06", "remaining_time": "4:42:56", "throughput": 2272.06, "total_tokens": 14368} {"current_steps": 30, "total_steps": 67140, "loss": 6.138, "lr": 2.1596663687816505e-07, "epoch": 0.004468275245755138, "percentage": 0.04, "elapsed_time": "0:00:07", "remaining_time": "4:37:50", "throughput": 2318.78, "total_tokens": 17280} {"current_steps": 35, "total_steps": 67140, "loss": 5.3035, "lr": 2.532022639261245e-07, "epoch": 0.005212987786714328, "percentage": 0.05, "elapsed_time": "0:00:08", "remaining_time": "4:34:03", "throughput": 2350.59, "total_tokens": 20160} {"current_steps": 40, "total_steps": 67140, "loss": 5.5269, "lr": 2.90437890974084e-07, "epoch": 0.005957700327673518, "percentage": 0.06, "elapsed_time": "0:00:09", "remaining_time": "4:31:42", "throughput": 2377.33, "total_tokens": 23104} {"current_steps": 45, "total_steps": 67140, "loss": 4.9813, "lr": 3.276735180220435e-07, "epoch": 0.006702412868632708, "percentage": 0.07, "elapsed_time": "0:00:10", "remaining_time": "4:29:35", "throughput": 2401.06, "total_tokens": 26048} {"current_steps": 50, "total_steps": 67140, "loss": 4.6177, "lr": 3.64909145070003e-07, "epoch": 0.0074471254095918975, "percentage": 0.07, "elapsed_time": "0:00:11", "remaining_time": "4:27:45", "throughput": 2416.01, "total_tokens": 28928} {"current_steps": 55, "total_steps": 67140, "loss": 4.1926, "lr": 4.021447721179625e-07, "epoch": 0.008191837950551088, "percentage": 0.08, "elapsed_time": "0:00:13", "remaining_time": "4:27:50", "throughput": 2448.24, "total_tokens": 32256} {"current_steps": 60, "total_steps": 67140, "loss": 4.0465, "lr": 4.3938039916592203e-07, "epoch": 0.008936550491510277, "percentage": 0.09, "elapsed_time": "0:00:14", "remaining_time": "4:26:59", "throughput": 2458.91, "total_tokens": 35232} {"current_steps": 65, "total_steps": 67140, "loss": 3.996, "lr": 4.7661602621388146e-07, "epoch": 0.009681263032469467, "percentage": 0.1, "elapsed_time": "0:00:15", "remaining_time": "4:25:45", "throughput": 2466.5, "total_tokens": 38112} {"current_steps": 70, "total_steps": 67140, "loss": 3.7153, "lr": 5.13851653261841e-07, "epoch": 0.010425975573428656, "percentage": 0.1, "elapsed_time": "0:00:16", "remaining_time": "4:25:12", "throughput": 2475.94, "total_tokens": 41120} {"current_steps": 75, "total_steps": 67140, "loss": 3.5405, "lr": 5.510872803098004e-07, "epoch": 0.011170688114387846, "percentage": 0.11, "elapsed_time": "0:00:17", "remaining_time": "4:24:40", "throughput": 2481.22, "total_tokens": 44064} {"current_steps": 80, "total_steps": 67140, "loss": 3.2765, "lr": 5.8832290735776e-07, "epoch": 0.011915400655347037, "percentage": 0.12, "elapsed_time": "0:00:18", "remaining_time": "4:23:02", "throughput": 2474.68, "total_tokens": 46592} {"current_steps": 85, "total_steps": 67140, "loss": 3.2172, "lr": 6.255585344057195e-07, "epoch": 0.012660113196306225, "percentage": 0.13, "elapsed_time": "0:00:19", "remaining_time": "4:21:36", "throughput": 2470.23, "total_tokens": 49152} {"current_steps": 90, "total_steps": 67140, "loss": 3.1597, "lr": 6.627941614536789e-07, "epoch": 0.013404825737265416, "percentage": 0.13, "elapsed_time": "0:00:20", "remaining_time": "4:20:40", "throughput": 2466.16, "total_tokens": 51776} {"current_steps": 95, "total_steps": 67140, "loss": 2.7179, "lr": 7.000297885016385e-07, "epoch": 0.014149538278224605, "percentage": 0.14, "elapsed_time": "0:00:22", "remaining_time": "4:20:11", "throughput": 2469.32, "total_tokens": 54624} {"current_steps": 100, "total_steps": 67140, "loss": 2.8843, "lr": 7.372654155495979e-07, "epoch": 0.014894250819183795, "percentage": 0.15, "elapsed_time": "0:00:23", "remaining_time": "4:19:27", "throughput": 2468.05, "total_tokens": 57312} {"current_steps": 105, "total_steps": 67140, "loss": 2.8324, "lr": 7.745010425975574e-07, "epoch": 0.015638963360142984, "percentage": 0.16, "elapsed_time": "0:00:24", "remaining_time": "4:18:56", "throughput": 2468.19, "total_tokens": 60064} {"current_steps": 110, "total_steps": 67140, "loss": 2.6194, "lr": 8.11736669645517e-07, "epoch": 0.016383675901102176, "percentage": 0.16, "elapsed_time": "0:00:25", "remaining_time": "4:19:30", "throughput": 2482.13, "total_tokens": 63424} {"current_steps": 115, "total_steps": 67140, "loss": 2.3547, "lr": 8.489722966934764e-07, "epoch": 0.017128388442061365, "percentage": 0.17, "elapsed_time": "0:00:26", "remaining_time": "4:18:52", "throughput": 2479.46, "total_tokens": 66080} {"current_steps": 120, "total_steps": 67140, "loss": 2.3412, "lr": 8.862079237414358e-07, "epoch": 0.017873100983020553, "percentage": 0.18, "elapsed_time": "0:00:27", "remaining_time": "4:19:25", "throughput": 2491.52, "total_tokens": 69440} {"current_steps": 125, "total_steps": 67140, "loss": 2.0561, "lr": 9.234435507893953e-07, "epoch": 0.018617813523979745, "percentage": 0.19, "elapsed_time": "0:00:29", "remaining_time": "4:19:11", "throughput": 2493.17, "total_tokens": 72320} {"current_steps": 130, "total_steps": 67140, "loss": 1.8618, "lr": 9.606791778373549e-07, "epoch": 0.019362526064938934, "percentage": 0.19, "elapsed_time": "0:00:30", "remaining_time": "4:18:49", "throughput": 2495.07, "total_tokens": 75168} {"current_steps": 135, "total_steps": 67140, "loss": 1.8099, "lr": 9.979148048853143e-07, "epoch": 0.020107238605898123, "percentage": 0.2, "elapsed_time": "0:00:31", "remaining_time": "4:18:45", "throughput": 2499.23, "total_tokens": 78176} {"current_steps": 140, "total_steps": 67140, "loss": 1.5512, "lr": 1.035150431933274e-06, "epoch": 0.02085195114685731, "percentage": 0.21, "elapsed_time": "0:00:32", "remaining_time": "4:18:47", "throughput": 2504.06, "total_tokens": 81248} {"current_steps": 145, "total_steps": 67140, "loss": 1.5942, "lr": 1.0723860589812334e-06, "epoch": 0.021596663687816504, "percentage": 0.22, "elapsed_time": "0:00:33", "remaining_time": "4:18:55", "throughput": 2510.57, "total_tokens": 84416} {"current_steps": 150, "total_steps": 67140, "loss": 1.4061, "lr": 1.1096216860291928e-06, "epoch": 0.022341376228775692, "percentage": 0.22, "elapsed_time": "0:00:34", "remaining_time": "4:19:02", "throughput": 2516.57, "total_tokens": 87584} {"current_steps": 155, "total_steps": 67140, "loss": 1.1484, "lr": 1.1468573130771522e-06, "epoch": 0.02308608876973488, "percentage": 0.23, "elapsed_time": "0:00:35", "remaining_time": "4:18:45", "throughput": 2515.52, "total_tokens": 90368} {"current_steps": 160, "total_steps": 67140, "loss": 1.3229, "lr": 1.1840929401251119e-06, "epoch": 0.023830801310694073, "percentage": 0.24, "elapsed_time": "0:00:37", "remaining_time": "4:18:27", "throughput": 2514.58, "total_tokens": 93152} {"current_steps": 165, "total_steps": 67140, "loss": 1.0603, "lr": 1.2213285671730713e-06, "epoch": 0.024575513851653262, "percentage": 0.25, "elapsed_time": "0:00:38", "remaining_time": "4:18:37", "throughput": 2521.2, "total_tokens": 96384} {"current_steps": 170, "total_steps": 67140, "loss": 1.1298, "lr": 1.2585641942210307e-06, "epoch": 0.02532022639261245, "percentage": 0.25, "elapsed_time": "0:00:39", "remaining_time": "4:18:23", "throughput": 2518.96, "total_tokens": 99136} {"current_steps": 175, "total_steps": 67140, "loss": 1.1053, "lr": 1.2957998212689904e-06, "epoch": 0.026064938933571643, "percentage": 0.26, "elapsed_time": "0:00:40", "remaining_time": "4:18:02", "throughput": 2516.64, "total_tokens": 101824} {"current_steps": 180, "total_steps": 67140, "loss": 1.0142, "lr": 1.3330354483169498e-06, "epoch": 0.02680965147453083, "percentage": 0.27, "elapsed_time": "0:00:41", "remaining_time": "4:18:02", "throughput": 2518.88, "total_tokens": 104832} {"current_steps": 185, "total_steps": 67140, "loss": 1.0161, "lr": 1.3702710753649092e-06, "epoch": 0.02755436401549002, "percentage": 0.28, "elapsed_time": "0:00:42", "remaining_time": "4:17:49", "throughput": 2519.29, "total_tokens": 107680} {"current_steps": 190, "total_steps": 67140, "loss": 0.9298, "lr": 1.4075067024128687e-06, "epoch": 0.02829907655644921, "percentage": 0.28, "elapsed_time": "0:00:43", "remaining_time": "4:17:41", "throughput": 2519.62, "total_tokens": 110560} {"current_steps": 195, "total_steps": 67140, "loss": 0.9707, "lr": 1.4447423294608283e-06, "epoch": 0.0290437890974084, "percentage": 0.29, "elapsed_time": "0:00:45", "remaining_time": "4:17:43", "throughput": 2524.15, "total_tokens": 113696} {"current_steps": 200, "total_steps": 67140, "loss": 1.0271, "lr": 1.4819779565087877e-06, "epoch": 0.02978850163836759, "percentage": 0.3, "elapsed_time": "0:00:46", "remaining_time": "4:17:33", "throughput": 2522.73, "total_tokens": 116480} {"current_steps": 205, "total_steps": 67140, "loss": 0.976, "lr": 1.5192135835567472e-06, "epoch": 0.03053321417932678, "percentage": 0.31, "elapsed_time": "0:00:47", "remaining_time": "4:17:41", "throughput": 2527.99, "total_tokens": 119712} {"current_steps": 210, "total_steps": 67140, "loss": 0.9068, "lr": 1.5564492106047066e-06, "epoch": 0.03127792672028597, "percentage": 0.31, "elapsed_time": "0:00:48", "remaining_time": "4:17:52", "throughput": 2532.47, "total_tokens": 122944} {"current_steps": 215, "total_steps": 67140, "loss": 0.7781, "lr": 1.593684837652666e-06, "epoch": 0.032022639261245156, "percentage": 0.32, "elapsed_time": "0:00:49", "remaining_time": "4:17:52", "throughput": 2534.62, "total_tokens": 125984} {"current_steps": 220, "total_steps": 67140, "loss": 1.0523, "lr": 1.6309204647006257e-06, "epoch": 0.03276735180220435, "percentage": 0.33, "elapsed_time": "0:00:50", "remaining_time": "4:17:59", "throughput": 2539.22, "total_tokens": 129216} {"current_steps": 225, "total_steps": 67140, "loss": 0.9772, "lr": 1.668156091748585e-06, "epoch": 0.03351206434316354, "percentage": 0.34, "elapsed_time": "0:00:51", "remaining_time": "4:17:39", "throughput": 2535.62, "total_tokens": 131808} {"current_steps": 230, "total_steps": 67140, "loss": 0.8965, "lr": 1.7053917187965447e-06, "epoch": 0.03425677688412273, "percentage": 0.34, "elapsed_time": "0:00:53", "remaining_time": "4:17:46", "throughput": 2540.0, "total_tokens": 135040} {"current_steps": 235, "total_steps": 67140, "loss": 0.9434, "lr": 1.7426273458445042e-06, "epoch": 0.03500148942508192, "percentage": 0.35, "elapsed_time": "0:00:54", "remaining_time": "4:17:31", "throughput": 2538.89, "total_tokens": 137792} {"current_steps": 240, "total_steps": 67140, "loss": 0.9646, "lr": 1.7798629728924636e-06, "epoch": 0.035746201966041107, "percentage": 0.36, "elapsed_time": "0:00:55", "remaining_time": "4:17:30", "throughput": 2540.2, "total_tokens": 140800} {"current_steps": 245, "total_steps": 67140, "loss": 0.9094, "lr": 1.817098599940423e-06, "epoch": 0.036490914507000295, "percentage": 0.36, "elapsed_time": "0:00:56", "remaining_time": "4:17:23", "throughput": 2539.1, "total_tokens": 143616} {"current_steps": 250, "total_steps": 67140, "loss": 0.9301, "lr": 1.8543342269883825e-06, "epoch": 0.03723562704795949, "percentage": 0.37, "elapsed_time": "0:00:57", "remaining_time": "4:17:21", "throughput": 2540.04, "total_tokens": 146592} {"current_steps": 255, "total_steps": 67140, "loss": 1.0944, "lr": 1.8915698540363419e-06, "epoch": 0.03798033958891868, "percentage": 0.38, "elapsed_time": "0:00:58", "remaining_time": "4:17:09", "throughput": 2539.36, "total_tokens": 149376} {"current_steps": 260, "total_steps": 67140, "loss": 0.9266, "lr": 1.9288054810843013e-06, "epoch": 0.03872505212987787, "percentage": 0.39, "elapsed_time": "0:00:59", "remaining_time": "4:17:00", "throughput": 2539.72, "total_tokens": 152256} {"current_steps": 265, "total_steps": 67140, "loss": 0.942, "lr": 1.966041108132261e-06, "epoch": 0.03946976467083706, "percentage": 0.39, "elapsed_time": "0:01:01", "remaining_time": "4:16:55", "throughput": 2540.18, "total_tokens": 155168} {"current_steps": 270, "total_steps": 67140, "loss": 0.9838, "lr": 2.0032767351802206e-06, "epoch": 0.040214477211796246, "percentage": 0.4, "elapsed_time": "0:01:02", "remaining_time": "4:16:50", "throughput": 2539.44, "total_tokens": 158016} {"current_steps": 275, "total_steps": 67140, "loss": 1.055, "lr": 2.04051236222818e-06, "epoch": 0.040959189752755434, "percentage": 0.41, "elapsed_time": "0:01:03", "remaining_time": "4:16:44", "throughput": 2541.05, "total_tokens": 160992} {"current_steps": 280, "total_steps": 67140, "loss": 0.7821, "lr": 2.0777479892761395e-06, "epoch": 0.04170390229371462, "percentage": 0.42, "elapsed_time": "0:01:04", "remaining_time": "4:16:33", "throughput": 2538.09, "total_tokens": 163616} {"current_steps": 285, "total_steps": 67140, "loss": 0.8794, "lr": 2.114983616324099e-06, "epoch": 0.04244861483467382, "percentage": 0.42, "elapsed_time": "0:01:05", "remaining_time": "4:16:29", "throughput": 2537.79, "total_tokens": 166496} {"current_steps": 290, "total_steps": 67140, "loss": 0.8459, "lr": 2.1522192433720583e-06, "epoch": 0.04319332737563301, "percentage": 0.43, "elapsed_time": "0:01:06", "remaining_time": "4:16:18", "throughput": 2537.03, "total_tokens": 169248} {"current_steps": 295, "total_steps": 67140, "loss": 0.9928, "lr": 2.1894548704200177e-06, "epoch": 0.043938039916592196, "percentage": 0.44, "elapsed_time": "0:01:07", "remaining_time": "4:16:14", "throughput": 2537.42, "total_tokens": 172160} {"current_steps": 300, "total_steps": 67140, "loss": 1.0563, "lr": 2.2266904974679776e-06, "epoch": 0.044682752457551385, "percentage": 0.45, "elapsed_time": "0:01:08", "remaining_time": "4:16:06", "throughput": 2535.67, "total_tokens": 174880} {"current_steps": 305, "total_steps": 67140, "loss": 1.009, "lr": 2.263926124515937e-06, "epoch": 0.045427464998510574, "percentage": 0.45, "elapsed_time": "0:01:10", "remaining_time": "4:15:54", "throughput": 2533.74, "total_tokens": 177536} {"current_steps": 310, "total_steps": 67140, "loss": 1.0043, "lr": 2.3011617515638965e-06, "epoch": 0.04617217753946976, "percentage": 0.46, "elapsed_time": "0:01:11", "remaining_time": "4:15:50", "throughput": 2533.3, "total_tokens": 180384} {"current_steps": 315, "total_steps": 67140, "loss": 0.8316, "lr": 2.338397378611856e-06, "epoch": 0.04691689008042895, "percentage": 0.47, "elapsed_time": "0:01:12", "remaining_time": "4:15:41", "throughput": 2531.91, "total_tokens": 183104} {"current_steps": 320, "total_steps": 67140, "loss": 0.8994, "lr": 2.3756330056598153e-06, "epoch": 0.04766160262138815, "percentage": 0.48, "elapsed_time": "0:01:13", "remaining_time": "4:15:31", "throughput": 2530.39, "total_tokens": 185792} {"current_steps": 325, "total_steps": 67140, "loss": 0.8567, "lr": 2.4128686327077747e-06, "epoch": 0.048406315162347335, "percentage": 0.48, "elapsed_time": "0:01:14", "remaining_time": "4:15:28", "throughput": 2530.07, "total_tokens": 188640} {"current_steps": 330, "total_steps": 67140, "loss": 0.9353, "lr": 2.4501042597557346e-06, "epoch": 0.049151027703306524, "percentage": 0.49, "elapsed_time": "0:01:15", "remaining_time": "4:15:18", "throughput": 2528.58, "total_tokens": 191328} {"current_steps": 335, "total_steps": 67140, "loss": 0.8509, "lr": 2.487339886803694e-06, "epoch": 0.04989574024426571, "percentage": 0.5, "elapsed_time": "0:01:16", "remaining_time": "4:15:24", "throughput": 2530.5, "total_tokens": 194464} {"current_steps": 340, "total_steps": 67140, "loss": 0.9665, "lr": 2.5245755138516535e-06, "epoch": 0.0506404527852249, "percentage": 0.51, "elapsed_time": "0:01:17", "remaining_time": "4:15:06", "throughput": 2528.11, "total_tokens": 196960} {"current_steps": 345, "total_steps": 67140, "loss": 0.8715, "lr": 2.561811140899613e-06, "epoch": 0.05138516532618409, "percentage": 0.51, "elapsed_time": "0:01:19", "remaining_time": "4:15:01", "throughput": 2528.58, "total_tokens": 199840} {"current_steps": 350, "total_steps": 67140, "loss": 0.8209, "lr": 2.5990467679475723e-06, "epoch": 0.052129877867143286, "percentage": 0.52, "elapsed_time": "0:01:20", "remaining_time": "4:14:52", "throughput": 2527.63, "total_tokens": 202560} {"current_steps": 355, "total_steps": 67140, "loss": 0.8802, "lr": 2.6362823949955317e-06, "epoch": 0.052874590408102475, "percentage": 0.53, "elapsed_time": "0:01:21", "remaining_time": "4:14:56", "throughput": 2528.6, "total_tokens": 205600} {"current_steps": 360, "total_steps": 67140, "loss": 0.8617, "lr": 2.673518022043491e-06, "epoch": 0.05361930294906166, "percentage": 0.54, "elapsed_time": "0:01:22", "remaining_time": "4:14:59", "throughput": 2530.03, "total_tokens": 208672} {"current_steps": 365, "total_steps": 67140, "loss": 0.8325, "lr": 2.710753649091451e-06, "epoch": 0.05436401549002085, "percentage": 0.54, "elapsed_time": "0:01:23", "remaining_time": "4:14:56", "throughput": 2529.72, "total_tokens": 211520} {"current_steps": 370, "total_steps": 67140, "loss": 1.0399, "lr": 2.7479892761394105e-06, "epoch": 0.05510872803098004, "percentage": 0.55, "elapsed_time": "0:01:24", "remaining_time": "4:14:57", "throughput": 2530.28, "total_tokens": 214496} {"current_steps": 375, "total_steps": 67140, "loss": 0.8416, "lr": 2.78522490318737e-06, "epoch": 0.05585344057193923, "percentage": 0.56, "elapsed_time": "0:01:25", "remaining_time": "4:14:49", "throughput": 2529.42, "total_tokens": 217216} {"current_steps": 380, "total_steps": 67140, "loss": 0.931, "lr": 2.8224605302353293e-06, "epoch": 0.05659815311289842, "percentage": 0.57, "elapsed_time": "0:01:27", "remaining_time": "4:14:46", "throughput": 2528.48, "total_tokens": 220000} {"current_steps": 385, "total_steps": 67140, "loss": 1.0547, "lr": 2.8596961572832887e-06, "epoch": 0.057342865653857614, "percentage": 0.57, "elapsed_time": "0:01:28", "remaining_time": "4:14:42", "throughput": 2527.98, "total_tokens": 222816} {"current_steps": 390, "total_steps": 67140, "loss": 0.841, "lr": 2.896931784331248e-06, "epoch": 0.0580875781948168, "percentage": 0.58, "elapsed_time": "0:01:29", "remaining_time": "4:14:38", "throughput": 2527.99, "total_tokens": 225664} {"current_steps": 395, "total_steps": 67140, "loss": 0.8392, "lr": 2.9341674113792076e-06, "epoch": 0.05883229073577599, "percentage": 0.59, "elapsed_time": "0:01:30", "remaining_time": "4:14:46", "throughput": 2529.14, "total_tokens": 228800} {"current_steps": 400, "total_steps": 67140, "loss": 0.8746, "lr": 2.9714030384271675e-06, "epoch": 0.05957700327673518, "percentage": 0.6, "elapsed_time": "0:01:31", "remaining_time": "4:14:55", "throughput": 2531.5, "total_tokens": 232064} {"current_steps": 405, "total_steps": 67140, "loss": 0.7465, "lr": 3.008638665475127e-06, "epoch": 0.06032171581769437, "percentage": 0.6, "elapsed_time": "0:01:32", "remaining_time": "4:14:50", "throughput": 2531.18, "total_tokens": 234880} {"current_steps": 410, "total_steps": 67140, "loss": 0.9453, "lr": 3.0458742925230863e-06, "epoch": 0.06106642835865356, "percentage": 0.61, "elapsed_time": "0:01:33", "remaining_time": "4:14:49", "throughput": 2531.98, "total_tokens": 237856} {"current_steps": 415, "total_steps": 67140, "loss": 0.9598, "lr": 3.0831099195710457e-06, "epoch": 0.06181114089961275, "percentage": 0.62, "elapsed_time": "0:01:35", "remaining_time": "4:14:44", "throughput": 2531.05, "total_tokens": 240608} {"current_steps": 420, "total_steps": 67140, "loss": 0.8648, "lr": 3.120345546619005e-06, "epoch": 0.06255585344057193, "percentage": 0.63, "elapsed_time": "0:01:36", "remaining_time": "4:14:33", "throughput": 2529.18, "total_tokens": 243168} {"current_steps": 425, "total_steps": 67140, "loss": 0.8792, "lr": 3.1575811736669646e-06, "epoch": 0.06330056598153112, "percentage": 0.63, "elapsed_time": "0:01:37", "remaining_time": "4:14:36", "throughput": 2530.99, "total_tokens": 246304} {"current_steps": 430, "total_steps": 67140, "loss": 1.0397, "lr": 3.194816800714924e-06, "epoch": 0.06404527852249031, "percentage": 0.64, "elapsed_time": "0:01:38", "remaining_time": "4:14:30", "throughput": 2529.87, "total_tokens": 249024} {"current_steps": 435, "total_steps": 67140, "loss": 0.941, "lr": 3.2320524277628835e-06, "epoch": 0.06478999106344951, "percentage": 0.65, "elapsed_time": "0:01:39", "remaining_time": "4:14:32", "throughput": 2532.4, "total_tokens": 252224} {"current_steps": 440, "total_steps": 67140, "loss": 0.983, "lr": 3.269288054810843e-06, "epoch": 0.0655347036044087, "percentage": 0.66, "elapsed_time": "0:01:40", "remaining_time": "4:14:25", "throughput": 2530.77, "total_tokens": 254848} {"current_steps": 445, "total_steps": 67140, "loss": 0.9496, "lr": 3.3065236818588023e-06, "epoch": 0.06627941614536789, "percentage": 0.66, "elapsed_time": "0:01:41", "remaining_time": "4:14:24", "throughput": 2530.85, "total_tokens": 257760} {"current_steps": 450, "total_steps": 67140, "loss": 0.8912, "lr": 3.3437593089067626e-06, "epoch": 0.06702412868632708, "percentage": 0.67, "elapsed_time": "0:01:42", "remaining_time": "4:14:17", "throughput": 2529.21, "total_tokens": 260384} {"current_steps": 455, "total_steps": 67140, "loss": 0.8947, "lr": 3.380994935954722e-06, "epoch": 0.06776884122728627, "percentage": 0.68, "elapsed_time": "0:01:44", "remaining_time": "4:14:16", "throughput": 2529.88, "total_tokens": 263360} {"current_steps": 460, "total_steps": 67140, "loss": 0.8604, "lr": 3.4182305630026814e-06, "epoch": 0.06851355376824546, "percentage": 0.69, "elapsed_time": "0:01:45", "remaining_time": "4:14:11", "throughput": 2529.23, "total_tokens": 266112} {"current_steps": 465, "total_steps": 67140, "loss": 0.8826, "lr": 3.455466190050641e-06, "epoch": 0.06925826630920465, "percentage": 0.69, "elapsed_time": "0:01:46", "remaining_time": "4:14:01", "throughput": 2527.59, "total_tokens": 268672} {"current_steps": 470, "total_steps": 67140, "loss": 0.8912, "lr": 3.4927018170986003e-06, "epoch": 0.07000297885016384, "percentage": 0.7, "elapsed_time": "0:01:47", "remaining_time": "4:13:55", "throughput": 2526.21, "total_tokens": 271328} {"current_steps": 475, "total_steps": 67140, "loss": 0.8963, "lr": 3.5299374441465597e-06, "epoch": 0.07074769139112302, "percentage": 0.71, "elapsed_time": "0:01:48", "remaining_time": "4:13:51", "throughput": 2526.0, "total_tokens": 274144} {"current_steps": 480, "total_steps": 67140, "loss": 0.806, "lr": 3.567173071194519e-06, "epoch": 0.07149240393208221, "percentage": 0.71, "elapsed_time": "0:01:49", "remaining_time": "4:13:48", "throughput": 2526.22, "total_tokens": 277024} {"current_steps": 485, "total_steps": 67140, "loss": 0.9033, "lr": 3.6044086982424786e-06, "epoch": 0.0722371164730414, "percentage": 0.72, "elapsed_time": "0:01:50", "remaining_time": "4:13:46", "throughput": 2525.81, "total_tokens": 279840} {"current_steps": 490, "total_steps": 67140, "loss": 0.8872, "lr": 3.641644325290438e-06, "epoch": 0.07298182901400059, "percentage": 0.73, "elapsed_time": "0:01:52", "remaining_time": "4:13:55", "throughput": 2528.3, "total_tokens": 283200} {"current_steps": 495, "total_steps": 67140, "loss": 0.8645, "lr": 3.6788799523383975e-06, "epoch": 0.07372654155495978, "percentage": 0.74, "elapsed_time": "0:01:53", "remaining_time": "4:13:54", "throughput": 2527.76, "total_tokens": 286016} {"current_steps": 500, "total_steps": 67140, "loss": 0.8283, "lr": 3.716115579386357e-06, "epoch": 0.07447125409591898, "percentage": 0.74, "elapsed_time": "0:01:54", "remaining_time": "4:13:50", "throughput": 2527.77, "total_tokens": 288864} {"current_steps": 505, "total_steps": 67140, "loss": 1.0209, "lr": 3.7533512064343163e-06, "epoch": 0.07521596663687817, "percentage": 0.75, "elapsed_time": "0:01:55", "remaining_time": "4:13:50", "throughput": 2528.89, "total_tokens": 291904} {"current_steps": 510, "total_steps": 67140, "loss": 1.235, "lr": 3.7905868334822757e-06, "epoch": 0.07596067917783736, "percentage": 0.76, "elapsed_time": "0:01:56", "remaining_time": "4:13:45", "throughput": 2528.68, "total_tokens": 294688} {"current_steps": 515, "total_steps": 67140, "loss": 0.9427, "lr": 3.827822460530236e-06, "epoch": 0.07670539171879655, "percentage": 0.77, "elapsed_time": "0:01:57", "remaining_time": "4:13:48", "throughput": 2529.78, "total_tokens": 297792} {"current_steps": 520, "total_steps": 67140, "loss": 0.886, "lr": 3.8650580875781954e-06, "epoch": 0.07745010425975574, "percentage": 0.77, "elapsed_time": "0:01:58", "remaining_time": "4:13:45", "throughput": 2530.48, "total_tokens": 300736} {"current_steps": 525, "total_steps": 67140, "loss": 0.8543, "lr": 3.9022937146261545e-06, "epoch": 0.07819481680071493, "percentage": 0.78, "elapsed_time": "0:01:59", "remaining_time": "4:13:41", "throughput": 2529.9, "total_tokens": 303488} {"current_steps": 530, "total_steps": 67140, "loss": 0.7119, "lr": 3.939529341674114e-06, "epoch": 0.07893952934167411, "percentage": 0.79, "elapsed_time": "0:02:01", "remaining_time": "4:13:44", "throughput": 2531.18, "total_tokens": 306624} {"current_steps": 535, "total_steps": 67140, "loss": 0.8965, "lr": 3.976764968722073e-06, "epoch": 0.0796842418826333, "percentage": 0.8, "elapsed_time": "0:02:02", "remaining_time": "4:13:47", "throughput": 2532.69, "total_tokens": 309792} {"current_steps": 540, "total_steps": 67140, "loss": 0.9347, "lr": 4.014000595770033e-06, "epoch": 0.08042895442359249, "percentage": 0.8, "elapsed_time": "0:02:03", "remaining_time": "4:13:43", "throughput": 2532.34, "total_tokens": 312576} {"current_steps": 545, "total_steps": 67140, "loss": 0.9361, "lr": 4.051236222817992e-06, "epoch": 0.08117366696455168, "percentage": 0.81, "elapsed_time": "0:02:04", "remaining_time": "4:13:39", "throughput": 2532.01, "total_tokens": 315360} {"current_steps": 550, "total_steps": 67140, "loss": 1.0087, "lr": 4.088471849865952e-06, "epoch": 0.08191837950551087, "percentage": 0.82, "elapsed_time": "0:02:05", "remaining_time": "4:13:31", "throughput": 2531.15, "total_tokens": 318016} {"current_steps": 555, "total_steps": 67140, "loss": 0.8295, "lr": 4.125707476913911e-06, "epoch": 0.08266309204647006, "percentage": 0.83, "elapsed_time": "0:02:06", "remaining_time": "4:13:28", "throughput": 2530.44, "total_tokens": 320768} {"current_steps": 560, "total_steps": 67140, "loss": 0.8625, "lr": 4.162943103961871e-06, "epoch": 0.08340780458742925, "percentage": 0.83, "elapsed_time": "0:02:07", "remaining_time": "4:13:25", "throughput": 2530.85, "total_tokens": 323680} {"current_steps": 565, "total_steps": 67140, "loss": 0.9651, "lr": 4.20017873100983e-06, "epoch": 0.08415251712838845, "percentage": 0.84, "elapsed_time": "0:02:09", "remaining_time": "4:13:25", "throughput": 2531.14, "total_tokens": 326624} {"current_steps": 570, "total_steps": 67140, "loss": 0.9424, "lr": 4.23741435805779e-06, "epoch": 0.08489722966934764, "percentage": 0.85, "elapsed_time": "0:02:10", "remaining_time": "4:13:18", "throughput": 2529.87, "total_tokens": 329216} {"current_steps": 575, "total_steps": 67140, "loss": 0.879, "lr": 4.274649985105749e-06, "epoch": 0.08564194221030683, "percentage": 0.86, "elapsed_time": "0:02:11", "remaining_time": "4:13:12", "throughput": 2529.03, "total_tokens": 331904} {"current_steps": 580, "total_steps": 67140, "loss": 0.855, "lr": 4.3118856121537094e-06, "epoch": 0.08638665475126601, "percentage": 0.86, "elapsed_time": "0:02:12", "remaining_time": "4:13:10", "throughput": 2528.9, "total_tokens": 334752} {"current_steps": 585, "total_steps": 67140, "loss": 0.818, "lr": 4.3491212392016685e-06, "epoch": 0.0871313672922252, "percentage": 0.87, "elapsed_time": "0:02:13", "remaining_time": "4:13:15", "throughput": 2530.42, "total_tokens": 337984} {"current_steps": 590, "total_steps": 67140, "loss": 0.9237, "lr": 4.386356866249628e-06, "epoch": 0.08787607983318439, "percentage": 0.88, "elapsed_time": "0:02:14", "remaining_time": "4:13:11", "throughput": 2530.41, "total_tokens": 340800} {"current_steps": 595, "total_steps": 67140, "loss": 0.7448, "lr": 4.423592493297587e-06, "epoch": 0.08862079237414358, "percentage": 0.89, "elapsed_time": "0:02:15", "remaining_time": "4:13:05", "throughput": 2529.28, "total_tokens": 343424} {"current_steps": 600, "total_steps": 67140, "loss": 1.0281, "lr": 4.460828120345547e-06, "epoch": 0.08936550491510277, "percentage": 0.89, "elapsed_time": "0:02:16", "remaining_time": "4:13:11", "throughput": 2531.15, "total_tokens": 346720} {"current_steps": 605, "total_steps": 67140, "loss": 0.9625, "lr": 4.498063747393506e-06, "epoch": 0.09011021745606196, "percentage": 0.9, "elapsed_time": "0:02:18", "remaining_time": "4:13:11", "throughput": 2531.72, "total_tokens": 349728} {"current_steps": 610, "total_steps": 67140, "loss": 0.8841, "lr": 4.535299374441466e-06, "epoch": 0.09085492999702115, "percentage": 0.91, "elapsed_time": "0:02:19", "remaining_time": "4:13:05", "throughput": 2530.67, "total_tokens": 352352} {"current_steps": 615, "total_steps": 67140, "loss": 0.7964, "lr": 4.572535001489425e-06, "epoch": 0.09159964253798034, "percentage": 0.92, "elapsed_time": "0:02:20", "remaining_time": "4:13:02", "throughput": 2530.51, "total_tokens": 355168} {"current_steps": 620, "total_steps": 67140, "loss": 0.8582, "lr": 4.609770628537385e-06, "epoch": 0.09234435507893952, "percentage": 0.92, "elapsed_time": "0:02:21", "remaining_time": "4:12:58", "throughput": 2530.01, "total_tokens": 357920} {"current_steps": 625, "total_steps": 67140, "loss": 0.9372, "lr": 4.647006255585344e-06, "epoch": 0.09308906761989871, "percentage": 0.93, "elapsed_time": "0:02:22", "remaining_time": "4:12:56", "throughput": 2529.45, "total_tokens": 360704} {"current_steps": 630, "total_steps": 67140, "loss": 0.8964, "lr": 4.684241882633304e-06, "epoch": 0.0938337801608579, "percentage": 0.94, "elapsed_time": "0:02:23", "remaining_time": "4:12:58", "throughput": 2530.87, "total_tokens": 363872} {"current_steps": 635, "total_steps": 67140, "loss": 0.8797, "lr": 4.721477509681263e-06, "epoch": 0.0945784927018171, "percentage": 0.95, "elapsed_time": "0:02:24", "remaining_time": "4:13:00", "throughput": 2531.87, "total_tokens": 366976} {"current_steps": 640, "total_steps": 67140, "loss": 0.8006, "lr": 4.758713136729223e-06, "epoch": 0.0953232052427763, "percentage": 0.95, "elapsed_time": "0:02:26", "remaining_time": "4:12:58", "throughput": 2531.64, "total_tokens": 369824} {"current_steps": 645, "total_steps": 67140, "loss": 0.8516, "lr": 4.7959487637771824e-06, "epoch": 0.09606791778373548, "percentage": 0.96, "elapsed_time": "0:02:27", "remaining_time": "4:12:57", "throughput": 2532.47, "total_tokens": 372832} {"current_steps": 650, "total_steps": 67140, "loss": 0.9315, "lr": 4.833184390825142e-06, "epoch": 0.09681263032469467, "percentage": 0.97, "elapsed_time": "0:02:28", "remaining_time": "4:12:58", "throughput": 2533.18, "total_tokens": 375872} {"current_steps": 655, "total_steps": 67140, "loss": 0.8474, "lr": 4.870420017873101e-06, "epoch": 0.09755734286565386, "percentage": 0.98, "elapsed_time": "0:02:29", "remaining_time": "4:12:56", "throughput": 2533.14, "total_tokens": 378752} {"current_steps": 660, "total_steps": 67140, "loss": 0.8887, "lr": 4.907655644921061e-06, "epoch": 0.09830205540661305, "percentage": 0.98, "elapsed_time": "0:02:30", "remaining_time": "4:12:54", "throughput": 2533.18, "total_tokens": 381632} {"current_steps": 665, "total_steps": 67140, "loss": 0.8347, "lr": 4.94489127196902e-06, "epoch": 0.09904676794757224, "percentage": 0.99, "elapsed_time": "0:02:31", "remaining_time": "4:12:57", "throughput": 2534.54, "total_tokens": 384832} {"current_steps": 670, "total_steps": 67140, "loss": 0.7682, "lr": 4.98212689901698e-06, "epoch": 0.09979148048853143, "percentage": 1.0, "elapsed_time": "0:02:33", "remaining_time": "4:13:02", "throughput": 2536.59, "total_tokens": 388192} {"current_steps": 675, "total_steps": 67140, "loss": 0.9034, "lr": 5.019362526064939e-06, "epoch": 0.10053619302949061, "percentage": 1.01, "elapsed_time": "0:02:34", "remaining_time": "4:13:01", "throughput": 2536.56, "total_tokens": 391072} {"current_steps": 680, "total_steps": 67140, "loss": 1.1481, "lr": 5.056598153112899e-06, "epoch": 0.1012809055704498, "percentage": 1.01, "elapsed_time": "0:02:35", "remaining_time": "4:12:56", "throughput": 2536.06, "total_tokens": 393792} {"current_steps": 685, "total_steps": 67140, "loss": 0.9595, "lr": 5.093833780160858e-06, "epoch": 0.10202561811140899, "percentage": 1.02, "elapsed_time": "0:02:36", "remaining_time": "4:12:56", "throughput": 2536.56, "total_tokens": 396800} {"current_steps": 690, "total_steps": 67140, "loss": 0.8885, "lr": 5.131069407208818e-06, "epoch": 0.10277033065236818, "percentage": 1.03, "elapsed_time": "0:02:37", "remaining_time": "4:12:54", "throughput": 2536.33, "total_tokens": 399648} {"current_steps": 695, "total_steps": 67140, "loss": 0.7986, "lr": 5.168305034256777e-06, "epoch": 0.10351504319332737, "percentage": 1.04, "elapsed_time": "0:02:38", "remaining_time": "4:12:52", "throughput": 2536.38, "total_tokens": 402528} {"current_steps": 700, "total_steps": 67140, "loss": 0.8624, "lr": 5.205540661304737e-06, "epoch": 0.10425975573428657, "percentage": 1.04, "elapsed_time": "0:02:39", "remaining_time": "4:12:54", "throughput": 2537.54, "total_tokens": 405696} {"current_steps": 705, "total_steps": 67140, "loss": 0.857, "lr": 5.242776288352696e-06, "epoch": 0.10500446827524576, "percentage": 1.05, "elapsed_time": "0:02:41", "remaining_time": "4:12:56", "throughput": 2538.64, "total_tokens": 408864} {"current_steps": 710, "total_steps": 67140, "loss": 0.8417, "lr": 5.2800119154006555e-06, "epoch": 0.10574918081620495, "percentage": 1.06, "elapsed_time": "0:02:42", "remaining_time": "4:12:53", "throughput": 2538.17, "total_tokens": 411616} {"current_steps": 715, "total_steps": 67140, "loss": 0.8854, "lr": 5.317247542448615e-06, "epoch": 0.10649389335716414, "percentage": 1.06, "elapsed_time": "0:02:43", "remaining_time": "4:12:53", "throughput": 2538.08, "total_tokens": 414528} {"current_steps": 720, "total_steps": 67140, "loss": 0.8461, "lr": 5.354483169496575e-06, "epoch": 0.10723860589812333, "percentage": 1.07, "elapsed_time": "0:02:44", "remaining_time": "4:12:51", "throughput": 2538.25, "total_tokens": 417440} {"current_steps": 725, "total_steps": 67140, "loss": 0.7645, "lr": 5.391718796544534e-06, "epoch": 0.10798331843908252, "percentage": 1.08, "elapsed_time": "0:02:45", "remaining_time": "4:12:49", "throughput": 2538.11, "total_tokens": 420288} {"current_steps": 730, "total_steps": 67140, "loss": 0.9127, "lr": 5.428954423592494e-06, "epoch": 0.1087280309800417, "percentage": 1.09, "elapsed_time": "0:02:46", "remaining_time": "4:12:47", "throughput": 2538.06, "total_tokens": 423168} {"current_steps": 735, "total_steps": 67140, "loss": 0.8004, "lr": 5.466190050640453e-06, "epoch": 0.10947274352100089, "percentage": 1.09, "elapsed_time": "0:02:47", "remaining_time": "4:12:46", "throughput": 2538.68, "total_tokens": 426176} {"current_steps": 740, "total_steps": 67140, "loss": 0.8383, "lr": 5.503425677688413e-06, "epoch": 0.11021745606196008, "percentage": 1.1, "elapsed_time": "0:02:49", "remaining_time": "4:12:49", "throughput": 2539.69, "total_tokens": 429344} {"current_steps": 745, "total_steps": 67140, "loss": 0.8357, "lr": 5.540661304736372e-06, "epoch": 0.11096216860291927, "percentage": 1.11, "elapsed_time": "0:02:50", "remaining_time": "4:12:43", "throughput": 2539.15, "total_tokens": 432032} {"current_steps": 750, "total_steps": 67140, "loss": 0.9268, "lr": 5.577896931784332e-06, "epoch": 0.11170688114387846, "percentage": 1.12, "elapsed_time": "0:02:51", "remaining_time": "4:12:40", "throughput": 2538.66, "total_tokens": 434784} {"current_steps": 755, "total_steps": 67140, "loss": 0.8091, "lr": 5.615132558832291e-06, "epoch": 0.11245159368483765, "percentage": 1.12, "elapsed_time": "0:02:52", "remaining_time": "4:12:42", "throughput": 2539.71, "total_tokens": 437952} {"current_steps": 760, "total_steps": 67140, "loss": 0.8245, "lr": 5.652368185880251e-06, "epoch": 0.11319630622579684, "percentage": 1.13, "elapsed_time": "0:02:53", "remaining_time": "4:12:39", "throughput": 2539.01, "total_tokens": 440672} {"current_steps": 765, "total_steps": 67140, "loss": 0.9108, "lr": 5.68960381292821e-06, "epoch": 0.11394101876675604, "percentage": 1.14, "elapsed_time": "0:02:54", "remaining_time": "4:12:39", "throughput": 2539.36, "total_tokens": 443680} {"current_steps": 770, "total_steps": 67140, "loss": 0.849, "lr": 5.7268394399761695e-06, "epoch": 0.11468573130771523, "percentage": 1.15, "elapsed_time": "0:02:55", "remaining_time": "4:12:35", "throughput": 2538.87, "total_tokens": 446400} {"current_steps": 775, "total_steps": 67140, "loss": 0.8606, "lr": 5.7640750670241285e-06, "epoch": 0.11543044384867442, "percentage": 1.15, "elapsed_time": "0:02:56", "remaining_time": "4:12:32", "throughput": 2538.47, "total_tokens": 449184} {"current_steps": 780, "total_steps": 67140, "loss": 0.8904, "lr": 5.801310694072089e-06, "epoch": 0.1161751563896336, "percentage": 1.16, "elapsed_time": "0:02:58", "remaining_time": "4:12:29", "throughput": 2538.47, "total_tokens": 452032} {"current_steps": 785, "total_steps": 67140, "loss": 0.9192, "lr": 5.838546321120048e-06, "epoch": 0.1169198689305928, "percentage": 1.17, "elapsed_time": "0:02:59", "remaining_time": "4:12:30", "throughput": 2538.96, "total_tokens": 455072} {"current_steps": 790, "total_steps": 67140, "loss": 0.8831, "lr": 5.875781948168008e-06, "epoch": 0.11766458147155198, "percentage": 1.18, "elapsed_time": "0:03:00", "remaining_time": "4:12:26", "throughput": 2538.31, "total_tokens": 457760} {"current_steps": 795, "total_steps": 67140, "loss": 0.8503, "lr": 5.913017575215967e-06, "epoch": 0.11840929401251117, "percentage": 1.18, "elapsed_time": "0:03:01", "remaining_time": "4:12:23", "throughput": 2538.3, "total_tokens": 460608} {"current_steps": 800, "total_steps": 67140, "loss": 0.7846, "lr": 5.950253202263927e-06, "epoch": 0.11915400655347036, "percentage": 1.19, "elapsed_time": "0:03:02", "remaining_time": "4:12:23", "throughput": 2537.94, "total_tokens": 463456} {"current_steps": 805, "total_steps": 67140, "loss": 0.8532, "lr": 5.987488829311886e-06, "epoch": 0.11989871909442955, "percentage": 1.2, "elapsed_time": "0:03:03", "remaining_time": "4:12:20", "throughput": 2538.05, "total_tokens": 466336} {"current_steps": 810, "total_steps": 67140, "loss": 0.8915, "lr": 6.024724456359846e-06, "epoch": 0.12064343163538874, "percentage": 1.21, "elapsed_time": "0:03:04", "remaining_time": "4:12:19", "throughput": 2538.33, "total_tokens": 469280} {"current_steps": 815, "total_steps": 67140, "loss": 0.8188, "lr": 6.061960083407805e-06, "epoch": 0.12138814417634793, "percentage": 1.21, "elapsed_time": "0:03:06", "remaining_time": "4:12:17", "throughput": 2538.1, "total_tokens": 472096} {"current_steps": 820, "total_steps": 67140, "loss": 0.8545, "lr": 6.099195710455765e-06, "epoch": 0.12213285671730711, "percentage": 1.22, "elapsed_time": "0:03:07", "remaining_time": "4:12:14", "throughput": 2538.04, "total_tokens": 474944} {"current_steps": 825, "total_steps": 67140, "loss": 0.8171, "lr": 6.136431337503724e-06, "epoch": 0.1228775692582663, "percentage": 1.23, "elapsed_time": "0:03:08", "remaining_time": "4:12:12", "throughput": 2537.53, "total_tokens": 477696} {"current_steps": 830, "total_steps": 67140, "loss": 0.8097, "lr": 6.1736669645516834e-06, "epoch": 0.1236222817992255, "percentage": 1.24, "elapsed_time": "0:03:09", "remaining_time": "4:12:12", "throughput": 2537.76, "total_tokens": 480672} {"current_steps": 835, "total_steps": 67140, "loss": 0.8718, "lr": 6.2109025915996425e-06, "epoch": 0.1243669943401847, "percentage": 1.24, "elapsed_time": "0:03:10", "remaining_time": "4:12:12", "throughput": 2538.18, "total_tokens": 483712} {"current_steps": 840, "total_steps": 67140, "loss": 0.8227, "lr": 6.248138218647602e-06, "epoch": 0.12511170688114387, "percentage": 1.25, "elapsed_time": "0:03:11", "remaining_time": "4:12:10", "throughput": 2538.06, "total_tokens": 486528} {"current_steps": 845, "total_steps": 67140, "loss": 0.7903, "lr": 6.285373845695562e-06, "epoch": 0.12585641942210307, "percentage": 1.26, "elapsed_time": "0:03:12", "remaining_time": "4:12:05", "throughput": 2537.44, "total_tokens": 489184} {"current_steps": 850, "total_steps": 67140, "loss": 0.8724, "lr": 6.322609472743521e-06, "epoch": 0.12660113196306225, "percentage": 1.27, "elapsed_time": "0:03:13", "remaining_time": "4:12:04", "throughput": 2537.42, "total_tokens": 492096} {"current_steps": 855, "total_steps": 67140, "loss": 0.937, "lr": 6.359845099791481e-06, "epoch": 0.12734584450402145, "percentage": 1.27, "elapsed_time": "0:03:15", "remaining_time": "4:12:06", "throughput": 2537.9, "total_tokens": 495168} {"current_steps": 860, "total_steps": 67140, "loss": 0.8293, "lr": 6.39708072683944e-06, "epoch": 0.12809055704498062, "percentage": 1.28, "elapsed_time": "0:03:16", "remaining_time": "4:12:04", "throughput": 2538.17, "total_tokens": 498112} {"current_steps": 865, "total_steps": 67140, "loss": 0.8206, "lr": 6.4343163538874e-06, "epoch": 0.12883526958593983, "percentage": 1.29, "elapsed_time": "0:03:17", "remaining_time": "4:12:07", "throughput": 2538.62, "total_tokens": 501216} {"current_steps": 870, "total_steps": 67140, "loss": 0.7863, "lr": 6.471551980935359e-06, "epoch": 0.12957998212689903, "percentage": 1.3, "elapsed_time": "0:03:18", "remaining_time": "4:12:04", "throughput": 2538.3, "total_tokens": 504000} {"current_steps": 875, "total_steps": 67140, "loss": 0.8806, "lr": 6.508787607983319e-06, "epoch": 0.1303246946678582, "percentage": 1.3, "elapsed_time": "0:03:19", "remaining_time": "4:12:02", "throughput": 2538.53, "total_tokens": 506912} {"current_steps": 880, "total_steps": 67140, "loss": 0.8242, "lr": 6.546023235031279e-06, "epoch": 0.1310694072088174, "percentage": 1.31, "elapsed_time": "0:03:20", "remaining_time": "4:12:00", "throughput": 2538.21, "total_tokens": 509696} {"current_steps": 885, "total_steps": 67140, "loss": 0.8784, "lr": 6.583258862079238e-06, "epoch": 0.13181411974977658, "percentage": 1.32, "elapsed_time": "0:03:21", "remaining_time": "4:11:58", "throughput": 2538.08, "total_tokens": 512544} {"current_steps": 890, "total_steps": 67140, "loss": 1.013, "lr": 6.6204944891271974e-06, "epoch": 0.13255883229073578, "percentage": 1.33, "elapsed_time": "0:03:23", "remaining_time": "4:11:55", "throughput": 2538.08, "total_tokens": 515392} {"current_steps": 895, "total_steps": 67140, "loss": 0.8238, "lr": 6.6577301161751565e-06, "epoch": 0.13330354483169496, "percentage": 1.33, "elapsed_time": "0:03:24", "remaining_time": "4:11:56", "throughput": 2539.08, "total_tokens": 518560} {"current_steps": 900, "total_steps": 67140, "loss": 0.8272, "lr": 6.694965743223116e-06, "epoch": 0.13404825737265416, "percentage": 1.34, "elapsed_time": "0:03:25", "remaining_time": "4:11:54", "throughput": 2539.2, "total_tokens": 521440} {"current_steps": 905, "total_steps": 67140, "loss": 0.8323, "lr": 6.732201370271075e-06, "epoch": 0.13479296991361334, "percentage": 1.35, "elapsed_time": "0:03:26", "remaining_time": "4:11:52", "throughput": 2539.32, "total_tokens": 524352} {"current_steps": 910, "total_steps": 67140, "loss": 1.0111, "lr": 6.769436997319035e-06, "epoch": 0.13553768245457254, "percentage": 1.36, "elapsed_time": "0:03:27", "remaining_time": "4:11:57", "throughput": 2540.97, "total_tokens": 527808} {"current_steps": 915, "total_steps": 67140, "loss": 1.2627, "lr": 6.806672624366994e-06, "epoch": 0.1362823949955317, "percentage": 1.36, "elapsed_time": "0:03:28", "remaining_time": "4:11:55", "throughput": 2541.06, "total_tokens": 530688} {"current_steps": 920, "total_steps": 67140, "loss": 0.9499, "lr": 6.843908251414954e-06, "epoch": 0.13702710753649092, "percentage": 1.37, "elapsed_time": "0:03:29", "remaining_time": "4:11:52", "throughput": 2540.51, "total_tokens": 533408} {"current_steps": 925, "total_steps": 67140, "loss": 0.8445, "lr": 6.881143878462913e-06, "epoch": 0.1377718200774501, "percentage": 1.38, "elapsed_time": "0:03:31", "remaining_time": "4:11:52", "throughput": 2541.08, "total_tokens": 536480} {"current_steps": 930, "total_steps": 67140, "loss": 0.8811, "lr": 6.918379505510873e-06, "epoch": 0.1385165326184093, "percentage": 1.39, "elapsed_time": "0:03:32", "remaining_time": "4:11:47", "throughput": 2540.3, "total_tokens": 539072} {"current_steps": 935, "total_steps": 67140, "loss": 1.0344, "lr": 6.955615132558832e-06, "epoch": 0.1392612451593685, "percentage": 1.39, "elapsed_time": "0:03:33", "remaining_time": "4:11:49", "throughput": 2541.02, "total_tokens": 542208} {"current_steps": 940, "total_steps": 67140, "loss": 0.9861, "lr": 6.992850759606792e-06, "epoch": 0.14000595770032767, "percentage": 1.4, "elapsed_time": "0:03:34", "remaining_time": "4:11:48", "throughput": 2541.2, "total_tokens": 545152} {"current_steps": 945, "total_steps": 67140, "loss": 0.941, "lr": 7.0300863866547524e-06, "epoch": 0.14075067024128687, "percentage": 1.41, "elapsed_time": "0:03:35", "remaining_time": "4:11:43", "throughput": 2540.55, "total_tokens": 547776} {"current_steps": 950, "total_steps": 67140, "loss": 0.8363, "lr": 7.067322013702711e-06, "epoch": 0.14149538278224605, "percentage": 1.41, "elapsed_time": "0:03:36", "remaining_time": "4:11:40", "throughput": 2540.65, "total_tokens": 550656} {"current_steps": 955, "total_steps": 67140, "loss": 0.858, "lr": 7.104557640750671e-06, "epoch": 0.14224009532320525, "percentage": 1.42, "elapsed_time": "0:03:37", "remaining_time": "4:11:37", "throughput": 2540.27, "total_tokens": 553376} {"current_steps": 960, "total_steps": 67140, "loss": 0.8051, "lr": 7.14179326779863e-06, "epoch": 0.14298480786416443, "percentage": 1.43, "elapsed_time": "0:03:39", "remaining_time": "4:11:38", "throughput": 2540.91, "total_tokens": 556512} {"current_steps": 965, "total_steps": 67140, "loss": 0.9369, "lr": 7.17902889484659e-06, "epoch": 0.14372952040512363, "percentage": 1.44, "elapsed_time": "0:03:40", "remaining_time": "4:11:39", "throughput": 2541.16, "total_tokens": 559520} {"current_steps": 970, "total_steps": 67140, "loss": 0.8294, "lr": 7.216264521894549e-06, "epoch": 0.1444742329460828, "percentage": 1.44, "elapsed_time": "0:03:41", "remaining_time": "4:11:37", "throughput": 2541.39, "total_tokens": 562464} {"current_steps": 975, "total_steps": 67140, "loss": 0.8835, "lr": 7.253500148942509e-06, "epoch": 0.145218945487042, "percentage": 1.45, "elapsed_time": "0:03:42", "remaining_time": "4:11:33", "throughput": 2540.16, "total_tokens": 564960} {"current_steps": 980, "total_steps": 67140, "loss": 0.8255, "lr": 7.290735775990468e-06, "epoch": 0.14596365802800118, "percentage": 1.46, "elapsed_time": "0:03:43", "remaining_time": "4:11:33", "throughput": 2540.73, "total_tokens": 568032} {"current_steps": 985, "total_steps": 67140, "loss": 0.8602, "lr": 7.327971403038428e-06, "epoch": 0.14670837056896038, "percentage": 1.47, "elapsed_time": "0:03:44", "remaining_time": "4:11:32", "throughput": 2540.64, "total_tokens": 570912} {"current_steps": 990, "total_steps": 67140, "loss": 0.8323, "lr": 7.365207030086387e-06, "epoch": 0.14745308310991956, "percentage": 1.47, "elapsed_time": "0:03:45", "remaining_time": "4:11:29", "throughput": 2540.34, "total_tokens": 573696} {"current_steps": 995, "total_steps": 67140, "loss": 0.8355, "lr": 7.402442657134347e-06, "epoch": 0.14819779565087876, "percentage": 1.48, "elapsed_time": "0:03:46", "remaining_time": "4:11:27", "throughput": 2539.97, "total_tokens": 576480} {"current_steps": 1000, "total_steps": 67140, "loss": 0.8182, "lr": 7.439678284182306e-06, "epoch": 0.14894250819183796, "percentage": 1.49, "elapsed_time": "0:03:48", "remaining_time": "4:11:27", "throughput": 2540.14, "total_tokens": 579424} {"current_steps": 1005, "total_steps": 67140, "loss": 0.7963, "lr": 7.476913911230266e-06, "epoch": 0.14968722073279714, "percentage": 1.5, "elapsed_time": "0:03:49", "remaining_time": "4:11:25", "throughput": 2540.42, "total_tokens": 582368} {"current_steps": 1010, "total_steps": 67140, "loss": 0.8412, "lr": 7.5141495382782254e-06, "epoch": 0.15043193327375634, "percentage": 1.5, "elapsed_time": "0:03:50", "remaining_time": "4:11:25", "throughput": 2540.8, "total_tokens": 585408} {"current_steps": 1015, "total_steps": 67140, "loss": 0.8297, "lr": 7.5513851653261844e-06, "epoch": 0.15117664581471552, "percentage": 1.51, "elapsed_time": "0:03:51", "remaining_time": "4:11:24", "throughput": 2540.74, "total_tokens": 588288} {"current_steps": 1020, "total_steps": 67140, "loss": 0.8484, "lr": 7.588620792374144e-06, "epoch": 0.15192135835567472, "percentage": 1.52, "elapsed_time": "0:03:52", "remaining_time": "4:11:22", "throughput": 2540.94, "total_tokens": 591200} {"current_steps": 1025, "total_steps": 67140, "loss": 0.8566, "lr": 7.625856419422103e-06, "epoch": 0.1526660708966339, "percentage": 1.53, "elapsed_time": "0:03:53", "remaining_time": "4:11:21", "throughput": 2540.76, "total_tokens": 594048} {"current_steps": 1030, "total_steps": 67140, "loss": 0.8359, "lr": 7.663092046470063e-06, "epoch": 0.1534107834375931, "percentage": 1.53, "elapsed_time": "0:03:54", "remaining_time": "4:11:19", "throughput": 2541.09, "total_tokens": 597024} {"current_steps": 1035, "total_steps": 67140, "loss": 0.8339, "lr": 7.700327673518021e-06, "epoch": 0.15415549597855227, "percentage": 1.54, "elapsed_time": "0:03:56", "remaining_time": "4:11:18", "throughput": 2540.8, "total_tokens": 599840} {"current_steps": 1040, "total_steps": 67140, "loss": 0.8462, "lr": 7.737563300565983e-06, "epoch": 0.15490020851951147, "percentage": 1.55, "elapsed_time": "0:03:57", "remaining_time": "4:11:15", "throughput": 2540.73, "total_tokens": 602656} {"current_steps": 1045, "total_steps": 67140, "loss": 0.8547, "lr": 7.774798927613941e-06, "epoch": 0.15564492106047065, "percentage": 1.56, "elapsed_time": "0:03:58", "remaining_time": "4:11:15", "throughput": 2541.37, "total_tokens": 605760} {"current_steps": 1050, "total_steps": 67140, "loss": 0.7948, "lr": 7.812034554661901e-06, "epoch": 0.15638963360142985, "percentage": 1.56, "elapsed_time": "0:03:59", "remaining_time": "4:11:12", "throughput": 2540.84, "total_tokens": 608448} {"current_steps": 1055, "total_steps": 67140, "loss": 0.8331, "lr": 7.84927018170986e-06, "epoch": 0.15713434614238903, "percentage": 1.57, "elapsed_time": "0:04:00", "remaining_time": "4:11:10", "throughput": 2540.78, "total_tokens": 611296} {"current_steps": 1060, "total_steps": 67140, "loss": 0.8671, "lr": 7.88650580875782e-06, "epoch": 0.15787905868334823, "percentage": 1.58, "elapsed_time": "0:04:01", "remaining_time": "4:11:10", "throughput": 2540.94, "total_tokens": 614272} {"current_steps": 1065, "total_steps": 67140, "loss": 0.8171, "lr": 7.923741435805779e-06, "epoch": 0.15862377122430743, "percentage": 1.59, "elapsed_time": "0:04:02", "remaining_time": "4:11:12", "throughput": 2541.84, "total_tokens": 617504} {"current_steps": 1070, "total_steps": 67140, "loss": 0.8654, "lr": 7.960977062853739e-06, "epoch": 0.1593684837652666, "percentage": 1.59, "elapsed_time": "0:04:04", "remaining_time": "4:11:10", "throughput": 2541.9, "total_tokens": 620384} {"current_steps": 1075, "total_steps": 67140, "loss": 0.8811, "lr": 7.998212689901698e-06, "epoch": 0.1601131963062258, "percentage": 1.6, "elapsed_time": "0:04:05", "remaining_time": "4:11:09", "throughput": 2542.16, "total_tokens": 623360} {"current_steps": 1080, "total_steps": 67140, "loss": 0.7593, "lr": 8.035448316949658e-06, "epoch": 0.16085790884718498, "percentage": 1.61, "elapsed_time": "0:04:06", "remaining_time": "4:11:09", "throughput": 2542.33, "total_tokens": 626336} {"current_steps": 1085, "total_steps": 67140, "loss": 0.9517, "lr": 8.072683943997618e-06, "epoch": 0.16160262138814419, "percentage": 1.62, "elapsed_time": "0:04:07", "remaining_time": "4:11:10", "throughput": 2542.88, "total_tokens": 629472} {"current_steps": 1090, "total_steps": 67140, "loss": 0.8841, "lr": 8.109919571045576e-06, "epoch": 0.16234733392910336, "percentage": 1.62, "elapsed_time": "0:04:08", "remaining_time": "4:11:10", "throughput": 2543.54, "total_tokens": 632608} {"current_steps": 1095, "total_steps": 67140, "loss": 0.8225, "lr": 8.147155198093536e-06, "epoch": 0.16309204647006256, "percentage": 1.63, "elapsed_time": "0:04:09", "remaining_time": "4:11:10", "throughput": 2544.04, "total_tokens": 635680} {"current_steps": 1100, "total_steps": 67140, "loss": 0.8263, "lr": 8.184390825141496e-06, "epoch": 0.16383675901102174, "percentage": 1.64, "elapsed_time": "0:04:10", "remaining_time": "4:11:06", "throughput": 2543.43, "total_tokens": 638304} {"current_steps": 1105, "total_steps": 67140, "loss": 0.809, "lr": 8.221626452189456e-06, "epoch": 0.16458147155198094, "percentage": 1.65, "elapsed_time": "0:04:12", "remaining_time": "4:11:06", "throughput": 2543.79, "total_tokens": 641312} {"current_steps": 1110, "total_steps": 67140, "loss": 0.8291, "lr": 8.258862079237414e-06, "epoch": 0.16532618409294011, "percentage": 1.65, "elapsed_time": "0:04:13", "remaining_time": "4:11:04", "throughput": 2543.64, "total_tokens": 644160} {"current_steps": 1115, "total_steps": 67140, "loss": 0.7995, "lr": 8.296097706285374e-06, "epoch": 0.16607089663389932, "percentage": 1.66, "elapsed_time": "0:04:14", "remaining_time": "4:11:02", "throughput": 2543.28, "total_tokens": 646912} {"current_steps": 1120, "total_steps": 67140, "loss": 0.8182, "lr": 8.333333333333334e-06, "epoch": 0.1668156091748585, "percentage": 1.67, "elapsed_time": "0:04:15", "remaining_time": "4:11:01", "throughput": 2543.43, "total_tokens": 649888} {"current_steps": 1125, "total_steps": 67140, "loss": 0.8387, "lr": 8.370568960381294e-06, "epoch": 0.1675603217158177, "percentage": 1.68, "elapsed_time": "0:04:16", "remaining_time": "4:10:58", "throughput": 2543.26, "total_tokens": 652672} {"current_steps": 1130, "total_steps": 67140, "loss": 0.8526, "lr": 8.407804587429252e-06, "epoch": 0.1683050342567769, "percentage": 1.68, "elapsed_time": "0:04:17", "remaining_time": "4:10:52", "throughput": 2542.18, "total_tokens": 655072} {"current_steps": 1135, "total_steps": 67140, "loss": 0.8242, "lr": 8.445040214477212e-06, "epoch": 0.16904974679773607, "percentage": 1.69, "elapsed_time": "0:04:18", "remaining_time": "4:10:52", "throughput": 2542.53, "total_tokens": 658112} {"current_steps": 1140, "total_steps": 67140, "loss": 0.8324, "lr": 8.482275841525171e-06, "epoch": 0.16979445933869527, "percentage": 1.7, "elapsed_time": "0:04:19", "remaining_time": "4:10:51", "throughput": 2542.6, "total_tokens": 661024} {"current_steps": 1145, "total_steps": 67140, "loss": 0.8499, "lr": 8.519511468573131e-06, "epoch": 0.17053917187965445, "percentage": 1.71, "elapsed_time": "0:04:21", "remaining_time": "4:10:49", "throughput": 2542.78, "total_tokens": 663936} {"current_steps": 1150, "total_steps": 67140, "loss": 0.7932, "lr": 8.556747095621091e-06, "epoch": 0.17128388442061365, "percentage": 1.71, "elapsed_time": "0:04:22", "remaining_time": "4:10:47", "throughput": 2542.73, "total_tokens": 666784} {"current_steps": 1155, "total_steps": 67140, "loss": 0.8933, "lr": 8.59398272266905e-06, "epoch": 0.17202859696157283, "percentage": 1.72, "elapsed_time": "0:04:23", "remaining_time": "4:10:48", "throughput": 2543.49, "total_tokens": 669984} {"current_steps": 1160, "total_steps": 67140, "loss": 0.8481, "lr": 8.631218349717011e-06, "epoch": 0.17277330950253203, "percentage": 1.73, "elapsed_time": "0:04:24", "remaining_time": "4:10:46", "throughput": 2542.92, "total_tokens": 672672} {"current_steps": 1165, "total_steps": 67140, "loss": 0.8239, "lr": 8.668453976764969e-06, "epoch": 0.1735180220434912, "percentage": 1.74, "elapsed_time": "0:04:25", "remaining_time": "4:10:44", "throughput": 2543.05, "total_tokens": 675584} {"current_steps": 1170, "total_steps": 67140, "loss": 0.8391, "lr": 8.705689603812929e-06, "epoch": 0.1742627345844504, "percentage": 1.74, "elapsed_time": "0:04:26", "remaining_time": "4:10:42", "throughput": 2542.69, "total_tokens": 678336} {"current_steps": 1175, "total_steps": 67140, "loss": 0.8445, "lr": 8.742925230860887e-06, "epoch": 0.17500744712540958, "percentage": 1.75, "elapsed_time": "0:04:27", "remaining_time": "4:10:40", "throughput": 2542.39, "total_tokens": 681120} {"current_steps": 1180, "total_steps": 67140, "loss": 0.8338, "lr": 8.780160857908849e-06, "epoch": 0.17575215966636878, "percentage": 1.76, "elapsed_time": "0:04:29", "remaining_time": "4:10:38", "throughput": 2542.12, "total_tokens": 683936} {"current_steps": 1185, "total_steps": 67140, "loss": 0.8039, "lr": 8.817396484956807e-06, "epoch": 0.17649687220732796, "percentage": 1.76, "elapsed_time": "0:04:30", "remaining_time": "4:10:37", "throughput": 2542.1, "total_tokens": 686816} {"current_steps": 1190, "total_steps": 67140, "loss": 0.8206, "lr": 8.854632112004767e-06, "epoch": 0.17724158474828716, "percentage": 1.77, "elapsed_time": "0:04:31", "remaining_time": "4:10:35", "throughput": 2542.02, "total_tokens": 689664} {"current_steps": 1195, "total_steps": 67140, "loss": 0.8445, "lr": 8.891867739052725e-06, "epoch": 0.17798629728924636, "percentage": 1.78, "elapsed_time": "0:04:32", "remaining_time": "4:10:32", "throughput": 2541.49, "total_tokens": 692320} {"current_steps": 1200, "total_steps": 67140, "loss": 0.7734, "lr": 8.929103366100686e-06, "epoch": 0.17873100983020554, "percentage": 1.79, "elapsed_time": "0:04:33", "remaining_time": "4:10:30", "throughput": 2541.34, "total_tokens": 695136} {"current_steps": 1205, "total_steps": 67140, "loss": 0.8254, "lr": 8.966338993148644e-06, "epoch": 0.17947572237116474, "percentage": 1.79, "elapsed_time": "0:04:34", "remaining_time": "4:10:29", "throughput": 2541.38, "total_tokens": 698048} {"current_steps": 1210, "total_steps": 67140, "loss": 0.7267, "lr": 9.003574620196604e-06, "epoch": 0.18022043491212392, "percentage": 1.8, "elapsed_time": "0:04:35", "remaining_time": "4:10:27", "throughput": 2541.22, "total_tokens": 700864} {"current_steps": 1215, "total_steps": 67140, "loss": 0.8714, "lr": 9.040810247244564e-06, "epoch": 0.18096514745308312, "percentage": 1.81, "elapsed_time": "0:04:36", "remaining_time": "4:10:27", "throughput": 2541.43, "total_tokens": 703872} {"current_steps": 1220, "total_steps": 67140, "loss": 0.8595, "lr": 9.078045874292524e-06, "epoch": 0.1817098599940423, "percentage": 1.82, "elapsed_time": "0:04:38", "remaining_time": "4:10:24", "throughput": 2540.83, "total_tokens": 706496} {"current_steps": 1225, "total_steps": 67140, "loss": 0.8288, "lr": 9.115281501340484e-06, "epoch": 0.1824545725350015, "percentage": 1.82, "elapsed_time": "0:04:39", "remaining_time": "4:10:23", "throughput": 2540.86, "total_tokens": 709440} {"current_steps": 1230, "total_steps": 67140, "loss": 0.7957, "lr": 9.152517128388442e-06, "epoch": 0.18319928507596067, "percentage": 1.83, "elapsed_time": "0:04:40", "remaining_time": "4:10:21", "throughput": 2540.38, "total_tokens": 712128} {"current_steps": 1235, "total_steps": 67140, "loss": 0.8156, "lr": 9.189752755436402e-06, "epoch": 0.18394399761691987, "percentage": 1.84, "elapsed_time": "0:04:41", "remaining_time": "4:10:19", "throughput": 2540.05, "total_tokens": 714912} {"current_steps": 1240, "total_steps": 67140, "loss": 0.8507, "lr": 9.226988382484362e-06, "epoch": 0.18468871015787905, "percentage": 1.85, "elapsed_time": "0:04:42", "remaining_time": "4:10:16", "throughput": 2539.49, "total_tokens": 717568} {"current_steps": 1245, "total_steps": 67140, "loss": 0.8844, "lr": 9.264224009532322e-06, "epoch": 0.18543342269883825, "percentage": 1.85, "elapsed_time": "0:04:43", "remaining_time": "4:10:17", "throughput": 2540.05, "total_tokens": 720704} {"current_steps": 1250, "total_steps": 67140, "loss": 0.837, "lr": 9.30145963658028e-06, "epoch": 0.18617813523979743, "percentage": 1.86, "elapsed_time": "0:04:44", "remaining_time": "4:10:17", "throughput": 2540.22, "total_tokens": 723680} {"current_steps": 1255, "total_steps": 67140, "loss": 0.8201, "lr": 9.33869526362824e-06, "epoch": 0.18692284778075663, "percentage": 1.87, "elapsed_time": "0:04:46", "remaining_time": "4:10:15", "throughput": 2540.36, "total_tokens": 726592} {"current_steps": 1260, "total_steps": 67140, "loss": 0.8252, "lr": 9.3759308906762e-06, "epoch": 0.1876675603217158, "percentage": 1.88, "elapsed_time": "0:04:47", "remaining_time": "4:10:14", "throughput": 2540.51, "total_tokens": 729536} {"current_steps": 1265, "total_steps": 67140, "loss": 0.8171, "lr": 9.41316651772416e-06, "epoch": 0.188412272862675, "percentage": 1.88, "elapsed_time": "0:04:48", "remaining_time": "4:10:14", "throughput": 2540.67, "total_tokens": 732544} {"current_steps": 1270, "total_steps": 67140, "loss": 0.7818, "lr": 9.450402144772117e-06, "epoch": 0.1891569854036342, "percentage": 1.89, "elapsed_time": "0:04:49", "remaining_time": "4:10:16", "throughput": 2541.16, "total_tokens": 735712} {"current_steps": 1275, "total_steps": 67140, "loss": 0.8475, "lr": 9.487637771820077e-06, "epoch": 0.18990169794459338, "percentage": 1.9, "elapsed_time": "0:04:50", "remaining_time": "4:10:12", "throughput": 2540.56, "total_tokens": 738304} {"current_steps": 1280, "total_steps": 67140, "loss": 0.8415, "lr": 9.524873398868039e-06, "epoch": 0.1906464104855526, "percentage": 1.91, "elapsed_time": "0:04:51", "remaining_time": "4:10:11", "throughput": 2540.63, "total_tokens": 741248} {"current_steps": 1285, "total_steps": 67140, "loss": 0.847, "lr": 9.562109025915997e-06, "epoch": 0.19139112302651176, "percentage": 1.91, "elapsed_time": "0:04:52", "remaining_time": "4:10:10", "throughput": 2540.89, "total_tokens": 744192} {"current_steps": 1290, "total_steps": 67140, "loss": 0.804, "lr": 9.599344652963957e-06, "epoch": 0.19213583556747096, "percentage": 1.92, "elapsed_time": "0:04:54", "remaining_time": "4:10:09", "throughput": 2540.9, "total_tokens": 747104} {"current_steps": 1295, "total_steps": 67140, "loss": 0.819, "lr": 9.636580280011915e-06, "epoch": 0.19288054810843014, "percentage": 1.93, "elapsed_time": "0:04:55", "remaining_time": "4:10:09", "throughput": 2540.87, "total_tokens": 750048} {"current_steps": 1300, "total_steps": 67140, "loss": 0.7809, "lr": 9.673815907059877e-06, "epoch": 0.19362526064938934, "percentage": 1.94, "elapsed_time": "0:04:56", "remaining_time": "4:10:08", "throughput": 2540.93, "total_tokens": 752992} {"current_steps": 1305, "total_steps": 67140, "loss": 0.7859, "lr": 9.711051534107835e-06, "epoch": 0.19436997319034852, "percentage": 1.94, "elapsed_time": "0:04:57", "remaining_time": "4:10:06", "throughput": 2541.09, "total_tokens": 755904} {"current_steps": 1310, "total_steps": 67140, "loss": 0.8247, "lr": 9.748287161155795e-06, "epoch": 0.19511468573130772, "percentage": 1.95, "elapsed_time": "0:04:58", "remaining_time": "4:10:05", "throughput": 2540.96, "total_tokens": 758752} {"current_steps": 1315, "total_steps": 67140, "loss": 0.8407, "lr": 9.785522788203753e-06, "epoch": 0.1958593982722669, "percentage": 1.96, "elapsed_time": "0:04:59", "remaining_time": "4:10:01", "throughput": 2540.46, "total_tokens": 761344} {"current_steps": 1320, "total_steps": 67140, "loss": 0.8161, "lr": 9.822758415251714e-06, "epoch": 0.1966041108132261, "percentage": 1.97, "elapsed_time": "0:05:00", "remaining_time": "4:09:59", "throughput": 2540.33, "total_tokens": 764160} {"current_steps": 1325, "total_steps": 67140, "loss": 0.7901, "lr": 9.859994042299672e-06, "epoch": 0.19734882335418527, "percentage": 1.97, "elapsed_time": "0:05:01", "remaining_time": "4:09:58", "throughput": 2540.48, "total_tokens": 767104} {"current_steps": 1330, "total_steps": 67140, "loss": 0.8739, "lr": 9.897229669347632e-06, "epoch": 0.19809353589514447, "percentage": 1.98, "elapsed_time": "0:05:03", "remaining_time": "4:09:55", "throughput": 2540.14, "total_tokens": 769824} {"current_steps": 1335, "total_steps": 67140, "loss": 0.8477, "lr": 9.93446529639559e-06, "epoch": 0.19883824843610368, "percentage": 1.99, "elapsed_time": "0:05:04", "remaining_time": "4:09:53", "throughput": 2539.82, "total_tokens": 772544} {"current_steps": 1340, "total_steps": 67140, "loss": 0.8241, "lr": 9.971700923443552e-06, "epoch": 0.19958296097706285, "percentage": 2.0, "elapsed_time": "0:05:05", "remaining_time": "4:09:51", "throughput": 2539.69, "total_tokens": 775360} {"current_steps": 1345, "total_steps": 67140, "loss": 0.8642, "lr": 1.0008936550491512e-05, "epoch": 0.20032767351802205, "percentage": 2.0, "elapsed_time": "0:05:06", "remaining_time": "4:09:48", "throughput": 2539.58, "total_tokens": 778144} {"current_steps": 1350, "total_steps": 67140, "loss": 0.8101, "lr": 1.004617217753947e-05, "epoch": 0.20107238605898123, "percentage": 2.01, "elapsed_time": "0:05:07", "remaining_time": "4:09:46", "throughput": 2539.21, "total_tokens": 780864} {"current_steps": 1355, "total_steps": 67140, "loss": 0.7915, "lr": 1.008340780458743e-05, "epoch": 0.20181709859994043, "percentage": 2.02, "elapsed_time": "0:05:08", "remaining_time": "4:09:45", "throughput": 2539.34, "total_tokens": 783776} {"current_steps": 1360, "total_steps": 67140, "loss": 0.8395, "lr": 1.012064343163539e-05, "epoch": 0.2025618111408996, "percentage": 2.03, "elapsed_time": "0:05:09", "remaining_time": "4:09:44", "throughput": 2539.49, "total_tokens": 786752} {"current_steps": 1365, "total_steps": 67140, "loss": 0.7894, "lr": 1.015787905868335e-05, "epoch": 0.2033065236818588, "percentage": 2.03, "elapsed_time": "0:05:10", "remaining_time": "4:09:42", "throughput": 2539.3, "total_tokens": 789536} {"current_steps": 1370, "total_steps": 67140, "loss": 0.9203, "lr": 1.0195114685731308e-05, "epoch": 0.20405123622281798, "percentage": 2.04, "elapsed_time": "0:05:12", "remaining_time": "4:09:39", "throughput": 2538.74, "total_tokens": 792160} {"current_steps": 1375, "total_steps": 67140, "loss": 0.8656, "lr": 1.0232350312779268e-05, "epoch": 0.20479594876377719, "percentage": 2.05, "elapsed_time": "0:05:13", "remaining_time": "4:09:36", "throughput": 2538.56, "total_tokens": 794912} {"current_steps": 1380, "total_steps": 67140, "loss": 0.8095, "lr": 1.0269585939827227e-05, "epoch": 0.20554066130473636, "percentage": 2.06, "elapsed_time": "0:05:14", "remaining_time": "4:09:36", "throughput": 2538.59, "total_tokens": 797824} {"current_steps": 1385, "total_steps": 67140, "loss": 0.8024, "lr": 1.0306821566875187e-05, "epoch": 0.20628537384569556, "percentage": 2.06, "elapsed_time": "0:05:15", "remaining_time": "4:09:38", "throughput": 2539.44, "total_tokens": 801184} {"current_steps": 1390, "total_steps": 67140, "loss": 0.8168, "lr": 1.0344057193923145e-05, "epoch": 0.20703008638665474, "percentage": 2.07, "elapsed_time": "0:05:16", "remaining_time": "4:09:37", "throughput": 2539.33, "total_tokens": 804032} {"current_steps": 1395, "total_steps": 67140, "loss": 0.8979, "lr": 1.0381292820971105e-05, "epoch": 0.20777479892761394, "percentage": 2.08, "elapsed_time": "0:05:17", "remaining_time": "4:09:36", "throughput": 2539.27, "total_tokens": 806912} {"current_steps": 1400, "total_steps": 67140, "loss": 0.9699, "lr": 1.0418528448019065e-05, "epoch": 0.20851951146857314, "percentage": 2.09, "elapsed_time": "0:05:18", "remaining_time": "4:09:32", "throughput": 2538.68, "total_tokens": 809472} {"current_steps": 1405, "total_steps": 67140, "loss": 0.7895, "lr": 1.0455764075067025e-05, "epoch": 0.20926422400953232, "percentage": 2.09, "elapsed_time": "0:05:19", "remaining_time": "4:09:29", "throughput": 2538.07, "total_tokens": 812064} {"current_steps": 1410, "total_steps": 67140, "loss": 0.7895, "lr": 1.0492999702114985e-05, "epoch": 0.21000893655049152, "percentage": 2.1, "elapsed_time": "0:05:21", "remaining_time": "4:09:30", "throughput": 2538.6, "total_tokens": 815232} {"current_steps": 1415, "total_steps": 67140, "loss": 0.7866, "lr": 1.0530235329162943e-05, "epoch": 0.2107536490914507, "percentage": 2.11, "elapsed_time": "0:05:22", "remaining_time": "4:09:28", "throughput": 2538.57, "total_tokens": 818080} {"current_steps": 1420, "total_steps": 67140, "loss": 0.8694, "lr": 1.0567470956210903e-05, "epoch": 0.2114983616324099, "percentage": 2.11, "elapsed_time": "0:05:23", "remaining_time": "4:09:26", "throughput": 2538.35, "total_tokens": 820832} {"current_steps": 1425, "total_steps": 67140, "loss": 0.7811, "lr": 1.0604706583258863e-05, "epoch": 0.21224307417336907, "percentage": 2.12, "elapsed_time": "0:05:24", "remaining_time": "4:09:23", "throughput": 2538.25, "total_tokens": 823584} {"current_steps": 1430, "total_steps": 67140, "loss": 0.828, "lr": 1.0641942210306823e-05, "epoch": 0.21298778671432828, "percentage": 2.13, "elapsed_time": "0:05:25", "remaining_time": "4:09:20", "throughput": 2537.77, "total_tokens": 826240} {"current_steps": 1435, "total_steps": 67140, "loss": 0.7984, "lr": 1.067917783735478e-05, "epoch": 0.21373249925528745, "percentage": 2.14, "elapsed_time": "0:05:26", "remaining_time": "4:09:17", "throughput": 2537.43, "total_tokens": 828928} {"current_steps": 1440, "total_steps": 67140, "loss": 0.8251, "lr": 1.071641346440274e-05, "epoch": 0.21447721179624665, "percentage": 2.14, "elapsed_time": "0:05:27", "remaining_time": "4:09:18", "throughput": 2538.07, "total_tokens": 832128} {"current_steps": 1445, "total_steps": 67140, "loss": 0.8323, "lr": 1.07536490914507e-05, "epoch": 0.21522192433720583, "percentage": 2.15, "elapsed_time": "0:05:29", "remaining_time": "4:09:22", "throughput": 2539.1, "total_tokens": 835616} {"current_steps": 1450, "total_steps": 67140, "loss": 0.8334, "lr": 1.079088471849866e-05, "epoch": 0.21596663687816503, "percentage": 2.16, "elapsed_time": "0:05:30", "remaining_time": "4:09:21", "throughput": 2539.14, "total_tokens": 838528} {"current_steps": 1455, "total_steps": 67140, "loss": 0.7766, "lr": 1.0828120345546618e-05, "epoch": 0.2167113494191242, "percentage": 2.17, "elapsed_time": "0:05:31", "remaining_time": "4:09:19", "throughput": 2539.2, "total_tokens": 841440} {"current_steps": 1460, "total_steps": 67140, "loss": 0.9724, "lr": 1.086535597259458e-05, "epoch": 0.2174560619600834, "percentage": 2.17, "elapsed_time": "0:05:32", "remaining_time": "4:09:19", "throughput": 2539.3, "total_tokens": 844416} {"current_steps": 1465, "total_steps": 67140, "loss": 0.8614, "lr": 1.0902591599642538e-05, "epoch": 0.2182007745010426, "percentage": 2.18, "elapsed_time": "0:05:33", "remaining_time": "4:09:17", "throughput": 2539.13, "total_tokens": 847168} {"current_steps": 1470, "total_steps": 67140, "loss": 0.8406, "lr": 1.0939827226690498e-05, "epoch": 0.21894548704200179, "percentage": 2.19, "elapsed_time": "0:05:34", "remaining_time": "4:09:16", "throughput": 2539.32, "total_tokens": 850176} {"current_steps": 1475, "total_steps": 67140, "loss": 0.8328, "lr": 1.0977062853738458e-05, "epoch": 0.219690199582961, "percentage": 2.2, "elapsed_time": "0:05:35", "remaining_time": "4:09:14", "throughput": 2539.24, "total_tokens": 852992} {"current_steps": 1480, "total_steps": 67140, "loss": 0.8023, "lr": 1.1014298480786418e-05, "epoch": 0.22043491212392016, "percentage": 2.2, "elapsed_time": "0:05:37", "remaining_time": "4:09:13", "throughput": 2539.55, "total_tokens": 855968} {"current_steps": 1485, "total_steps": 67140, "loss": 1.3279, "lr": 1.1051534107834378e-05, "epoch": 0.22117962466487937, "percentage": 2.21, "elapsed_time": "0:05:38", "remaining_time": "4:09:14", "throughput": 2540.02, "total_tokens": 859136} {"current_steps": 1490, "total_steps": 67140, "loss": 0.8657, "lr": 1.1088769734882336e-05, "epoch": 0.22192433720583854, "percentage": 2.22, "elapsed_time": "0:05:39", "remaining_time": "4:09:13", "throughput": 2540.24, "total_tokens": 862144} {"current_steps": 1495, "total_steps": 67140, "loss": 0.8138, "lr": 1.1126005361930296e-05, "epoch": 0.22266904974679774, "percentage": 2.23, "elapsed_time": "0:05:40", "remaining_time": "4:09:14", "throughput": 2541.07, "total_tokens": 865440} {"current_steps": 1500, "total_steps": 67140, "loss": 0.8344, "lr": 1.1163240988978255e-05, "epoch": 0.22341376228775692, "percentage": 2.23, "elapsed_time": "0:05:41", "remaining_time": "4:09:15", "throughput": 2541.61, "total_tokens": 868640} {"current_steps": 1505, "total_steps": 67140, "loss": 0.8112, "lr": 1.1200476616026215e-05, "epoch": 0.22415847482871612, "percentage": 2.24, "elapsed_time": "0:05:42", "remaining_time": "4:09:14", "throughput": 2541.64, "total_tokens": 871520} {"current_steps": 1510, "total_steps": 67140, "loss": 0.8025, "lr": 1.1237712243074173e-05, "epoch": 0.2249031873696753, "percentage": 2.25, "elapsed_time": "0:05:44", "remaining_time": "4:09:12", "throughput": 2541.7, "total_tokens": 874400} {"current_steps": 1515, "total_steps": 67140, "loss": 0.8041, "lr": 1.1274947870122133e-05, "epoch": 0.2256478999106345, "percentage": 2.26, "elapsed_time": "0:05:45", "remaining_time": "4:09:13", "throughput": 2542.24, "total_tokens": 877600} {"current_steps": 1520, "total_steps": 67140, "loss": 0.8462, "lr": 1.1312183497170093e-05, "epoch": 0.22639261245159367, "percentage": 2.26, "elapsed_time": "0:05:46", "remaining_time": "4:09:12", "throughput": 2542.35, "total_tokens": 880544} {"current_steps": 1525, "total_steps": 67140, "loss": 0.8201, "lr": 1.1349419124218053e-05, "epoch": 0.22713732499255287, "percentage": 2.27, "elapsed_time": "0:05:47", "remaining_time": "4:09:11", "throughput": 2542.44, "total_tokens": 883488} {"current_steps": 1530, "total_steps": 67140, "loss": 0.8389, "lr": 1.1386654751266011e-05, "epoch": 0.22788203753351208, "percentage": 2.28, "elapsed_time": "0:05:48", "remaining_time": "4:09:09", "throughput": 2542.08, "total_tokens": 886208} {"current_steps": 1535, "total_steps": 67140, "loss": 0.9066, "lr": 1.1423890378313971e-05, "epoch": 0.22862675007447125, "percentage": 2.29, "elapsed_time": "0:05:49", "remaining_time": "4:09:08", "throughput": 2542.05, "total_tokens": 889088} {"current_steps": 1540, "total_steps": 67140, "loss": 0.7988, "lr": 1.1461126005361931e-05, "epoch": 0.22937146261543045, "percentage": 2.29, "elapsed_time": "0:05:50", "remaining_time": "4:09:05", "throughput": 2541.67, "total_tokens": 891776} {"current_steps": 1545, "total_steps": 67140, "loss": 0.8126, "lr": 1.149836163240989e-05, "epoch": 0.23011617515638963, "percentage": 2.3, "elapsed_time": "0:05:52", "remaining_time": "4:09:06", "throughput": 2542.16, "total_tokens": 894944} {"current_steps": 1550, "total_steps": 67140, "loss": 0.8083, "lr": 1.153559725945785e-05, "epoch": 0.23086088769734883, "percentage": 2.31, "elapsed_time": "0:05:53", "remaining_time": "4:09:05", "throughput": 2542.11, "total_tokens": 897824} {"current_steps": 1555, "total_steps": 67140, "loss": 0.8044, "lr": 1.1572832886505809e-05, "epoch": 0.231605600238308, "percentage": 2.32, "elapsed_time": "0:05:54", "remaining_time": "4:09:03", "throughput": 2542.02, "total_tokens": 900640} {"current_steps": 1560, "total_steps": 67140, "loss": 0.8402, "lr": 1.1610068513553769e-05, "epoch": 0.2323503127792672, "percentage": 2.32, "elapsed_time": "0:05:55", "remaining_time": "4:09:01", "throughput": 2541.83, "total_tokens": 903424} {"current_steps": 1565, "total_steps": 67140, "loss": 0.8316, "lr": 1.1647304140601728e-05, "epoch": 0.23309502532022638, "percentage": 2.33, "elapsed_time": "0:05:56", "remaining_time": "4:08:58", "throughput": 2541.38, "total_tokens": 906048} {"current_steps": 1570, "total_steps": 67140, "loss": 0.8511, "lr": 1.1684539767649688e-05, "epoch": 0.2338397378611856, "percentage": 2.34, "elapsed_time": "0:05:57", "remaining_time": "4:08:57", "throughput": 2541.24, "total_tokens": 908896} {"current_steps": 1575, "total_steps": 67140, "loss": 0.7754, "lr": 1.1721775394697646e-05, "epoch": 0.23458445040214476, "percentage": 2.35, "elapsed_time": "0:05:58", "remaining_time": "4:08:56", "throughput": 2541.22, "total_tokens": 911776} {"current_steps": 1580, "total_steps": 67140, "loss": 0.8293, "lr": 1.1759011021745606e-05, "epoch": 0.23532916294310396, "percentage": 2.35, "elapsed_time": "0:05:59", "remaining_time": "4:08:57", "throughput": 2541.81, "total_tokens": 915040} {"current_steps": 1585, "total_steps": 67140, "loss": 0.8851, "lr": 1.1796246648793566e-05, "epoch": 0.23607387548406314, "percentage": 2.36, "elapsed_time": "0:06:01", "remaining_time": "4:08:56", "throughput": 2541.84, "total_tokens": 917952} {"current_steps": 1590, "total_steps": 67140, "loss": 0.8785, "lr": 1.1833482275841526e-05, "epoch": 0.23681858802502234, "percentage": 2.37, "elapsed_time": "0:06:02", "remaining_time": "4:08:53", "throughput": 2541.55, "total_tokens": 920640} {"current_steps": 1595, "total_steps": 67140, "loss": 0.7781, "lr": 1.1870717902889484e-05, "epoch": 0.23756330056598154, "percentage": 2.38, "elapsed_time": "0:06:03", "remaining_time": "4:08:53", "throughput": 2541.77, "total_tokens": 923680} {"current_steps": 1600, "total_steps": 67140, "loss": 0.8563, "lr": 1.1907953529937444e-05, "epoch": 0.23830801310694072, "percentage": 2.38, "elapsed_time": "0:06:04", "remaining_time": "4:08:51", "throughput": 2541.82, "total_tokens": 926560} {"current_steps": 1605, "total_steps": 67140, "loss": 0.8235, "lr": 1.1945189156985404e-05, "epoch": 0.23905272564789992, "percentage": 2.39, "elapsed_time": "0:06:05", "remaining_time": "4:08:50", "throughput": 2541.7, "total_tokens": 929376} {"current_steps": 1610, "total_steps": 67140, "loss": 0.8091, "lr": 1.1982424784033364e-05, "epoch": 0.2397974381888591, "percentage": 2.4, "elapsed_time": "0:06:06", "remaining_time": "4:08:48", "throughput": 2541.52, "total_tokens": 932160} {"current_steps": 1615, "total_steps": 67140, "loss": 0.774, "lr": 1.2019660411081324e-05, "epoch": 0.2405421507298183, "percentage": 2.41, "elapsed_time": "0:06:07", "remaining_time": "4:08:47", "throughput": 2541.46, "total_tokens": 935040} {"current_steps": 1620, "total_steps": 67140, "loss": 0.7916, "lr": 1.2056896038129282e-05, "epoch": 0.24128686327077747, "percentage": 2.41, "elapsed_time": "0:06:09", "remaining_time": "4:08:45", "throughput": 2541.32, "total_tokens": 937824} {"current_steps": 1625, "total_steps": 67140, "loss": 0.8146, "lr": 1.2094131665177243e-05, "epoch": 0.24203157581173668, "percentage": 2.42, "elapsed_time": "0:06:10", "remaining_time": "4:08:44", "throughput": 2541.57, "total_tokens": 940832} {"current_steps": 1630, "total_steps": 67140, "loss": 0.8462, "lr": 1.2131367292225201e-05, "epoch": 0.24277628835269585, "percentage": 2.43, "elapsed_time": "0:06:11", "remaining_time": "4:08:42", "throughput": 2541.2, "total_tokens": 943520} {"current_steps": 1635, "total_steps": 67140, "loss": 0.8411, "lr": 1.2168602919273161e-05, "epoch": 0.24352100089365505, "percentage": 2.44, "elapsed_time": "0:06:12", "remaining_time": "4:08:40", "throughput": 2541.17, "total_tokens": 946400} {"current_steps": 1640, "total_steps": 67140, "loss": 0.8387, "lr": 1.220583854632112e-05, "epoch": 0.24426571343461423, "percentage": 2.44, "elapsed_time": "0:06:13", "remaining_time": "4:08:40", "throughput": 2541.56, "total_tokens": 949504} {"current_steps": 1645, "total_steps": 67140, "loss": 0.8387, "lr": 1.2243074173369081e-05, "epoch": 0.24501042597557343, "percentage": 2.45, "elapsed_time": "0:06:14", "remaining_time": "4:08:45", "throughput": 2542.69, "total_tokens": 953184} {"current_steps": 1650, "total_steps": 67140, "loss": 0.8252, "lr": 1.228030980041704e-05, "epoch": 0.2457551385165326, "percentage": 2.46, "elapsed_time": "0:06:16", "remaining_time": "4:08:45", "throughput": 2542.93, "total_tokens": 956256} {"current_steps": 1655, "total_steps": 67140, "loss": 0.8003, "lr": 1.2317545427464999e-05, "epoch": 0.2464998510574918, "percentage": 2.46, "elapsed_time": "0:06:17", "remaining_time": "4:08:44", "throughput": 2542.94, "total_tokens": 959168} {"current_steps": 1660, "total_steps": 67140, "loss": 0.8891, "lr": 1.2354781054512959e-05, "epoch": 0.247244563598451, "percentage": 2.47, "elapsed_time": "0:06:18", "remaining_time": "4:08:43", "throughput": 2542.77, "total_tokens": 962016} {"current_steps": 1665, "total_steps": 67140, "loss": 0.873, "lr": 1.2392016681560919e-05, "epoch": 0.2479892761394102, "percentage": 2.48, "elapsed_time": "0:06:19", "remaining_time": "4:08:42", "throughput": 2542.68, "total_tokens": 964896} {"current_steps": 1670, "total_steps": 67140, "loss": 0.8549, "lr": 1.2429252308608877e-05, "epoch": 0.2487339886803694, "percentage": 2.49, "elapsed_time": "0:06:20", "remaining_time": "4:08:41", "throughput": 2542.52, "total_tokens": 967712} {"current_steps": 1675, "total_steps": 67140, "loss": 0.8274, "lr": 1.2466487935656837e-05, "epoch": 0.24947870122132856, "percentage": 2.49, "elapsed_time": "0:06:21", "remaining_time": "4:08:40", "throughput": 2542.77, "total_tokens": 970752} {"current_steps": 1680, "total_steps": 67140, "loss": 0.8368, "lr": 1.2503723562704797e-05, "epoch": 0.25022341376228774, "percentage": 2.5, "elapsed_time": "0:06:22", "remaining_time": "4:08:42", "throughput": 2543.44, "total_tokens": 974080} {"current_steps": 1685, "total_steps": 67140, "loss": 0.832, "lr": 1.2540959189752758e-05, "epoch": 0.25096812630324694, "percentage": 2.51, "elapsed_time": "0:06:24", "remaining_time": "4:08:41", "throughput": 2543.38, "total_tokens": 976960} {"current_steps": 1690, "total_steps": 67140, "loss": 0.8012, "lr": 1.2578194816800715e-05, "epoch": 0.25171283884420614, "percentage": 2.52, "elapsed_time": "0:06:25", "remaining_time": "4:08:42", "throughput": 2543.94, "total_tokens": 980192} {"current_steps": 1695, "total_steps": 67140, "loss": 0.7924, "lr": 1.2615430443848674e-05, "epoch": 0.25245755138516535, "percentage": 2.52, "elapsed_time": "0:06:26", "remaining_time": "4:08:40", "throughput": 2543.69, "total_tokens": 982944} {"current_steps": 1700, "total_steps": 67140, "loss": 0.8289, "lr": 1.2652666070896634e-05, "epoch": 0.2532022639261245, "percentage": 2.53, "elapsed_time": "0:06:27", "remaining_time": "4:08:38", "throughput": 2543.43, "total_tokens": 985696} {"current_steps": 1705, "total_steps": 67140, "loss": 0.8432, "lr": 1.2689901697944596e-05, "epoch": 0.2539469764670837, "percentage": 2.54, "elapsed_time": "0:06:28", "remaining_time": "4:08:36", "throughput": 2543.2, "total_tokens": 988480} {"current_steps": 1710, "total_steps": 67140, "loss": 0.8255, "lr": 1.2727137324992552e-05, "epoch": 0.2546916890080429, "percentage": 2.55, "elapsed_time": "0:06:29", "remaining_time": "4:08:35", "throughput": 2543.29, "total_tokens": 991392} {"current_steps": 1715, "total_steps": 67140, "loss": 0.8194, "lr": 1.2764372952040512e-05, "epoch": 0.2554364015490021, "percentage": 2.55, "elapsed_time": "0:06:30", "remaining_time": "4:08:32", "throughput": 2542.99, "total_tokens": 994048} {"current_steps": 1720, "total_steps": 67140, "loss": 0.7976, "lr": 1.2801608579088472e-05, "epoch": 0.25618111408996125, "percentage": 2.56, "elapsed_time": "0:06:31", "remaining_time": "4:08:28", "throughput": 2542.41, "total_tokens": 996576} {"current_steps": 1725, "total_steps": 67140, "loss": 0.8129, "lr": 1.2838844206136434e-05, "epoch": 0.25692582663092045, "percentage": 2.57, "elapsed_time": "0:06:33", "remaining_time": "4:08:28", "throughput": 2542.7, "total_tokens": 999616} {"current_steps": 1730, "total_steps": 67140, "loss": 0.7758, "lr": 1.287607983318439e-05, "epoch": 0.25767053917187965, "percentage": 2.58, "elapsed_time": "0:06:34", "remaining_time": "4:08:28", "throughput": 2542.97, "total_tokens": 1002720} {"current_steps": 1735, "total_steps": 67140, "loss": 0.8752, "lr": 1.291331546023235e-05, "epoch": 0.25841525171283886, "percentage": 2.58, "elapsed_time": "0:06:35", "remaining_time": "4:08:26", "throughput": 2542.67, "total_tokens": 1005440} {"current_steps": 1740, "total_steps": 67140, "loss": 0.7863, "lr": 1.295055108728031e-05, "epoch": 0.25915996425379806, "percentage": 2.59, "elapsed_time": "0:06:36", "remaining_time": "4:08:23", "throughput": 2542.07, "total_tokens": 1007936} {"current_steps": 1745, "total_steps": 67140, "loss": 0.8869, "lr": 1.2987786714328271e-05, "epoch": 0.2599046767947572, "percentage": 2.6, "elapsed_time": "0:06:37", "remaining_time": "4:08:21", "throughput": 2542.09, "total_tokens": 1010848} {"current_steps": 1750, "total_steps": 67140, "loss": 0.8411, "lr": 1.3025022341376231e-05, "epoch": 0.2606493893357164, "percentage": 2.61, "elapsed_time": "0:06:38", "remaining_time": "4:08:20", "throughput": 2541.99, "total_tokens": 1013664} {"current_steps": 1755, "total_steps": 67140, "loss": 0.8157, "lr": 1.3062257968424188e-05, "epoch": 0.2613941018766756, "percentage": 2.61, "elapsed_time": "0:06:39", "remaining_time": "4:08:19", "throughput": 2542.49, "total_tokens": 1016800} {"current_steps": 1760, "total_steps": 67140, "loss": 0.8327, "lr": 1.3099493595472147e-05, "epoch": 0.2621388144176348, "percentage": 2.62, "elapsed_time": "0:06:41", "remaining_time": "4:08:18", "throughput": 2542.36, "total_tokens": 1019648} {"current_steps": 1765, "total_steps": 67140, "loss": 0.804, "lr": 1.3136729222520109e-05, "epoch": 0.26288352695859396, "percentage": 2.63, "elapsed_time": "0:06:42", "remaining_time": "4:08:16", "throughput": 2542.29, "total_tokens": 1022432} {"current_steps": 1770, "total_steps": 67140, "loss": 0.8143, "lr": 1.3173964849568069e-05, "epoch": 0.26362823949955316, "percentage": 2.64, "elapsed_time": "0:06:43", "remaining_time": "4:08:15", "throughput": 2542.52, "total_tokens": 1025472} {"current_steps": 1775, "total_steps": 67140, "loss": 0.8252, "lr": 1.3211200476616025e-05, "epoch": 0.26437295204051237, "percentage": 2.64, "elapsed_time": "0:06:44", "remaining_time": "4:08:14", "throughput": 2542.41, "total_tokens": 1028288} {"current_steps": 1780, "total_steps": 67140, "loss": 0.8058, "lr": 1.3248436103663985e-05, "epoch": 0.26511766458147157, "percentage": 2.65, "elapsed_time": "0:06:45", "remaining_time": "4:08:11", "throughput": 2542.23, "total_tokens": 1031040} {"current_steps": 1785, "total_steps": 67140, "loss": 0.852, "lr": 1.3285671730711947e-05, "epoch": 0.2658623771224307, "percentage": 2.66, "elapsed_time": "0:06:46", "remaining_time": "4:08:10", "throughput": 2541.95, "total_tokens": 1033792} {"current_steps": 1790, "total_steps": 67140, "loss": 0.8148, "lr": 1.3322907357759907e-05, "epoch": 0.2666070896633899, "percentage": 2.67, "elapsed_time": "0:06:47", "remaining_time": "4:08:08", "throughput": 2541.53, "total_tokens": 1036448} {"current_steps": 1795, "total_steps": 67140, "loss": 0.7996, "lr": 1.3360142984807863e-05, "epoch": 0.2673518022043491, "percentage": 2.67, "elapsed_time": "0:06:48", "remaining_time": "4:08:05", "throughput": 2541.3, "total_tokens": 1039168} {"current_steps": 1800, "total_steps": 67140, "loss": 0.7911, "lr": 1.3397378611855823e-05, "epoch": 0.2680965147453083, "percentage": 2.68, "elapsed_time": "0:06:50", "remaining_time": "4:08:04", "throughput": 2541.15, "total_tokens": 1041952} {"current_steps": 1805, "total_steps": 67140, "loss": 0.8098, "lr": 1.3434614238903784e-05, "epoch": 0.2688412272862675, "percentage": 2.69, "elapsed_time": "0:06:51", "remaining_time": "4:08:01", "throughput": 2540.88, "total_tokens": 1044608} {"current_steps": 1810, "total_steps": 67140, "loss": 0.9276, "lr": 1.3471849865951744e-05, "epoch": 0.2695859398272267, "percentage": 2.7, "elapsed_time": "0:06:52", "remaining_time": "4:08:00", "throughput": 2540.93, "total_tokens": 1047552} {"current_steps": 1815, "total_steps": 67140, "loss": 0.8009, "lr": 1.3509085492999704e-05, "epoch": 0.2703306523681859, "percentage": 2.7, "elapsed_time": "0:06:53", "remaining_time": "4:08:04", "throughput": 2541.89, "total_tokens": 1051200} {"current_steps": 1820, "total_steps": 67140, "loss": 0.8269, "lr": 1.354632112004766e-05, "epoch": 0.2710753649091451, "percentage": 2.71, "elapsed_time": "0:06:54", "remaining_time": "4:08:02", "throughput": 2541.56, "total_tokens": 1053888} {"current_steps": 1825, "total_steps": 67140, "loss": 0.7616, "lr": 1.3583556747095622e-05, "epoch": 0.2718200774501043, "percentage": 2.72, "elapsed_time": "0:06:55", "remaining_time": "4:07:59", "throughput": 2541.21, "total_tokens": 1056544} {"current_steps": 1830, "total_steps": 67140, "loss": 0.9282, "lr": 1.3620792374143582e-05, "epoch": 0.2725647899910634, "percentage": 2.73, "elapsed_time": "0:06:56", "remaining_time": "4:07:57", "throughput": 2540.99, "total_tokens": 1059296} {"current_steps": 1835, "total_steps": 67140, "loss": 0.8151, "lr": 1.3658028001191542e-05, "epoch": 0.27330950253202263, "percentage": 2.73, "elapsed_time": "0:06:58", "remaining_time": "4:07:56", "throughput": 2541.01, "total_tokens": 1062176} {"current_steps": 1840, "total_steps": 67140, "loss": 0.8991, "lr": 1.3695263628239498e-05, "epoch": 0.27405421507298183, "percentage": 2.74, "elapsed_time": "0:06:59", "remaining_time": "4:07:55", "throughput": 2540.86, "total_tokens": 1064992} {"current_steps": 1845, "total_steps": 67140, "loss": 0.895, "lr": 1.373249925528746e-05, "epoch": 0.27479892761394104, "percentage": 2.75, "elapsed_time": "0:07:00", "remaining_time": "4:07:53", "throughput": 2540.84, "total_tokens": 1067872} {"current_steps": 1850, "total_steps": 67140, "loss": 0.8558, "lr": 1.376973488233542e-05, "epoch": 0.2755436401549002, "percentage": 2.76, "elapsed_time": "0:07:01", "remaining_time": "4:07:52", "throughput": 2540.94, "total_tokens": 1070816} {"current_steps": 1855, "total_steps": 67140, "loss": 0.8051, "lr": 1.380697050938338e-05, "epoch": 0.2762883526958594, "percentage": 2.76, "elapsed_time": "0:07:02", "remaining_time": "4:07:50", "throughput": 2540.85, "total_tokens": 1073600} {"current_steps": 1860, "total_steps": 67140, "loss": 0.8314, "lr": 1.3844206136431338e-05, "epoch": 0.2770330652368186, "percentage": 2.77, "elapsed_time": "0:07:03", "remaining_time": "4:07:49", "throughput": 2540.89, "total_tokens": 1076512} {"current_steps": 1865, "total_steps": 67140, "loss": 0.8524, "lr": 1.3881441763479298e-05, "epoch": 0.2777777777777778, "percentage": 2.78, "elapsed_time": "0:07:04", "remaining_time": "4:07:47", "throughput": 2540.66, "total_tokens": 1079264} {"current_steps": 1870, "total_steps": 67140, "loss": 0.9392, "lr": 1.3918677390527257e-05, "epoch": 0.278522490318737, "percentage": 2.79, "elapsed_time": "0:07:05", "remaining_time": "4:07:46", "throughput": 2540.71, "total_tokens": 1082144} {"current_steps": 1875, "total_steps": 67140, "loss": 0.8168, "lr": 1.3955913017575217e-05, "epoch": 0.27926720285969614, "percentage": 2.79, "elapsed_time": "0:07:07", "remaining_time": "4:07:44", "throughput": 2540.62, "total_tokens": 1084960} {"current_steps": 1880, "total_steps": 67140, "loss": 0.8084, "lr": 1.3993148644623177e-05, "epoch": 0.28001191540065534, "percentage": 2.8, "elapsed_time": "0:07:08", "remaining_time": "4:07:44", "throughput": 2540.67, "total_tokens": 1087936} {"current_steps": 1885, "total_steps": 67140, "loss": 0.8305, "lr": 1.4030384271671135e-05, "epoch": 0.28075662794161454, "percentage": 2.81, "elapsed_time": "0:07:09", "remaining_time": "4:07:44", "throughput": 2540.83, "total_tokens": 1091008} {"current_steps": 1890, "total_steps": 67140, "loss": 0.9858, "lr": 1.4067619898719095e-05, "epoch": 0.28150134048257375, "percentage": 2.82, "elapsed_time": "0:07:10", "remaining_time": "4:07:41", "throughput": 2540.57, "total_tokens": 1093664} {"current_steps": 1895, "total_steps": 67140, "loss": 0.8249, "lr": 1.4104855525767055e-05, "epoch": 0.2822460530235329, "percentage": 2.82, "elapsed_time": "0:07:11", "remaining_time": "4:07:40", "throughput": 2540.75, "total_tokens": 1096640} {"current_steps": 1900, "total_steps": 67140, "loss": 0.754, "lr": 1.4142091152815015e-05, "epoch": 0.2829907655644921, "percentage": 2.83, "elapsed_time": "0:07:12", "remaining_time": "4:07:37", "throughput": 2540.3, "total_tokens": 1099200} {"current_steps": 1905, "total_steps": 67140, "loss": 0.9017, "lr": 1.4179326779862973e-05, "epoch": 0.2837354781054513, "percentage": 2.84, "elapsed_time": "0:07:13", "remaining_time": "4:07:38", "throughput": 2540.66, "total_tokens": 1102368} {"current_steps": 1910, "total_steps": 67140, "loss": 0.8283, "lr": 1.4216562406910933e-05, "epoch": 0.2844801906464105, "percentage": 2.84, "elapsed_time": "0:07:15", "remaining_time": "4:07:36", "throughput": 2540.32, "total_tokens": 1105056} {"current_steps": 1915, "total_steps": 67140, "loss": 0.7989, "lr": 1.4253798033958893e-05, "epoch": 0.28522490318736965, "percentage": 2.85, "elapsed_time": "0:07:16", "remaining_time": "4:07:35", "throughput": 2540.39, "total_tokens": 1108032} {"current_steps": 1920, "total_steps": 67140, "loss": 0.8267, "lr": 1.4291033661006853e-05, "epoch": 0.28596961572832885, "percentage": 2.86, "elapsed_time": "0:07:17", "remaining_time": "4:07:34", "throughput": 2540.36, "total_tokens": 1110880} {"current_steps": 1925, "total_steps": 67140, "loss": 0.8895, "lr": 1.432826928805481e-05, "epoch": 0.28671432826928805, "percentage": 2.87, "elapsed_time": "0:07:18", "remaining_time": "4:07:31", "throughput": 2540.16, "total_tokens": 1113568} {"current_steps": 1930, "total_steps": 67140, "loss": 0.816, "lr": 1.436550491510277e-05, "epoch": 0.28745904081024726, "percentage": 2.87, "elapsed_time": "0:07:19", "remaining_time": "4:07:29", "throughput": 2540.14, "total_tokens": 1116416} {"current_steps": 1935, "total_steps": 67140, "loss": 0.8171, "lr": 1.440274054215073e-05, "epoch": 0.28820375335120646, "percentage": 2.88, "elapsed_time": "0:07:20", "remaining_time": "4:07:28", "throughput": 2540.04, "total_tokens": 1119232} {"current_steps": 1940, "total_steps": 67140, "loss": 0.7989, "lr": 1.443997616919869e-05, "epoch": 0.2889484658921656, "percentage": 2.89, "elapsed_time": "0:07:21", "remaining_time": "4:07:27", "throughput": 2540.05, "total_tokens": 1122144} {"current_steps": 1945, "total_steps": 67140, "loss": 0.8008, "lr": 1.447721179624665e-05, "epoch": 0.2896931784331248, "percentage": 2.9, "elapsed_time": "0:07:22", "remaining_time": "4:07:26", "throughput": 2540.08, "total_tokens": 1125056} {"current_steps": 1950, "total_steps": 67140, "loss": 0.8327, "lr": 1.4514447423294608e-05, "epoch": 0.290437890974084, "percentage": 2.9, "elapsed_time": "0:07:24", "remaining_time": "4:07:24", "throughput": 2539.79, "total_tokens": 1127744} {"current_steps": 1955, "total_steps": 67140, "loss": 0.8072, "lr": 1.4551683050342568e-05, "epoch": 0.2911826035150432, "percentage": 2.91, "elapsed_time": "0:07:25", "remaining_time": "4:07:21", "throughput": 2539.55, "total_tokens": 1130432} {"current_steps": 1960, "total_steps": 67140, "loss": 0.7675, "lr": 1.4588918677390528e-05, "epoch": 0.29192731605600236, "percentage": 2.92, "elapsed_time": "0:07:26", "remaining_time": "4:07:20", "throughput": 2539.3, "total_tokens": 1133184} {"current_steps": 1965, "total_steps": 67140, "loss": 0.8188, "lr": 1.4626154304438488e-05, "epoch": 0.29267202859696156, "percentage": 2.93, "elapsed_time": "0:07:27", "remaining_time": "4:07:20", "throughput": 2539.5, "total_tokens": 1136256} {"current_steps": 1970, "total_steps": 67140, "loss": 0.8094, "lr": 1.4663389931486446e-05, "epoch": 0.29341674113792077, "percentage": 2.93, "elapsed_time": "0:07:28", "remaining_time": "4:07:18", "throughput": 2539.49, "total_tokens": 1139104} {"current_steps": 1975, "total_steps": 67140, "loss": 0.762, "lr": 1.4700625558534406e-05, "epoch": 0.29416145367887997, "percentage": 2.94, "elapsed_time": "0:07:29", "remaining_time": "4:07:18", "throughput": 2539.73, "total_tokens": 1142176} {"current_steps": 1980, "total_steps": 67140, "loss": 0.8528, "lr": 1.4737861185582366e-05, "epoch": 0.2949061662198391, "percentage": 2.95, "elapsed_time": "0:07:30", "remaining_time": "4:07:16", "throughput": 2539.53, "total_tokens": 1144896} {"current_steps": 1985, "total_steps": 67140, "loss": 0.7739, "lr": 1.4775096812630326e-05, "epoch": 0.2956508787607983, "percentage": 2.96, "elapsed_time": "0:07:32", "remaining_time": "4:07:17", "throughput": 2540.06, "total_tokens": 1148192} {"current_steps": 1990, "total_steps": 67140, "loss": 0.8239, "lr": 1.4812332439678284e-05, "epoch": 0.2963955913017575, "percentage": 2.96, "elapsed_time": "0:07:33", "remaining_time": "4:07:15", "throughput": 2539.67, "total_tokens": 1150848} {"current_steps": 1995, "total_steps": 67140, "loss": 0.8435, "lr": 1.4849568066726244e-05, "epoch": 0.2971403038427167, "percentage": 2.97, "elapsed_time": "0:07:34", "remaining_time": "4:07:14", "throughput": 2539.78, "total_tokens": 1153792} {"current_steps": 2000, "total_steps": 67140, "loss": 0.8383, "lr": 1.4886803693774203e-05, "epoch": 0.2978850163836759, "percentage": 2.98, "elapsed_time": "0:07:35", "remaining_time": "4:07:12", "throughput": 2539.64, "total_tokens": 1156544} {"current_steps": 2005, "total_steps": 67140, "loss": 0.8626, "lr": 1.4924039320822163e-05, "epoch": 0.2986297289246351, "percentage": 2.99, "elapsed_time": "0:07:36", "remaining_time": "4:07:10", "throughput": 2539.51, "total_tokens": 1159360} {"current_steps": 2010, "total_steps": 67140, "loss": 0.8969, "lr": 1.4961274947870125e-05, "epoch": 0.2993744414655943, "percentage": 2.99, "elapsed_time": "0:07:37", "remaining_time": "4:07:09", "throughput": 2539.46, "total_tokens": 1162240} {"current_steps": 2015, "total_steps": 67140, "loss": 0.8089, "lr": 1.4998510574918081e-05, "epoch": 0.3001191540065535, "percentage": 3.0, "elapsed_time": "0:07:38", "remaining_time": "4:07:07", "throughput": 2539.44, "total_tokens": 1165056} {"current_steps": 2020, "total_steps": 67140, "loss": 0.8131, "lr": 1.5035746201966041e-05, "epoch": 0.3008638665475127, "percentage": 3.01, "elapsed_time": "0:07:39", "remaining_time": "4:07:05", "throughput": 2538.98, "total_tokens": 1167616} {"current_steps": 2025, "total_steps": 67140, "loss": 0.8279, "lr": 1.5072981829014001e-05, "epoch": 0.30160857908847183, "percentage": 3.02, "elapsed_time": "0:07:41", "remaining_time": "4:07:04", "throughput": 2538.84, "total_tokens": 1170432} {"current_steps": 2030, "total_steps": 67140, "loss": 0.7964, "lr": 1.5110217456061963e-05, "epoch": 0.30235329162943103, "percentage": 3.02, "elapsed_time": "0:07:42", "remaining_time": "4:07:02", "throughput": 2538.7, "total_tokens": 1173216} {"current_steps": 2035, "total_steps": 67140, "loss": 0.7741, "lr": 1.5147453083109919e-05, "epoch": 0.30309800417039023, "percentage": 3.03, "elapsed_time": "0:07:43", "remaining_time": "4:07:02", "throughput": 2538.69, "total_tokens": 1176192} {"current_steps": 2040, "total_steps": 67140, "loss": 0.8406, "lr": 1.5184688710157879e-05, "epoch": 0.30384271671134944, "percentage": 3.04, "elapsed_time": "0:07:44", "remaining_time": "4:07:02", "throughput": 2539.02, "total_tokens": 1179296} {"current_steps": 2045, "total_steps": 67140, "loss": 0.8564, "lr": 1.5221924337205839e-05, "epoch": 0.3045874292523086, "percentage": 3.05, "elapsed_time": "0:07:45", "remaining_time": "4:07:01", "throughput": 2539.08, "total_tokens": 1182240} {"current_steps": 2050, "total_steps": 67140, "loss": 0.8391, "lr": 1.52591599642538e-05, "epoch": 0.3053321417932678, "percentage": 3.05, "elapsed_time": "0:07:46", "remaining_time": "4:07:00", "throughput": 2539.0, "total_tokens": 1185088} {"current_steps": 2055, "total_steps": 67140, "loss": 0.8133, "lr": 1.529639559130176e-05, "epoch": 0.306076854334227, "percentage": 3.06, "elapsed_time": "0:07:47", "remaining_time": "4:06:59", "throughput": 2539.21, "total_tokens": 1188128} {"current_steps": 2060, "total_steps": 67140, "loss": 0.8007, "lr": 1.5333631218349718e-05, "epoch": 0.3068215668751862, "percentage": 3.07, "elapsed_time": "0:07:49", "remaining_time": "4:06:57", "throughput": 2539.13, "total_tokens": 1190944} {"current_steps": 2065, "total_steps": 67140, "loss": 0.8381, "lr": 1.5370866845397678e-05, "epoch": 0.3075662794161454, "percentage": 3.08, "elapsed_time": "0:07:50", "remaining_time": "4:06:56", "throughput": 2539.29, "total_tokens": 1193920} {"current_steps": 2070, "total_steps": 67140, "loss": 0.8008, "lr": 1.5408102472445638e-05, "epoch": 0.30831099195710454, "percentage": 3.08, "elapsed_time": "0:07:51", "remaining_time": "4:06:54", "throughput": 2539.12, "total_tokens": 1196640} {"current_steps": 2075, "total_steps": 67140, "loss": 0.859, "lr": 1.5445338099493598e-05, "epoch": 0.30905570449806374, "percentage": 3.09, "elapsed_time": "0:07:52", "remaining_time": "4:06:53", "throughput": 2539.22, "total_tokens": 1199616} {"current_steps": 2080, "total_steps": 67140, "loss": 0.8235, "lr": 1.5482573726541554e-05, "epoch": 0.30980041703902295, "percentage": 3.1, "elapsed_time": "0:07:53", "remaining_time": "4:06:52", "throughput": 2539.05, "total_tokens": 1202368} {"current_steps": 2085, "total_steps": 67140, "loss": 0.8023, "lr": 1.5519809353589514e-05, "epoch": 0.31054512957998215, "percentage": 3.11, "elapsed_time": "0:07:54", "remaining_time": "4:06:50", "throughput": 2539.21, "total_tokens": 1205312} {"current_steps": 2090, "total_steps": 67140, "loss": 0.8231, "lr": 1.5557044980637474e-05, "epoch": 0.3112898421209413, "percentage": 3.11, "elapsed_time": "0:07:55", "remaining_time": "4:06:51", "throughput": 2539.73, "total_tokens": 1208608} {"current_steps": 2095, "total_steps": 67140, "loss": 0.8268, "lr": 1.5594280607685434e-05, "epoch": 0.3120345546619005, "percentage": 3.12, "elapsed_time": "0:07:57", "remaining_time": "4:06:50", "throughput": 2539.76, "total_tokens": 1211520} {"current_steps": 2100, "total_steps": 67140, "loss": 0.8107, "lr": 1.5631516234733394e-05, "epoch": 0.3127792672028597, "percentage": 3.13, "elapsed_time": "0:07:58", "remaining_time": "4:06:50", "throughput": 2540.01, "total_tokens": 1214592} {"current_steps": 2105, "total_steps": 67140, "loss": 0.8254, "lr": 1.5668751861781354e-05, "epoch": 0.3135239797438189, "percentage": 3.14, "elapsed_time": "0:07:59", "remaining_time": "4:06:48", "throughput": 2540.03, "total_tokens": 1217440} {"current_steps": 2110, "total_steps": 67140, "loss": 0.8137, "lr": 1.5705987488829313e-05, "epoch": 0.31426869228477805, "percentage": 3.14, "elapsed_time": "0:08:00", "remaining_time": "4:06:47", "throughput": 2540.12, "total_tokens": 1220416} {"current_steps": 2115, "total_steps": 67140, "loss": 0.8132, "lr": 1.5743223115877273e-05, "epoch": 0.31501340482573725, "percentage": 3.15, "elapsed_time": "0:08:01", "remaining_time": "4:06:45", "throughput": 2539.54, "total_tokens": 1222912} {"current_steps": 2120, "total_steps": 67140, "loss": 0.812, "lr": 1.578045874292523e-05, "epoch": 0.31575811736669646, "percentage": 3.16, "elapsed_time": "0:08:02", "remaining_time": "4:06:44", "throughput": 2539.75, "total_tokens": 1225952} {"current_steps": 2125, "total_steps": 67140, "loss": 0.8083, "lr": 1.581769436997319e-05, "epoch": 0.31650282990765566, "percentage": 3.17, "elapsed_time": "0:08:03", "remaining_time": "4:06:42", "throughput": 2539.63, "total_tokens": 1228736} {"current_steps": 2130, "total_steps": 67140, "loss": 0.8249, "lr": 1.585492999702115e-05, "epoch": 0.31724754244861486, "percentage": 3.17, "elapsed_time": "0:08:04", "remaining_time": "4:06:41", "throughput": 2539.6, "total_tokens": 1231584} {"current_steps": 2135, "total_steps": 67140, "loss": 0.7956, "lr": 1.589216562406911e-05, "epoch": 0.317992254989574, "percentage": 3.18, "elapsed_time": "0:08:06", "remaining_time": "4:06:39", "throughput": 2539.57, "total_tokens": 1234432} {"current_steps": 2140, "total_steps": 67140, "loss": 0.8012, "lr": 1.5929401251117073e-05, "epoch": 0.3187369675305332, "percentage": 3.19, "elapsed_time": "0:08:07", "remaining_time": "4:06:38", "throughput": 2539.66, "total_tokens": 1237376} {"current_steps": 2145, "total_steps": 67140, "loss": 0.8011, "lr": 1.596663687816503e-05, "epoch": 0.3194816800714924, "percentage": 3.19, "elapsed_time": "0:08:08", "remaining_time": "4:06:38", "throughput": 2539.72, "total_tokens": 1240352} {"current_steps": 2150, "total_steps": 67140, "loss": 0.8401, "lr": 1.600387250521299e-05, "epoch": 0.3202263926124516, "percentage": 3.2, "elapsed_time": "0:08:09", "remaining_time": "4:06:35", "throughput": 2539.33, "total_tokens": 1242944} {"current_steps": 2155, "total_steps": 67140, "loss": 0.8325, "lr": 1.604110813226095e-05, "epoch": 0.32097110515341076, "percentage": 3.21, "elapsed_time": "0:08:10", "remaining_time": "4:06:34", "throughput": 2539.27, "total_tokens": 1245760} {"current_steps": 2160, "total_steps": 67140, "loss": 1.1421, "lr": 1.607834375930891e-05, "epoch": 0.32171581769436997, "percentage": 3.22, "elapsed_time": "0:08:11", "remaining_time": "4:06:31", "throughput": 2538.91, "total_tokens": 1248352} {"current_steps": 2165, "total_steps": 67140, "loss": 0.8353, "lr": 1.6115579386356865e-05, "epoch": 0.32246053023532917, "percentage": 3.22, "elapsed_time": "0:08:12", "remaining_time": "4:06:30", "throughput": 2538.62, "total_tokens": 1251072} {"current_steps": 2170, "total_steps": 67140, "loss": 0.8223, "lr": 1.6152815013404825e-05, "epoch": 0.32320524277628837, "percentage": 3.23, "elapsed_time": "0:08:13", "remaining_time": "4:06:28", "throughput": 2538.38, "total_tokens": 1253792} {"current_steps": 2175, "total_steps": 67140, "loss": 1.113, "lr": 1.6190050640452785e-05, "epoch": 0.3239499553172475, "percentage": 3.24, "elapsed_time": "0:08:15", "remaining_time": "4:06:26", "throughput": 2538.15, "total_tokens": 1256512} {"current_steps": 2180, "total_steps": 67140, "loss": 0.8199, "lr": 1.6227286267500748e-05, "epoch": 0.3246946678582067, "percentage": 3.25, "elapsed_time": "0:08:16", "remaining_time": "4:06:24", "throughput": 2537.98, "total_tokens": 1259200} {"current_steps": 2185, "total_steps": 67140, "loss": 0.8207, "lr": 1.6264521894548704e-05, "epoch": 0.3254393803991659, "percentage": 3.25, "elapsed_time": "0:08:17", "remaining_time": "4:06:23", "throughput": 2538.19, "total_tokens": 1262208} {"current_steps": 2190, "total_steps": 67140, "loss": 0.8023, "lr": 1.6301757521596664e-05, "epoch": 0.3261840929401251, "percentage": 3.26, "elapsed_time": "0:08:18", "remaining_time": "4:06:21", "throughput": 2538.03, "total_tokens": 1264960} {"current_steps": 2195, "total_steps": 67140, "loss": 0.7491, "lr": 1.6338993148644624e-05, "epoch": 0.32692880548108433, "percentage": 3.27, "elapsed_time": "0:08:19", "remaining_time": "4:06:20", "throughput": 2538.21, "total_tokens": 1268000} {"current_steps": 2200, "total_steps": 67140, "loss": 0.8252, "lr": 1.6376228775692584e-05, "epoch": 0.3276735180220435, "percentage": 3.28, "elapsed_time": "0:08:20", "remaining_time": "4:06:21", "throughput": 2538.72, "total_tokens": 1271296} {"current_steps": 2205, "total_steps": 67140, "loss": 0.821, "lr": 1.6413464402740544e-05, "epoch": 0.3284182305630027, "percentage": 3.28, "elapsed_time": "0:08:21", "remaining_time": "4:06:21", "throughput": 2538.92, "total_tokens": 1274368} {"current_steps": 2210, "total_steps": 67140, "loss": 0.8159, "lr": 1.64507000297885e-05, "epoch": 0.3291629431039619, "percentage": 3.29, "elapsed_time": "0:08:23", "remaining_time": "4:06:20", "throughput": 2538.86, "total_tokens": 1277216} {"current_steps": 2215, "total_steps": 67140, "loss": 0.8163, "lr": 1.648793565683646e-05, "epoch": 0.3299076556449211, "percentage": 3.3, "elapsed_time": "0:08:24", "remaining_time": "4:06:18", "throughput": 2538.84, "total_tokens": 1280064} {"current_steps": 2220, "total_steps": 67140, "loss": 0.7614, "lr": 1.6525171283884423e-05, "epoch": 0.33065236818588023, "percentage": 3.31, "elapsed_time": "0:08:25", "remaining_time": "4:06:17", "throughput": 2538.75, "total_tokens": 1282880} {"current_steps": 2225, "total_steps": 67140, "loss": 0.8568, "lr": 1.6562406910932383e-05, "epoch": 0.33139708072683943, "percentage": 3.31, "elapsed_time": "0:08:26", "remaining_time": "4:06:16", "throughput": 2538.84, "total_tokens": 1285856} {"current_steps": 2230, "total_steps": 67140, "loss": 0.7924, "lr": 1.659964253798034e-05, "epoch": 0.33214179326779864, "percentage": 3.32, "elapsed_time": "0:08:27", "remaining_time": "4:06:14", "throughput": 2538.72, "total_tokens": 1288576} {"current_steps": 2235, "total_steps": 67140, "loss": 0.8141, "lr": 1.66368781650283e-05, "epoch": 0.33288650580875784, "percentage": 3.33, "elapsed_time": "0:08:28", "remaining_time": "4:06:12", "throughput": 2538.61, "total_tokens": 1291360} {"current_steps": 2240, "total_steps": 67140, "loss": 0.8206, "lr": 1.667411379207626e-05, "epoch": 0.333631218349717, "percentage": 3.34, "elapsed_time": "0:08:29", "remaining_time": "4:06:11", "throughput": 2538.75, "total_tokens": 1294368} {"current_steps": 2245, "total_steps": 67140, "loss": 0.8092, "lr": 1.671134941912422e-05, "epoch": 0.3343759308906762, "percentage": 3.34, "elapsed_time": "0:08:30", "remaining_time": "4:06:10", "throughput": 2538.65, "total_tokens": 1297152} {"current_steps": 2250, "total_steps": 67140, "loss": 0.8098, "lr": 1.6748585046172176e-05, "epoch": 0.3351206434316354, "percentage": 3.35, "elapsed_time": "0:08:32", "remaining_time": "4:06:11", "throughput": 2539.37, "total_tokens": 1300640} {"current_steps": 2255, "total_steps": 67140, "loss": 0.8064, "lr": 1.6785820673220136e-05, "epoch": 0.3358653559725946, "percentage": 3.36, "elapsed_time": "0:08:33", "remaining_time": "4:06:10", "throughput": 2539.3, "total_tokens": 1303488} {"current_steps": 2260, "total_steps": 67140, "loss": 1.2177, "lr": 1.68230563002681e-05, "epoch": 0.3366100685135538, "percentage": 3.37, "elapsed_time": "0:08:34", "remaining_time": "4:06:10", "throughput": 2539.41, "total_tokens": 1306528} {"current_steps": 2265, "total_steps": 67140, "loss": 1.0531, "lr": 1.686029192731606e-05, "epoch": 0.33735478105451294, "percentage": 3.37, "elapsed_time": "0:08:35", "remaining_time": "4:06:10", "throughput": 2539.87, "total_tokens": 1309792} {"current_steps": 2270, "total_steps": 67140, "loss": 0.835, "lr": 1.689752755436402e-05, "epoch": 0.33809949359547214, "percentage": 3.38, "elapsed_time": "0:08:36", "remaining_time": "4:06:08", "throughput": 2539.58, "total_tokens": 1312448} {"current_steps": 2275, "total_steps": 67140, "loss": 0.8343, "lr": 1.6934763181411975e-05, "epoch": 0.33884420613643135, "percentage": 3.39, "elapsed_time": "0:08:37", "remaining_time": "4:06:06", "throughput": 2539.41, "total_tokens": 1315136} {"current_steps": 2280, "total_steps": 67140, "loss": 0.8007, "lr": 1.6971998808459935e-05, "epoch": 0.33958891867739055, "percentage": 3.4, "elapsed_time": "0:08:39", "remaining_time": "4:06:05", "throughput": 2539.55, "total_tokens": 1318144} {"current_steps": 2285, "total_steps": 67140, "loss": 0.8031, "lr": 1.7009234435507895e-05, "epoch": 0.3403336312183497, "percentage": 3.4, "elapsed_time": "0:08:40", "remaining_time": "4:06:03", "throughput": 2539.55, "total_tokens": 1320992} {"current_steps": 2290, "total_steps": 67140, "loss": 0.8873, "lr": 1.7046470062555855e-05, "epoch": 0.3410783437593089, "percentage": 3.41, "elapsed_time": "0:08:41", "remaining_time": "4:06:02", "throughput": 2539.47, "total_tokens": 1323808} {"current_steps": 2295, "total_steps": 67140, "loss": 0.8413, "lr": 1.7083705689603814e-05, "epoch": 0.3418230563002681, "percentage": 3.42, "elapsed_time": "0:08:42", "remaining_time": "4:05:59", "throughput": 2539.15, "total_tokens": 1326400} {"current_steps": 2300, "total_steps": 67140, "loss": 0.8264, "lr": 1.7120941316651774e-05, "epoch": 0.3425677688412273, "percentage": 3.43, "elapsed_time": "0:08:43", "remaining_time": "4:05:58", "throughput": 2539.03, "total_tokens": 1329184} {"current_steps": 2305, "total_steps": 67140, "loss": 0.794, "lr": 1.7158176943699734e-05, "epoch": 0.34331248138218645, "percentage": 3.43, "elapsed_time": "0:08:44", "remaining_time": "4:05:57", "throughput": 2539.25, "total_tokens": 1332224} {"current_steps": 2310, "total_steps": 67140, "loss": 0.7891, "lr": 1.7195412570747694e-05, "epoch": 0.34405719392314565, "percentage": 3.44, "elapsed_time": "0:08:45", "remaining_time": "4:05:56", "throughput": 2539.29, "total_tokens": 1335168} {"current_steps": 2315, "total_steps": 67140, "loss": 0.8767, "lr": 1.723264819779565e-05, "epoch": 0.34480190646410486, "percentage": 3.45, "elapsed_time": "0:08:46", "remaining_time": "4:05:55", "throughput": 2539.27, "total_tokens": 1338016} {"current_steps": 2320, "total_steps": 67140, "loss": 0.8321, "lr": 1.726988382484361e-05, "epoch": 0.34554661900506406, "percentage": 3.46, "elapsed_time": "0:08:48", "remaining_time": "4:05:52", "throughput": 2538.95, "total_tokens": 1340640} {"current_steps": 2325, "total_steps": 67140, "loss": 0.8011, "lr": 1.730711945189157e-05, "epoch": 0.34629133154602326, "percentage": 3.46, "elapsed_time": "0:08:49", "remaining_time": "4:05:52", "throughput": 2539.09, "total_tokens": 1343648} {"current_steps": 2330, "total_steps": 67140, "loss": 0.7867, "lr": 1.734435507893953e-05, "epoch": 0.3470360440869824, "percentage": 3.47, "elapsed_time": "0:08:50", "remaining_time": "4:05:50", "throughput": 2539.08, "total_tokens": 1346464} {"current_steps": 2335, "total_steps": 67140, "loss": 0.7928, "lr": 1.738159070598749e-05, "epoch": 0.3477807566279416, "percentage": 3.48, "elapsed_time": "0:08:51", "remaining_time": "4:05:49", "throughput": 2539.22, "total_tokens": 1349408} {"current_steps": 2340, "total_steps": 67140, "loss": 0.8558, "lr": 1.741882633303545e-05, "epoch": 0.3485254691689008, "percentage": 3.49, "elapsed_time": "0:08:52", "remaining_time": "4:05:47", "throughput": 2539.22, "total_tokens": 1352288} {"current_steps": 2345, "total_steps": 67140, "loss": 0.7812, "lr": 1.745606196008341e-05, "epoch": 0.34927018170986, "percentage": 3.49, "elapsed_time": "0:08:53", "remaining_time": "4:05:45", "throughput": 2538.93, "total_tokens": 1354944} {"current_steps": 2350, "total_steps": 67140, "loss": 0.8045, "lr": 1.749329758713137e-05, "epoch": 0.35001489425081916, "percentage": 3.5, "elapsed_time": "0:08:54", "remaining_time": "4:05:45", "throughput": 2539.26, "total_tokens": 1358048} {"current_steps": 2355, "total_steps": 67140, "loss": 0.8376, "lr": 1.753053321417933e-05, "epoch": 0.35075960679177837, "percentage": 3.51, "elapsed_time": "0:08:55", "remaining_time": "4:05:42", "throughput": 2539.04, "total_tokens": 1360704} {"current_steps": 2360, "total_steps": 67140, "loss": 0.8094, "lr": 1.7567768841227286e-05, "epoch": 0.35150431933273757, "percentage": 3.52, "elapsed_time": "0:08:56", "remaining_time": "4:05:40", "throughput": 2538.63, "total_tokens": 1363232} {"current_steps": 2365, "total_steps": 67140, "loss": 0.7936, "lr": 1.7605004468275246e-05, "epoch": 0.35224903187369677, "percentage": 3.52, "elapsed_time": "0:08:58", "remaining_time": "4:05:39", "throughput": 2538.76, "total_tokens": 1366272} {"current_steps": 2370, "total_steps": 67140, "loss": 0.8107, "lr": 1.7642240095323205e-05, "epoch": 0.3529937444146559, "percentage": 3.53, "elapsed_time": "0:08:59", "remaining_time": "4:05:37", "throughput": 2538.64, "total_tokens": 1369024} {"current_steps": 2375, "total_steps": 67140, "loss": 0.7999, "lr": 1.7679475722371165e-05, "epoch": 0.3537384569556151, "percentage": 3.54, "elapsed_time": "0:09:00", "remaining_time": "4:05:36", "throughput": 2538.67, "total_tokens": 1371936} {"current_steps": 2380, "total_steps": 67140, "loss": 0.8048, "lr": 1.7716711349419125e-05, "epoch": 0.3544831694965743, "percentage": 3.54, "elapsed_time": "0:09:01", "remaining_time": "4:05:35", "throughput": 2538.9, "total_tokens": 1374976} {"current_steps": 2385, "total_steps": 67140, "loss": 0.811, "lr": 1.7753946976467085e-05, "epoch": 0.3552278820375335, "percentage": 3.55, "elapsed_time": "0:09:02", "remaining_time": "4:05:35", "throughput": 2539.37, "total_tokens": 1378208} {"current_steps": 2390, "total_steps": 67140, "loss": 0.8175, "lr": 1.7791182603515045e-05, "epoch": 0.35597259457849273, "percentage": 3.56, "elapsed_time": "0:09:03", "remaining_time": "4:05:34", "throughput": 2539.29, "total_tokens": 1381056} {"current_steps": 2395, "total_steps": 67140, "loss": 0.8096, "lr": 1.7828418230563005e-05, "epoch": 0.3567173071194519, "percentage": 3.57, "elapsed_time": "0:09:05", "remaining_time": "4:05:35", "throughput": 2539.8, "total_tokens": 1384384} {"current_steps": 2400, "total_steps": 67140, "loss": 0.865, "lr": 1.786565385761096e-05, "epoch": 0.3574620196604111, "percentage": 3.57, "elapsed_time": "0:09:06", "remaining_time": "4:05:33", "throughput": 2539.69, "total_tokens": 1387200} {"current_steps": 2405, "total_steps": 67140, "loss": 0.8289, "lr": 1.790288948465892e-05, "epoch": 0.3582067322013703, "percentage": 3.58, "elapsed_time": "0:09:07", "remaining_time": "4:05:33", "throughput": 2539.83, "total_tokens": 1390272} {"current_steps": 2410, "total_steps": 67140, "loss": 0.8108, "lr": 1.794012511170688e-05, "epoch": 0.3589514447423295, "percentage": 3.59, "elapsed_time": "0:09:08", "remaining_time": "4:05:33", "throughput": 2540.09, "total_tokens": 1393408} {"current_steps": 2415, "total_steps": 67140, "loss": 0.8332, "lr": 1.797736073875484e-05, "epoch": 0.35969615728328863, "percentage": 3.6, "elapsed_time": "0:09:09", "remaining_time": "4:05:32", "throughput": 2540.22, "total_tokens": 1396352} {"current_steps": 2420, "total_steps": 67140, "loss": 0.8087, "lr": 1.80145963658028e-05, "epoch": 0.36044086982424783, "percentage": 3.6, "elapsed_time": "0:09:10", "remaining_time": "4:05:31", "throughput": 2540.35, "total_tokens": 1399328} {"current_steps": 2425, "total_steps": 67140, "loss": 0.8944, "lr": 1.805183199285076e-05, "epoch": 0.36118558236520704, "percentage": 3.61, "elapsed_time": "0:09:11", "remaining_time": "4:05:29", "throughput": 2540.24, "total_tokens": 1402080} {"current_steps": 2430, "total_steps": 67140, "loss": 0.7992, "lr": 1.808906761989872e-05, "epoch": 0.36193029490616624, "percentage": 3.62, "elapsed_time": "0:09:13", "remaining_time": "4:05:26", "throughput": 2539.82, "total_tokens": 1404576} {"current_steps": 2435, "total_steps": 67140, "loss": 0.8077, "lr": 1.812630324694668e-05, "epoch": 0.3626750074471254, "percentage": 3.63, "elapsed_time": "0:09:14", "remaining_time": "4:05:26", "throughput": 2539.89, "total_tokens": 1407552} {"current_steps": 2440, "total_steps": 67140, "loss": 0.7669, "lr": 1.816353887399464e-05, "epoch": 0.3634197199880846, "percentage": 3.63, "elapsed_time": "0:09:15", "remaining_time": "4:05:24", "throughput": 2539.68, "total_tokens": 1410272} {"current_steps": 2445, "total_steps": 67140, "loss": 0.8473, "lr": 1.8200774501042596e-05, "epoch": 0.3641644325290438, "percentage": 3.64, "elapsed_time": "0:09:16", "remaining_time": "4:05:22", "throughput": 2539.54, "total_tokens": 1412992} {"current_steps": 2450, "total_steps": 67140, "loss": 0.8161, "lr": 1.8238010128090556e-05, "epoch": 0.364909145070003, "percentage": 3.65, "elapsed_time": "0:09:17", "remaining_time": "4:05:21", "throughput": 2539.48, "total_tokens": 1415840} {"current_steps": 2455, "total_steps": 67140, "loss": 0.7825, "lr": 1.8275245755138516e-05, "epoch": 0.3656538576109622, "percentage": 3.66, "elapsed_time": "0:09:18", "remaining_time": "4:05:19", "throughput": 2539.3, "total_tokens": 1418560} {"current_steps": 2460, "total_steps": 67140, "loss": 0.7928, "lr": 1.8312481382186476e-05, "epoch": 0.36639857015192134, "percentage": 3.66, "elapsed_time": "0:09:19", "remaining_time": "4:05:19", "throughput": 2539.53, "total_tokens": 1421664} {"current_steps": 2465, "total_steps": 67140, "loss": 0.8028, "lr": 1.8349717009234436e-05, "epoch": 0.36714328269288055, "percentage": 3.67, "elapsed_time": "0:09:20", "remaining_time": "4:05:17", "throughput": 2539.53, "total_tokens": 1424512} {"current_steps": 2470, "total_steps": 67140, "loss": 0.7821, "lr": 1.8386952636282396e-05, "epoch": 0.36788799523383975, "percentage": 3.68, "elapsed_time": "0:09:22", "remaining_time": "4:05:16", "throughput": 2539.51, "total_tokens": 1427392} {"current_steps": 2475, "total_steps": 67140, "loss": 0.7836, "lr": 1.8424188263330356e-05, "epoch": 0.36863270777479895, "percentage": 3.69, "elapsed_time": "0:09:23", "remaining_time": "4:05:14", "throughput": 2539.22, "total_tokens": 1430048} {"current_steps": 2480, "total_steps": 67140, "loss": 0.8589, "lr": 1.8461423890378315e-05, "epoch": 0.3693774203157581, "percentage": 3.69, "elapsed_time": "0:09:24", "remaining_time": "4:05:12", "throughput": 2538.98, "total_tokens": 1432704} {"current_steps": 2485, "total_steps": 67140, "loss": 0.8221, "lr": 1.8498659517426275e-05, "epoch": 0.3701221328567173, "percentage": 3.7, "elapsed_time": "0:09:25", "remaining_time": "4:05:10", "throughput": 2538.89, "total_tokens": 1435488} {"current_steps": 2490, "total_steps": 67140, "loss": 0.8163, "lr": 1.8535895144474232e-05, "epoch": 0.3708668453976765, "percentage": 3.71, "elapsed_time": "0:09:26", "remaining_time": "4:05:08", "throughput": 2538.64, "total_tokens": 1438176} {"current_steps": 2495, "total_steps": 67140, "loss": 0.8527, "lr": 1.857313077152219e-05, "epoch": 0.3716115579386357, "percentage": 3.72, "elapsed_time": "0:09:27", "remaining_time": "4:05:06", "throughput": 2538.39, "total_tokens": 1440800} {"current_steps": 2500, "total_steps": 67140, "loss": 0.8082, "lr": 1.8610366398570155e-05, "epoch": 0.37235627047959485, "percentage": 3.72, "elapsed_time": "0:09:28", "remaining_time": "4:05:05", "throughput": 2538.52, "total_tokens": 1443808} {"current_steps": 2505, "total_steps": 67140, "loss": 0.802, "lr": 1.8647602025618115e-05, "epoch": 0.37310098302055406, "percentage": 3.73, "elapsed_time": "0:09:29", "remaining_time": "4:05:04", "throughput": 2538.6, "total_tokens": 1446752} {"current_steps": 2510, "total_steps": 67140, "loss": 0.791, "lr": 1.868483765266607e-05, "epoch": 0.37384569556151326, "percentage": 3.74, "elapsed_time": "0:09:31", "remaining_time": "4:05:04", "throughput": 2538.74, "total_tokens": 1449792} {"current_steps": 2515, "total_steps": 67140, "loss": 0.79, "lr": 1.872207327971403e-05, "epoch": 0.37459040810247246, "percentage": 3.75, "elapsed_time": "0:09:32", "remaining_time": "4:05:03", "throughput": 2538.73, "total_tokens": 1452672} {"current_steps": 2520, "total_steps": 67140, "loss": 0.8412, "lr": 1.875930890676199e-05, "epoch": 0.3753351206434316, "percentage": 3.75, "elapsed_time": "0:09:33", "remaining_time": "4:05:01", "throughput": 2538.67, "total_tokens": 1455456} {"current_steps": 2525, "total_steps": 67140, "loss": 0.8189, "lr": 1.879654453380995e-05, "epoch": 0.3760798331843908, "percentage": 3.76, "elapsed_time": "0:09:34", "remaining_time": "4:04:59", "throughput": 2538.55, "total_tokens": 1458208} {"current_steps": 2530, "total_steps": 67140, "loss": 0.8245, "lr": 1.8833780160857907e-05, "epoch": 0.37682454572535, "percentage": 3.77, "elapsed_time": "0:09:35", "remaining_time": "4:04:58", "throughput": 2538.47, "total_tokens": 1461024} {"current_steps": 2535, "total_steps": 67140, "loss": 0.8051, "lr": 1.8871015787905867e-05, "epoch": 0.3775692582663092, "percentage": 3.78, "elapsed_time": "0:09:36", "remaining_time": "4:04:56", "throughput": 2538.33, "total_tokens": 1463776} {"current_steps": 2540, "total_steps": 67140, "loss": 0.8204, "lr": 1.890825141495383e-05, "epoch": 0.3783139708072684, "percentage": 3.78, "elapsed_time": "0:09:37", "remaining_time": "4:04:55", "throughput": 2538.36, "total_tokens": 1466688} {"current_steps": 2545, "total_steps": 67140, "loss": 0.7153, "lr": 1.894548704200179e-05, "epoch": 0.37905868334822757, "percentage": 3.79, "elapsed_time": "0:09:38", "remaining_time": "4:04:54", "throughput": 2538.3, "total_tokens": 1469536} {"current_steps": 2550, "total_steps": 67140, "loss": 0.9849, "lr": 1.898272266904975e-05, "epoch": 0.37980339588918677, "percentage": 3.8, "elapsed_time": "0:09:40", "remaining_time": "4:04:51", "throughput": 2537.94, "total_tokens": 1472096} {"current_steps": 2555, "total_steps": 67140, "loss": 1.1735, "lr": 1.9019958296097706e-05, "epoch": 0.38054810843014597, "percentage": 3.81, "elapsed_time": "0:09:41", "remaining_time": "4:04:51", "throughput": 2537.95, "total_tokens": 1475008} {"current_steps": 2560, "total_steps": 67140, "loss": 0.9002, "lr": 1.9057193923145666e-05, "epoch": 0.3812928209711052, "percentage": 3.81, "elapsed_time": "0:09:42", "remaining_time": "4:04:49", "throughput": 2537.66, "total_tokens": 1477664} {"current_steps": 2565, "total_steps": 67140, "loss": 0.8423, "lr": 1.9094429550193626e-05, "epoch": 0.3820375335120643, "percentage": 3.82, "elapsed_time": "0:09:43", "remaining_time": "4:04:47", "throughput": 2537.73, "total_tokens": 1480576} {"current_steps": 2570, "total_steps": 67140, "loss": 0.8087, "lr": 1.9131665177241586e-05, "epoch": 0.3827822460530235, "percentage": 3.83, "elapsed_time": "0:09:44", "remaining_time": "4:04:46", "throughput": 2537.82, "total_tokens": 1483488} {"current_steps": 2575, "total_steps": 67140, "loss": 0.8138, "lr": 1.9168900804289542e-05, "epoch": 0.3835269585939827, "percentage": 3.84, "elapsed_time": "0:09:45", "remaining_time": "4:04:45", "throughput": 2537.86, "total_tokens": 1486368} {"current_steps": 2580, "total_steps": 67140, "loss": 0.818, "lr": 1.9206136431337506e-05, "epoch": 0.38427167113494193, "percentage": 3.84, "elapsed_time": "0:09:46", "remaining_time": "4:04:44", "throughput": 2537.78, "total_tokens": 1489216} {"current_steps": 2585, "total_steps": 67140, "loss": 0.8128, "lr": 1.9243372058385466e-05, "epoch": 0.3850163836759011, "percentage": 3.85, "elapsed_time": "0:09:47", "remaining_time": "4:04:42", "throughput": 2537.74, "total_tokens": 1492032} {"current_steps": 2590, "total_steps": 67140, "loss": 0.7771, "lr": 1.9280607685433425e-05, "epoch": 0.3857610962168603, "percentage": 3.86, "elapsed_time": "0:09:49", "remaining_time": "4:04:40", "throughput": 2537.59, "total_tokens": 1494784} {"current_steps": 2595, "total_steps": 67140, "loss": 0.7263, "lr": 1.9317843312481382e-05, "epoch": 0.3865058087578195, "percentage": 3.87, "elapsed_time": "0:09:50", "remaining_time": "4:04:40", "throughput": 2537.82, "total_tokens": 1497856} {"current_steps": 2600, "total_steps": 67140, "loss": 1.0673, "lr": 1.9355078939529342e-05, "epoch": 0.3872505212987787, "percentage": 3.87, "elapsed_time": "0:09:51", "remaining_time": "4:04:38", "throughput": 2537.55, "total_tokens": 1500512} {"current_steps": 2605, "total_steps": 67140, "loss": 1.0956, "lr": 1.93923145665773e-05, "epoch": 0.3879952338397379, "percentage": 3.88, "elapsed_time": "0:09:52", "remaining_time": "4:04:36", "throughput": 2537.53, "total_tokens": 1503328} {"current_steps": 2610, "total_steps": 67140, "loss": 1.0844, "lr": 1.942955019362526e-05, "epoch": 0.38873994638069703, "percentage": 3.89, "elapsed_time": "0:09:53", "remaining_time": "4:04:35", "throughput": 2537.29, "total_tokens": 1506016} {"current_steps": 2615, "total_steps": 67140, "loss": 1.2134, "lr": 1.946678582067322e-05, "epoch": 0.38948465892165623, "percentage": 3.89, "elapsed_time": "0:09:54", "remaining_time": "4:04:33", "throughput": 2537.15, "total_tokens": 1508736} {"current_steps": 2620, "total_steps": 67140, "loss": 0.8445, "lr": 1.950402144772118e-05, "epoch": 0.39022937146261544, "percentage": 3.9, "elapsed_time": "0:09:56", "remaining_time": "4:04:38", "throughput": 2538.24, "total_tokens": 1512896} {"current_steps": 2625, "total_steps": 67140, "loss": 0.8305, "lr": 1.954125707476914e-05, "epoch": 0.39097408400357464, "percentage": 3.91, "elapsed_time": "0:09:57", "remaining_time": "4:04:36", "throughput": 2538.18, "total_tokens": 1515712} {"current_steps": 2630, "total_steps": 67140, "loss": 0.8257, "lr": 1.95784927018171e-05, "epoch": 0.3917187965445338, "percentage": 3.92, "elapsed_time": "0:09:58", "remaining_time": "4:04:35", "throughput": 2538.17, "total_tokens": 1518560} {"current_steps": 2635, "total_steps": 67140, "loss": 0.8286, "lr": 1.961572832886506e-05, "epoch": 0.392463509085493, "percentage": 3.92, "elapsed_time": "0:09:59", "remaining_time": "4:04:34", "throughput": 2538.25, "total_tokens": 1521536} {"current_steps": 2640, "total_steps": 67140, "loss": 0.824, "lr": 1.9652963955913017e-05, "epoch": 0.3932082216264522, "percentage": 3.93, "elapsed_time": "0:10:00", "remaining_time": "4:04:34", "throughput": 2538.31, "total_tokens": 1524544} {"current_steps": 2645, "total_steps": 67140, "loss": 0.8159, "lr": 1.9690199582960977e-05, "epoch": 0.3939529341674114, "percentage": 3.94, "elapsed_time": "0:10:01", "remaining_time": "4:04:34", "throughput": 2538.65, "total_tokens": 1527744} {"current_steps": 2650, "total_steps": 67140, "loss": 0.8089, "lr": 1.9727435210008937e-05, "epoch": 0.39469764670837054, "percentage": 3.95, "elapsed_time": "0:10:02", "remaining_time": "4:04:32", "throughput": 2538.61, "total_tokens": 1530592} {"current_steps": 2655, "total_steps": 67140, "loss": 0.8022, "lr": 1.9764670837056897e-05, "epoch": 0.39544235924932974, "percentage": 3.95, "elapsed_time": "0:10:04", "remaining_time": "4:04:31", "throughput": 2538.69, "total_tokens": 1533568} {"current_steps": 2660, "total_steps": 67140, "loss": 0.8653, "lr": 1.9801906464104857e-05, "epoch": 0.39618707179028895, "percentage": 3.96, "elapsed_time": "0:10:05", "remaining_time": "4:04:30", "throughput": 2538.79, "total_tokens": 1536512} {"current_steps": 2665, "total_steps": 67140, "loss": 0.8423, "lr": 1.9839142091152816e-05, "epoch": 0.39693178433124815, "percentage": 3.97, "elapsed_time": "0:10:06", "remaining_time": "4:04:30", "throughput": 2538.91, "total_tokens": 1539520} {"current_steps": 2670, "total_steps": 67140, "loss": 0.8154, "lr": 1.9876377718200776e-05, "epoch": 0.39767649687220735, "percentage": 3.98, "elapsed_time": "0:10:07", "remaining_time": "4:04:29", "throughput": 2538.98, "total_tokens": 1542464} {"current_steps": 2675, "total_steps": 67140, "loss": 0.7289, "lr": 1.9913613345248736e-05, "epoch": 0.3984212094131665, "percentage": 3.98, "elapsed_time": "0:10:08", "remaining_time": "4:04:27", "throughput": 2539.02, "total_tokens": 1545344} {"current_steps": 2680, "total_steps": 67140, "loss": 0.7757, "lr": 1.9950848972296696e-05, "epoch": 0.3991659219541257, "percentage": 3.99, "elapsed_time": "0:10:09", "remaining_time": "4:04:26", "throughput": 2539.06, "total_tokens": 1548256} {"current_steps": 2685, "total_steps": 67140, "loss": 0.8067, "lr": 1.9988084599344652e-05, "epoch": 0.3999106344950849, "percentage": 4.0, "elapsed_time": "0:10:10", "remaining_time": "4:04:26", "throughput": 2539.22, "total_tokens": 1551328} {"current_steps": 2690, "total_steps": 67140, "loss": 0.9948, "lr": 2.0025320226392612e-05, "epoch": 0.4006553470360441, "percentage": 4.01, "elapsed_time": "0:10:12", "remaining_time": "4:04:24", "throughput": 2539.07, "total_tokens": 1554048} {"current_steps": 2695, "total_steps": 67140, "loss": 0.8306, "lr": 2.0062555853440572e-05, "epoch": 0.40140005957700325, "percentage": 4.01, "elapsed_time": "0:10:13", "remaining_time": "4:04:22", "throughput": 2538.81, "total_tokens": 1556704} {"current_steps": 2700, "total_steps": 67140, "loss": 0.8198, "lr": 2.0099791480488532e-05, "epoch": 0.40214477211796246, "percentage": 4.02, "elapsed_time": "0:10:14", "remaining_time": "4:04:21", "throughput": 2538.9, "total_tokens": 1559680} {"current_steps": 2705, "total_steps": 67140, "loss": 0.8041, "lr": 2.0137027107536492e-05, "epoch": 0.40288948465892166, "percentage": 4.03, "elapsed_time": "0:10:15", "remaining_time": "4:04:20", "throughput": 2538.77, "total_tokens": 1562464} {"current_steps": 2710, "total_steps": 67140, "loss": 0.8012, "lr": 2.0174262734584452e-05, "epoch": 0.40363419719988086, "percentage": 4.04, "elapsed_time": "0:10:16", "remaining_time": "4:04:19", "throughput": 2538.82, "total_tokens": 1565376} {"current_steps": 2715, "total_steps": 67140, "loss": 0.7979, "lr": 2.021149836163241e-05, "epoch": 0.40437890974084, "percentage": 4.04, "elapsed_time": "0:10:17", "remaining_time": "4:04:17", "throughput": 2538.81, "total_tokens": 1568256} {"current_steps": 2720, "total_steps": 67140, "loss": 0.8219, "lr": 2.024873398868037e-05, "epoch": 0.4051236222817992, "percentage": 4.05, "elapsed_time": "0:10:18", "remaining_time": "4:04:17", "throughput": 2539.09, "total_tokens": 1571424} {"current_steps": 2725, "total_steps": 67140, "loss": 0.7847, "lr": 2.0285969615728328e-05, "epoch": 0.4058683348227584, "percentage": 4.06, "elapsed_time": "0:10:19", "remaining_time": "4:04:15", "throughput": 2538.96, "total_tokens": 1574112} {"current_steps": 2730, "total_steps": 67140, "loss": 0.8211, "lr": 2.0323205242776288e-05, "epoch": 0.4066130473637176, "percentage": 4.07, "elapsed_time": "0:10:21", "remaining_time": "4:04:14", "throughput": 2538.97, "total_tokens": 1577024} {"current_steps": 2735, "total_steps": 67140, "loss": 0.7901, "lr": 2.0360440869824248e-05, "epoch": 0.4073577599046768, "percentage": 4.07, "elapsed_time": "0:10:22", "remaining_time": "4:04:13", "throughput": 2538.84, "total_tokens": 1579808} {"current_steps": 2740, "total_steps": 67140, "loss": 0.83, "lr": 2.0397676496872207e-05, "epoch": 0.40810247244563597, "percentage": 4.08, "elapsed_time": "0:10:23", "remaining_time": "4:04:12", "throughput": 2538.91, "total_tokens": 1582752} {"current_steps": 2745, "total_steps": 67140, "loss": 0.7893, "lr": 2.043491212392017e-05, "epoch": 0.40884718498659517, "percentage": 4.09, "elapsed_time": "0:10:24", "remaining_time": "4:04:11", "throughput": 2539.0, "total_tokens": 1585728} {"current_steps": 2750, "total_steps": 67140, "loss": 0.8043, "lr": 2.0472147750968127e-05, "epoch": 0.40959189752755437, "percentage": 4.1, "elapsed_time": "0:10:25", "remaining_time": "4:04:09", "throughput": 2538.91, "total_tokens": 1588480} {"current_steps": 2755, "total_steps": 67140, "loss": 0.8264, "lr": 2.0509383378016087e-05, "epoch": 0.4103366100685136, "percentage": 4.1, "elapsed_time": "0:10:26", "remaining_time": "4:04:09", "throughput": 2539.18, "total_tokens": 1591680} {"current_steps": 2760, "total_steps": 67140, "loss": 0.8289, "lr": 2.0546619005064047e-05, "epoch": 0.4110813226094727, "percentage": 4.11, "elapsed_time": "0:10:27", "remaining_time": "4:04:08", "throughput": 2539.13, "total_tokens": 1594496} {"current_steps": 2765, "total_steps": 67140, "loss": 0.8149, "lr": 2.0583854632112007e-05, "epoch": 0.4118260351504319, "percentage": 4.12, "elapsed_time": "0:10:29", "remaining_time": "4:04:06", "throughput": 2539.17, "total_tokens": 1597408} {"current_steps": 2770, "total_steps": 67140, "loss": 0.818, "lr": 2.0621090259159963e-05, "epoch": 0.4125707476913911, "percentage": 4.13, "elapsed_time": "0:10:30", "remaining_time": "4:04:05", "throughput": 2539.16, "total_tokens": 1600288} {"current_steps": 2775, "total_steps": 67140, "loss": 0.8214, "lr": 2.0658325886207923e-05, "epoch": 0.41331546023235033, "percentage": 4.13, "elapsed_time": "0:10:31", "remaining_time": "4:04:04", "throughput": 2539.18, "total_tokens": 1603200} {"current_steps": 2780, "total_steps": 67140, "loss": 0.7981, "lr": 2.0695561513255883e-05, "epoch": 0.4140601727733095, "percentage": 4.14, "elapsed_time": "0:10:32", "remaining_time": "4:04:03", "throughput": 2539.25, "total_tokens": 1606144} {"current_steps": 2785, "total_steps": 67140, "loss": 0.7929, "lr": 2.0732797140303846e-05, "epoch": 0.4148048853142687, "percentage": 4.15, "elapsed_time": "0:10:33", "remaining_time": "4:04:02", "throughput": 2539.38, "total_tokens": 1609152} {"current_steps": 2790, "total_steps": 67140, "loss": 0.7985, "lr": 2.0770032767351803e-05, "epoch": 0.4155495978552279, "percentage": 4.16, "elapsed_time": "0:10:34", "remaining_time": "4:04:01", "throughput": 2539.57, "total_tokens": 1612192} {"current_steps": 2795, "total_steps": 67140, "loss": 0.8087, "lr": 2.0807268394399762e-05, "epoch": 0.4162943103961871, "percentage": 4.16, "elapsed_time": "0:10:35", "remaining_time": "4:04:00", "throughput": 2539.47, "total_tokens": 1614944} {"current_steps": 2800, "total_steps": 67140, "loss": 0.7982, "lr": 2.0844504021447722e-05, "epoch": 0.4170390229371463, "percentage": 4.17, "elapsed_time": "0:10:37", "remaining_time": "4:03:58", "throughput": 2539.53, "total_tokens": 1617856} {"current_steps": 2805, "total_steps": 67140, "loss": 0.7835, "lr": 2.0881739648495682e-05, "epoch": 0.41778373547810543, "percentage": 4.18, "elapsed_time": "0:10:38", "remaining_time": "4:03:58", "throughput": 2539.72, "total_tokens": 1620928} {"current_steps": 2810, "total_steps": 67140, "loss": 0.7978, "lr": 2.0918975275543642e-05, "epoch": 0.41852844801906464, "percentage": 4.19, "elapsed_time": "0:10:39", "remaining_time": "4:03:56", "throughput": 2539.69, "total_tokens": 1623744} {"current_steps": 2815, "total_steps": 67140, "loss": 0.8482, "lr": 2.09562109025916e-05, "epoch": 0.41927316056002384, "percentage": 4.19, "elapsed_time": "0:10:40", "remaining_time": "4:03:55", "throughput": 2539.77, "total_tokens": 1626720} {"current_steps": 2820, "total_steps": 67140, "loss": 0.8709, "lr": 2.099344652963956e-05, "epoch": 0.42001787310098304, "percentage": 4.2, "elapsed_time": "0:10:41", "remaining_time": "4:03:55", "throughput": 2539.82, "total_tokens": 1629696} {"current_steps": 2825, "total_steps": 67140, "loss": 0.843, "lr": 2.103068215668752e-05, "epoch": 0.4207625856419422, "percentage": 4.21, "elapsed_time": "0:10:42", "remaining_time": "4:03:53", "throughput": 2539.66, "total_tokens": 1632416} {"current_steps": 2830, "total_steps": 67140, "loss": 0.7854, "lr": 2.106791778373548e-05, "epoch": 0.4215072981829014, "percentage": 4.22, "elapsed_time": "0:10:43", "remaining_time": "4:03:51", "throughput": 2539.54, "total_tokens": 1635168} {"current_steps": 2835, "total_steps": 67140, "loss": 0.7903, "lr": 2.1105153410783438e-05, "epoch": 0.4222520107238606, "percentage": 4.22, "elapsed_time": "0:10:44", "remaining_time": "4:03:49", "throughput": 2539.26, "total_tokens": 1637760} {"current_steps": 2840, "total_steps": 67140, "loss": 0.8039, "lr": 2.1142389037831398e-05, "epoch": 0.4229967232648198, "percentage": 4.23, "elapsed_time": "0:10:46", "remaining_time": "4:03:47", "throughput": 2539.13, "total_tokens": 1640480} {"current_steps": 2845, "total_steps": 67140, "loss": 0.8519, "lr": 2.1179624664879358e-05, "epoch": 0.42374143580577894, "percentage": 4.24, "elapsed_time": "0:10:47", "remaining_time": "4:03:46", "throughput": 2539.01, "total_tokens": 1643232} {"current_steps": 2850, "total_steps": 67140, "loss": 0.7222, "lr": 2.1216860291927317e-05, "epoch": 0.42448614834673815, "percentage": 4.24, "elapsed_time": "0:10:48", "remaining_time": "4:03:44", "throughput": 2539.16, "total_tokens": 1646208} {"current_steps": 2855, "total_steps": 67140, "loss": 0.978, "lr": 2.1254095918975274e-05, "epoch": 0.42523086088769735, "percentage": 4.25, "elapsed_time": "0:10:49", "remaining_time": "4:03:43", "throughput": 2538.91, "total_tokens": 1648864} {"current_steps": 2860, "total_steps": 67140, "loss": 0.8888, "lr": 2.1291331546023234e-05, "epoch": 0.42597557342865655, "percentage": 4.26, "elapsed_time": "0:10:50", "remaining_time": "4:03:41", "throughput": 2538.82, "total_tokens": 1651648} {"current_steps": 2865, "total_steps": 67140, "loss": 0.8909, "lr": 2.1328567173071197e-05, "epoch": 0.42672028596961575, "percentage": 4.27, "elapsed_time": "0:10:51", "remaining_time": "4:03:39", "throughput": 2538.58, "total_tokens": 1654272} {"current_steps": 2870, "total_steps": 67140, "loss": 0.8107, "lr": 2.1365802800119157e-05, "epoch": 0.4274649985105749, "percentage": 4.27, "elapsed_time": "0:10:52", "remaining_time": "4:03:38", "throughput": 2538.74, "total_tokens": 1657280} {"current_steps": 2875, "total_steps": 67140, "loss": 0.8155, "lr": 2.1403038427167117e-05, "epoch": 0.4282097110515341, "percentage": 4.28, "elapsed_time": "0:10:53", "remaining_time": "4:03:36", "throughput": 2538.62, "total_tokens": 1660000} {"current_steps": 2880, "total_steps": 67140, "loss": 0.772, "lr": 2.1440274054215073e-05, "epoch": 0.4289544235924933, "percentage": 4.29, "elapsed_time": "0:10:55", "remaining_time": "4:03:35", "throughput": 2538.61, "total_tokens": 1662880} {"current_steps": 2885, "total_steps": 67140, "loss": 0.7775, "lr": 2.1477509681263033e-05, "epoch": 0.4296991361334525, "percentage": 4.3, "elapsed_time": "0:10:56", "remaining_time": "4:03:34", "throughput": 2538.64, "total_tokens": 1665760} {"current_steps": 2890, "total_steps": 67140, "loss": 0.939, "lr": 2.1514745308310993e-05, "epoch": 0.43044384867441166, "percentage": 4.3, "elapsed_time": "0:10:57", "remaining_time": "4:03:33", "throughput": 2538.62, "total_tokens": 1668640} {"current_steps": 2895, "total_steps": 67140, "loss": 0.887, "lr": 2.1551980935358953e-05, "epoch": 0.43118856121537086, "percentage": 4.31, "elapsed_time": "0:10:58", "remaining_time": "4:03:32", "throughput": 2538.62, "total_tokens": 1671552} {"current_steps": 2900, "total_steps": 67140, "loss": 1.0482, "lr": 2.1589216562406913e-05, "epoch": 0.43193327375633006, "percentage": 4.32, "elapsed_time": "0:10:59", "remaining_time": "4:03:31", "throughput": 2538.6, "total_tokens": 1674432} {"current_steps": 2905, "total_steps": 67140, "loss": 0.8411, "lr": 2.1626452189454872e-05, "epoch": 0.43267798629728926, "percentage": 4.33, "elapsed_time": "0:11:00", "remaining_time": "4:03:29", "throughput": 2538.5, "total_tokens": 1677248} {"current_steps": 2910, "total_steps": 67140, "loss": 0.8101, "lr": 2.1663687816502832e-05, "epoch": 0.4334226988382484, "percentage": 4.33, "elapsed_time": "0:11:01", "remaining_time": "4:03:28", "throughput": 2538.46, "total_tokens": 1680064} {"current_steps": 2915, "total_steps": 67140, "loss": 0.819, "lr": 2.1700923443550792e-05, "epoch": 0.4341674113792076, "percentage": 4.34, "elapsed_time": "0:11:02", "remaining_time": "4:03:27", "throughput": 2538.33, "total_tokens": 1682848} {"current_steps": 2920, "total_steps": 67140, "loss": 0.8216, "lr": 2.173815907059875e-05, "epoch": 0.4349121239201668, "percentage": 4.35, "elapsed_time": "0:11:04", "remaining_time": "4:03:26", "throughput": 2538.35, "total_tokens": 1685792} {"current_steps": 2925, "total_steps": 67140, "loss": 0.8134, "lr": 2.177539469764671e-05, "epoch": 0.435656836461126, "percentage": 4.36, "elapsed_time": "0:11:05", "remaining_time": "4:03:24", "throughput": 2538.15, "total_tokens": 1688448} {"current_steps": 2930, "total_steps": 67140, "loss": 0.8206, "lr": 2.1812630324694668e-05, "epoch": 0.4364015490020852, "percentage": 4.36, "elapsed_time": "0:11:06", "remaining_time": "4:03:23", "throughput": 2538.13, "total_tokens": 1691328} {"current_steps": 2935, "total_steps": 67140, "loss": 0.8053, "lr": 2.1849865951742628e-05, "epoch": 0.43714626154304437, "percentage": 4.37, "elapsed_time": "0:11:07", "remaining_time": "4:03:22", "throughput": 2538.3, "total_tokens": 1694336} {"current_steps": 2940, "total_steps": 67140, "loss": 0.8074, "lr": 2.1887101578790588e-05, "epoch": 0.43789097408400357, "percentage": 4.38, "elapsed_time": "0:11:08", "remaining_time": "4:03:20", "throughput": 2538.14, "total_tokens": 1697056} {"current_steps": 2945, "total_steps": 67140, "loss": 0.8099, "lr": 2.1924337205838548e-05, "epoch": 0.4386356866249628, "percentage": 4.39, "elapsed_time": "0:11:09", "remaining_time": "4:03:18", "throughput": 2538.02, "total_tokens": 1699808} {"current_steps": 2950, "total_steps": 67140, "loss": 0.7736, "lr": 2.1961572832886508e-05, "epoch": 0.439380399165922, "percentage": 4.39, "elapsed_time": "0:11:10", "remaining_time": "4:03:18", "throughput": 2538.11, "total_tokens": 1702848} {"current_steps": 2955, "total_steps": 67140, "loss": 0.7975, "lr": 2.1998808459934468e-05, "epoch": 0.4401251117068811, "percentage": 4.4, "elapsed_time": "0:11:12", "remaining_time": "4:03:17", "throughput": 2538.06, "total_tokens": 1705696} {"current_steps": 2960, "total_steps": 67140, "loss": 0.7947, "lr": 2.2036044086982427e-05, "epoch": 0.4408698242478403, "percentage": 4.41, "elapsed_time": "0:11:13", "remaining_time": "4:03:16", "throughput": 2538.09, "total_tokens": 1708576} {"current_steps": 2965, "total_steps": 67140, "loss": 0.7549, "lr": 2.2073279714030384e-05, "epoch": 0.4416145367887995, "percentage": 4.42, "elapsed_time": "0:11:14", "remaining_time": "4:03:14", "throughput": 2538.01, "total_tokens": 1711328} {"current_steps": 2970, "total_steps": 67140, "loss": 0.8116, "lr": 2.2110515341078344e-05, "epoch": 0.44235924932975873, "percentage": 4.42, "elapsed_time": "0:11:15", "remaining_time": "4:03:13", "throughput": 2538.19, "total_tokens": 1714368} {"current_steps": 2975, "total_steps": 67140, "loss": 0.8477, "lr": 2.2147750968126304e-05, "epoch": 0.4431039618707179, "percentage": 4.43, "elapsed_time": "0:11:16", "remaining_time": "4:03:12", "throughput": 2538.21, "total_tokens": 1717248} {"current_steps": 2980, "total_steps": 67140, "loss": 0.8349, "lr": 2.2184986595174263e-05, "epoch": 0.4438486744116771, "percentage": 4.44, "elapsed_time": "0:11:17", "remaining_time": "4:03:11", "throughput": 2538.47, "total_tokens": 1720384} {"current_steps": 2985, "total_steps": 67140, "loss": 0.802, "lr": 2.2222222222222223e-05, "epoch": 0.4445933869526363, "percentage": 4.45, "elapsed_time": "0:11:18", "remaining_time": "4:03:10", "throughput": 2538.63, "total_tokens": 1723360} {"current_steps": 2990, "total_steps": 67140, "loss": 0.8091, "lr": 2.2259457849270183e-05, "epoch": 0.4453380994935955, "percentage": 4.45, "elapsed_time": "0:11:19", "remaining_time": "4:03:08", "throughput": 2538.3, "total_tokens": 1725920} {"current_steps": 2995, "total_steps": 67140, "loss": 0.7513, "lr": 2.2296693476318143e-05, "epoch": 0.4460828120345547, "percentage": 4.46, "elapsed_time": "0:11:21", "remaining_time": "4:03:06", "throughput": 2538.23, "total_tokens": 1728672} {"current_steps": 3000, "total_steps": 67140, "loss": 0.825, "lr": 2.2333929103366103e-05, "epoch": 0.44682752457551383, "percentage": 4.47, "elapsed_time": "0:11:22", "remaining_time": "4:03:04", "throughput": 2538.17, "total_tokens": 1731488} {"current_steps": 3005, "total_steps": 67140, "loss": 0.851, "lr": 2.2371164730414063e-05, "epoch": 0.44757223711647304, "percentage": 4.48, "elapsed_time": "0:11:23", "remaining_time": "4:03:04", "throughput": 2538.28, "total_tokens": 1734496} {"current_steps": 3010, "total_steps": 67140, "loss": 0.8375, "lr": 2.240840035746202e-05, "epoch": 0.44831694965743224, "percentage": 4.48, "elapsed_time": "0:11:24", "remaining_time": "4:03:03", "throughput": 2538.25, "total_tokens": 1737408} {"current_steps": 3015, "total_steps": 67140, "loss": 0.7872, "lr": 2.244563598450998e-05, "epoch": 0.44906166219839144, "percentage": 4.49, "elapsed_time": "0:11:25", "remaining_time": "4:03:01", "throughput": 2538.1, "total_tokens": 1740096} {"current_steps": 3020, "total_steps": 67140, "loss": 0.7825, "lr": 2.248287161155794e-05, "epoch": 0.4498063747393506, "percentage": 4.5, "elapsed_time": "0:11:26", "remaining_time": "4:02:59", "throughput": 2537.88, "total_tokens": 1742688} {"current_steps": 3025, "total_steps": 67140, "loss": 0.8149, "lr": 2.25201072386059e-05, "epoch": 0.4505510872803098, "percentage": 4.51, "elapsed_time": "0:11:27", "remaining_time": "4:02:58", "throughput": 2538.03, "total_tokens": 1745760} {"current_steps": 3030, "total_steps": 67140, "loss": 0.8057, "lr": 2.255734286565386e-05, "epoch": 0.451295799821269, "percentage": 4.51, "elapsed_time": "0:11:28", "remaining_time": "4:02:58", "throughput": 2538.13, "total_tokens": 1748768} {"current_steps": 3035, "total_steps": 67140, "loss": 0.8026, "lr": 2.259457849270182e-05, "epoch": 0.4520405123622282, "percentage": 4.52, "elapsed_time": "0:11:30", "remaining_time": "4:02:57", "throughput": 2538.12, "total_tokens": 1751680} {"current_steps": 3040, "total_steps": 67140, "loss": 0.8169, "lr": 2.2631814119749778e-05, "epoch": 0.45278522490318734, "percentage": 4.53, "elapsed_time": "0:11:31", "remaining_time": "4:02:56", "throughput": 2538.03, "total_tokens": 1754496} {"current_steps": 3045, "total_steps": 67140, "loss": 0.8415, "lr": 2.2669049746797738e-05, "epoch": 0.45352993744414655, "percentage": 4.54, "elapsed_time": "0:11:32", "remaining_time": "4:02:53", "throughput": 2537.71, "total_tokens": 1757024} {"current_steps": 3050, "total_steps": 67140, "loss": 0.7941, "lr": 2.2706285373845695e-05, "epoch": 0.45427464998510575, "percentage": 4.54, "elapsed_time": "0:11:33", "remaining_time": "4:02:52", "throughput": 2537.78, "total_tokens": 1759936} {"current_steps": 3055, "total_steps": 67140, "loss": 0.7864, "lr": 2.2743521000893654e-05, "epoch": 0.45501936252606495, "percentage": 4.55, "elapsed_time": "0:11:34", "remaining_time": "4:02:51", "throughput": 2537.89, "total_tokens": 1762880} {"current_steps": 3060, "total_steps": 67140, "loss": 0.7976, "lr": 2.2780756627941614e-05, "epoch": 0.45576407506702415, "percentage": 4.56, "elapsed_time": "0:11:35", "remaining_time": "4:02:51", "throughput": 2537.99, "total_tokens": 1765952} {"current_steps": 3065, "total_steps": 67140, "loss": 0.7689, "lr": 2.2817992254989574e-05, "epoch": 0.4565087876079833, "percentage": 4.57, "elapsed_time": "0:11:36", "remaining_time": "4:02:49", "throughput": 2537.9, "total_tokens": 1768704} {"current_steps": 3070, "total_steps": 67140, "loss": 0.7909, "lr": 2.2855227882037537e-05, "epoch": 0.4572535001489425, "percentage": 4.57, "elapsed_time": "0:11:38", "remaining_time": "4:02:47", "throughput": 2537.83, "total_tokens": 1771488} {"current_steps": 3075, "total_steps": 67140, "loss": 0.8151, "lr": 2.2892463509085494e-05, "epoch": 0.4579982126899017, "percentage": 4.58, "elapsed_time": "0:11:39", "remaining_time": "4:02:47", "throughput": 2538.04, "total_tokens": 1774624} {"current_steps": 3080, "total_steps": 67140, "loss": 0.8575, "lr": 2.2929699136133454e-05, "epoch": 0.4587429252308609, "percentage": 4.59, "elapsed_time": "0:11:40", "remaining_time": "4:02:47", "throughput": 2538.21, "total_tokens": 1777728} {"current_steps": 3085, "total_steps": 67140, "loss": 0.8042, "lr": 2.2966934763181414e-05, "epoch": 0.45948763777182006, "percentage": 4.59, "elapsed_time": "0:11:41", "remaining_time": "4:02:45", "throughput": 2538.26, "total_tokens": 1780640} {"current_steps": 3090, "total_steps": 67140, "loss": 0.8787, "lr": 2.3004170390229373e-05, "epoch": 0.46023235031277926, "percentage": 4.6, "elapsed_time": "0:11:42", "remaining_time": "4:02:44", "throughput": 2538.29, "total_tokens": 1783520} {"current_steps": 3095, "total_steps": 67140, "loss": 0.785, "lr": 2.304140601727733e-05, "epoch": 0.46097706285373846, "percentage": 4.61, "elapsed_time": "0:11:43", "remaining_time": "4:02:42", "throughput": 2538.17, "total_tokens": 1786240} {"current_steps": 3100, "total_steps": 67140, "loss": 0.8045, "lr": 2.307864164432529e-05, "epoch": 0.46172177539469766, "percentage": 4.62, "elapsed_time": "0:11:44", "remaining_time": "4:02:41", "throughput": 2538.23, "total_tokens": 1789184} {"current_steps": 3105, "total_steps": 67140, "loss": 0.8292, "lr": 2.3115877271373253e-05, "epoch": 0.4624664879356568, "percentage": 4.62, "elapsed_time": "0:11:46", "remaining_time": "4:02:40", "throughput": 2538.16, "total_tokens": 1791968} {"current_steps": 3110, "total_steps": 67140, "loss": 0.8058, "lr": 2.3153112898421213e-05, "epoch": 0.463211200476616, "percentage": 4.63, "elapsed_time": "0:11:47", "remaining_time": "4:02:39", "throughput": 2538.1, "total_tokens": 1794816} {"current_steps": 3115, "total_steps": 67140, "loss": 0.8127, "lr": 2.319034852546917e-05, "epoch": 0.4639559130175752, "percentage": 4.64, "elapsed_time": "0:11:48", "remaining_time": "4:02:37", "throughput": 2538.14, "total_tokens": 1797696} {"current_steps": 3120, "total_steps": 67140, "loss": 0.8214, "lr": 2.322758415251713e-05, "epoch": 0.4647006255585344, "percentage": 4.65, "elapsed_time": "0:11:49", "remaining_time": "4:02:36", "throughput": 2538.21, "total_tokens": 1800640} {"current_steps": 3125, "total_steps": 67140, "loss": 0.8343, "lr": 2.326481977956509e-05, "epoch": 0.4654453380994936, "percentage": 4.65, "elapsed_time": "0:11:50", "remaining_time": "4:02:35", "throughput": 2538.24, "total_tokens": 1803552} {"current_steps": 3130, "total_steps": 67140, "loss": 0.8078, "lr": 2.330205540661305e-05, "epoch": 0.46619005064045277, "percentage": 4.66, "elapsed_time": "0:11:51", "remaining_time": "4:02:34", "throughput": 2538.42, "total_tokens": 1806624} {"current_steps": 3135, "total_steps": 67140, "loss": 0.7926, "lr": 2.333929103366101e-05, "epoch": 0.46693476318141197, "percentage": 4.67, "elapsed_time": "0:11:52", "remaining_time": "4:02:34", "throughput": 2538.66, "total_tokens": 1809760} {"current_steps": 3140, "total_steps": 67140, "loss": 0.8006, "lr": 2.3376526660708965e-05, "epoch": 0.4676794757223712, "percentage": 4.68, "elapsed_time": "0:11:53", "remaining_time": "4:02:32", "throughput": 2538.61, "total_tokens": 1812544} {"current_steps": 3145, "total_steps": 67140, "loss": 0.8171, "lr": 2.341376228775693e-05, "epoch": 0.4684241882633304, "percentage": 4.68, "elapsed_time": "0:11:55", "remaining_time": "4:02:30", "throughput": 2538.32, "total_tokens": 1815072} {"current_steps": 3150, "total_steps": 67140, "loss": 0.8089, "lr": 2.3450997914804888e-05, "epoch": 0.4691689008042895, "percentage": 4.69, "elapsed_time": "0:11:56", "remaining_time": "4:02:28", "throughput": 2538.16, "total_tokens": 1817760} {"current_steps": 3155, "total_steps": 67140, "loss": 0.8073, "lr": 2.3488233541852848e-05, "epoch": 0.4699136133452487, "percentage": 4.7, "elapsed_time": "0:11:57", "remaining_time": "4:02:27", "throughput": 2538.04, "total_tokens": 1820512} {"current_steps": 3160, "total_steps": 67140, "loss": 0.81, "lr": 2.3525469168900805e-05, "epoch": 0.47065832588620793, "percentage": 4.71, "elapsed_time": "0:11:58", "remaining_time": "4:02:26", "throughput": 2538.45, "total_tokens": 1823808} {"current_steps": 3165, "total_steps": 67140, "loss": 0.7948, "lr": 2.3562704795948764e-05, "epoch": 0.47140303842716713, "percentage": 4.71, "elapsed_time": "0:11:59", "remaining_time": "4:02:25", "throughput": 2538.48, "total_tokens": 1826656} {"current_steps": 3170, "total_steps": 67140, "loss": 0.8306, "lr": 2.3599940422996724e-05, "epoch": 0.4721477509681263, "percentage": 4.72, "elapsed_time": "0:12:00", "remaining_time": "4:02:26", "throughput": 2539.12, "total_tokens": 1830304} {"current_steps": 3175, "total_steps": 67140, "loss": 0.8011, "lr": 2.3637176050044684e-05, "epoch": 0.4728924635090855, "percentage": 4.73, "elapsed_time": "0:12:02", "remaining_time": "4:02:25", "throughput": 2539.33, "total_tokens": 1833408} {"current_steps": 3180, "total_steps": 67140, "loss": 0.7885, "lr": 2.367441167709264e-05, "epoch": 0.4736371760500447, "percentage": 4.74, "elapsed_time": "0:12:03", "remaining_time": "4:02:24", "throughput": 2539.13, "total_tokens": 1836096} {"current_steps": 3185, "total_steps": 67140, "loss": 0.8015, "lr": 2.3711647304140604e-05, "epoch": 0.4743818885910039, "percentage": 4.74, "elapsed_time": "0:12:04", "remaining_time": "4:02:22", "throughput": 2539.12, "total_tokens": 1838912} {"current_steps": 3190, "total_steps": 67140, "loss": 0.7958, "lr": 2.3748882931188564e-05, "epoch": 0.4751266011319631, "percentage": 4.75, "elapsed_time": "0:12:05", "remaining_time": "4:02:21", "throughput": 2539.14, "total_tokens": 1841824} {"current_steps": 3195, "total_steps": 67140, "loss": 0.8026, "lr": 2.3786118558236524e-05, "epoch": 0.47587131367292224, "percentage": 4.76, "elapsed_time": "0:12:06", "remaining_time": "4:02:20", "throughput": 2539.2, "total_tokens": 1844800} {"current_steps": 3200, "total_steps": 67140, "loss": 0.8187, "lr": 2.3823354185284483e-05, "epoch": 0.47661602621388144, "percentage": 4.77, "elapsed_time": "0:12:07", "remaining_time": "4:02:19", "throughput": 2539.2, "total_tokens": 1847648} {"current_steps": 3205, "total_steps": 67140, "loss": 0.7782, "lr": 2.386058981233244e-05, "epoch": 0.47736073875484064, "percentage": 4.77, "elapsed_time": "0:12:08", "remaining_time": "4:02:17", "throughput": 2539.19, "total_tokens": 1850464} {"current_steps": 3210, "total_steps": 67140, "loss": 0.7974, "lr": 2.38978254393804e-05, "epoch": 0.47810545129579984, "percentage": 4.78, "elapsed_time": "0:12:09", "remaining_time": "4:02:15", "throughput": 2539.15, "total_tokens": 1853248} {"current_steps": 3215, "total_steps": 67140, "loss": 0.792, "lr": 2.393506106642836e-05, "epoch": 0.478850163836759, "percentage": 4.79, "elapsed_time": "0:12:10", "remaining_time": "4:02:14", "throughput": 2539.0, "total_tokens": 1856000} {"current_steps": 3220, "total_steps": 67140, "loss": 0.8005, "lr": 2.397229669347632e-05, "epoch": 0.4795948763777182, "percentage": 4.8, "elapsed_time": "0:12:12", "remaining_time": "4:02:13", "throughput": 2539.04, "total_tokens": 1858944} {"current_steps": 3225, "total_steps": 67140, "loss": 0.7765, "lr": 2.400953232052428e-05, "epoch": 0.4803395889186774, "percentage": 4.8, "elapsed_time": "0:12:13", "remaining_time": "4:02:13", "throughput": 2539.24, "total_tokens": 1862080} {"current_steps": 3230, "total_steps": 67140, "loss": 0.7977, "lr": 2.404676794757224e-05, "epoch": 0.4810843014596366, "percentage": 4.81, "elapsed_time": "0:12:14", "remaining_time": "4:02:12", "throughput": 2539.32, "total_tokens": 1865088} {"current_steps": 3235, "total_steps": 67140, "loss": 0.798, "lr": 2.40840035746202e-05, "epoch": 0.48182901400059575, "percentage": 4.82, "elapsed_time": "0:12:15", "remaining_time": "4:02:10", "throughput": 2538.94, "total_tokens": 1867552} {"current_steps": 3240, "total_steps": 67140, "loss": 0.8523, "lr": 2.412123920166816e-05, "epoch": 0.48257372654155495, "percentage": 4.83, "elapsed_time": "0:12:16", "remaining_time": "4:02:10", "throughput": 2539.24, "total_tokens": 1870784} {"current_steps": 3245, "total_steps": 67140, "loss": 0.8352, "lr": 2.4158474828716115e-05, "epoch": 0.48331843908251415, "percentage": 4.83, "elapsed_time": "0:12:17", "remaining_time": "4:02:09", "throughput": 2539.45, "total_tokens": 1873920} {"current_steps": 3250, "total_steps": 67140, "loss": 0.7789, "lr": 2.4195710455764075e-05, "epoch": 0.48406315162347335, "percentage": 4.84, "elapsed_time": "0:12:19", "remaining_time": "4:02:09", "throughput": 2539.68, "total_tokens": 1877056} {"current_steps": 3255, "total_steps": 67140, "loss": 0.817, "lr": 2.4232946082812035e-05, "epoch": 0.48480786416443256, "percentage": 4.85, "elapsed_time": "0:12:20", "remaining_time": "4:02:08", "throughput": 2539.85, "total_tokens": 1880160} {"current_steps": 3260, "total_steps": 67140, "loss": 0.824, "lr": 2.4270181709859995e-05, "epoch": 0.4855525767053917, "percentage": 4.86, "elapsed_time": "0:12:21", "remaining_time": "4:02:07", "throughput": 2539.73, "total_tokens": 1882912} {"current_steps": 3265, "total_steps": 67140, "loss": 0.8139, "lr": 2.4307417336907955e-05, "epoch": 0.4862972892463509, "percentage": 4.86, "elapsed_time": "0:12:22", "remaining_time": "4:02:05", "throughput": 2539.55, "total_tokens": 1885536} {"current_steps": 3270, "total_steps": 67140, "loss": 0.8198, "lr": 2.4344652963955915e-05, "epoch": 0.4870420017873101, "percentage": 4.87, "elapsed_time": "0:12:23", "remaining_time": "4:02:04", "throughput": 2539.55, "total_tokens": 1888416} {"current_steps": 3275, "total_steps": 67140, "loss": 0.8168, "lr": 2.4381888591003874e-05, "epoch": 0.4877867143282693, "percentage": 4.88, "elapsed_time": "0:12:24", "remaining_time": "4:02:03", "throughput": 2539.68, "total_tokens": 1891456} {"current_steps": 3280, "total_steps": 67140, "loss": 0.8166, "lr": 2.4419124218051834e-05, "epoch": 0.48853142686922846, "percentage": 4.89, "elapsed_time": "0:12:25", "remaining_time": "4:02:01", "throughput": 2539.6, "total_tokens": 1894240} {"current_steps": 3285, "total_steps": 67140, "loss": 0.8086, "lr": 2.4456359845099794e-05, "epoch": 0.48927613941018766, "percentage": 4.89, "elapsed_time": "0:12:27", "remaining_time": "4:02:00", "throughput": 2539.55, "total_tokens": 1897088} {"current_steps": 3290, "total_steps": 67140, "loss": 0.8148, "lr": 2.449359547214775e-05, "epoch": 0.49002085195114686, "percentage": 4.9, "elapsed_time": "0:12:28", "remaining_time": "4:02:00", "throughput": 2539.76, "total_tokens": 1900192} {"current_steps": 3295, "total_steps": 67140, "loss": 0.8207, "lr": 2.453083109919571e-05, "epoch": 0.49076556449210607, "percentage": 4.91, "elapsed_time": "0:12:29", "remaining_time": "4:01:59", "throughput": 2539.78, "total_tokens": 1903136} {"current_steps": 3300, "total_steps": 67140, "loss": 0.7766, "lr": 2.456806672624367e-05, "epoch": 0.4915102770330652, "percentage": 4.92, "elapsed_time": "0:12:30", "remaining_time": "4:01:57", "throughput": 2539.8, "total_tokens": 1906016} {"current_steps": 3305, "total_steps": 67140, "loss": 0.8123, "lr": 2.460530235329163e-05, "epoch": 0.4922549895740244, "percentage": 4.92, "elapsed_time": "0:12:31", "remaining_time": "4:01:57", "throughput": 2540.05, "total_tokens": 1909184} {"current_steps": 3310, "total_steps": 67140, "loss": 0.8203, "lr": 2.464253798033959e-05, "epoch": 0.4929997021149836, "percentage": 4.93, "elapsed_time": "0:12:32", "remaining_time": "4:01:55", "throughput": 2539.88, "total_tokens": 1911872} {"current_steps": 3315, "total_steps": 67140, "loss": 1.0299, "lr": 2.467977360738755e-05, "epoch": 0.4937444146559428, "percentage": 4.94, "elapsed_time": "0:12:33", "remaining_time": "4:01:55", "throughput": 2539.89, "total_tokens": 1914848} {"current_steps": 3320, "total_steps": 67140, "loss": 0.7773, "lr": 2.471700923443551e-05, "epoch": 0.494489127196902, "percentage": 4.94, "elapsed_time": "0:12:35", "remaining_time": "4:01:54", "throughput": 2540.04, "total_tokens": 1917920} {"current_steps": 3325, "total_steps": 67140, "loss": 0.84, "lr": 2.475424486148347e-05, "epoch": 0.49523383973786117, "percentage": 4.95, "elapsed_time": "0:12:36", "remaining_time": "4:01:53", "throughput": 2540.0, "total_tokens": 1920704} {"current_steps": 3330, "total_steps": 67140, "loss": 0.8743, "lr": 2.4791480488531426e-05, "epoch": 0.4959785522788204, "percentage": 4.96, "elapsed_time": "0:12:37", "remaining_time": "4:01:50", "throughput": 2539.74, "total_tokens": 1923264} {"current_steps": 3335, "total_steps": 67140, "loss": 3.2495, "lr": 2.4828716115579386e-05, "epoch": 0.4967232648197796, "percentage": 4.97, "elapsed_time": "0:12:38", "remaining_time": "4:01:49", "throughput": 2539.67, "total_tokens": 1926048} {"current_steps": 3340, "total_steps": 67140, "loss": 0.8086, "lr": 2.4865951742627346e-05, "epoch": 0.4974679773607388, "percentage": 4.97, "elapsed_time": "0:12:39", "remaining_time": "4:01:48", "throughput": 2539.63, "total_tokens": 1928896} {"current_steps": 3345, "total_steps": 67140, "loss": 0.8048, "lr": 2.4903187369675306e-05, "epoch": 0.4982126899016979, "percentage": 4.98, "elapsed_time": "0:12:40", "remaining_time": "4:01:47", "throughput": 2539.61, "total_tokens": 1931776} {"current_steps": 3350, "total_steps": 67140, "loss": 0.7965, "lr": 2.494042299672327e-05, "epoch": 0.4989574024426571, "percentage": 4.99, "elapsed_time": "0:12:41", "remaining_time": "4:01:45", "throughput": 2539.6, "total_tokens": 1934624} {"current_steps": 3355, "total_steps": 67140, "loss": 0.8057, "lr": 2.4977658623771225e-05, "epoch": 0.49970211498361633, "percentage": 5.0, "elapsed_time": "0:12:42", "remaining_time": "4:01:44", "throughput": 2539.67, "total_tokens": 1937600} {"current_steps": 3357, "total_steps": 67140, "eval_loss": 0.8055608868598938, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:13:57", "remaining_time": "4:25:14", "throughput": 2314.59, "total_tokens": 1938656} {"current_steps": 3360, "total_steps": 67140, "loss": 0.825, "lr": 2.501489425081919e-05, "epoch": 0.5004468275245755, "percentage": 5.0, "elapsed_time": "0:13:59", "remaining_time": "4:25:37", "throughput": 2310.81, "total_tokens": 1940192} {"current_steps": 3365, "total_steps": 67140, "loss": 0.7827, "lr": 2.505212987786714e-05, "epoch": 0.5011915400655347, "percentage": 5.01, "elapsed_time": "0:14:00", "remaining_time": "4:25:33", "throughput": 2310.97, "total_tokens": 1942912} {"current_steps": 3370, "total_steps": 67140, "loss": 0.8375, "lr": 2.50893655049151e-05, "epoch": 0.5019362526064939, "percentage": 5.02, "elapsed_time": "0:14:01", "remaining_time": "4:25:29", "throughput": 2311.07, "total_tokens": 1945504} {"current_steps": 3375, "total_steps": 67140, "loss": 0.8303, "lr": 2.512660113196306e-05, "epoch": 0.5026809651474531, "percentage": 5.03, "elapsed_time": "0:14:02", "remaining_time": "4:25:26", "throughput": 2311.44, "total_tokens": 1948512} {"current_steps": 3380, "total_steps": 67140, "loss": 0.8212, "lr": 2.516383675901102e-05, "epoch": 0.5034256776884123, "percentage": 5.03, "elapsed_time": "0:14:04", "remaining_time": "4:25:23", "throughput": 2311.73, "total_tokens": 1951392} {"current_steps": 3385, "total_steps": 67140, "loss": 0.7828, "lr": 2.520107238605898e-05, "epoch": 0.5041703902293715, "percentage": 5.04, "elapsed_time": "0:14:05", "remaining_time": "4:25:19", "throughput": 2312.06, "total_tokens": 1954272} {"current_steps": 3390, "total_steps": 67140, "loss": 0.8129, "lr": 2.5238308013106944e-05, "epoch": 0.5049151027703307, "percentage": 5.05, "elapsed_time": "0:14:06", "remaining_time": "4:25:16", "throughput": 2312.26, "total_tokens": 1957024} {"current_steps": 3395, "total_steps": 67140, "loss": 0.8098, "lr": 2.5275543640154904e-05, "epoch": 0.5056598153112899, "percentage": 5.06, "elapsed_time": "0:14:07", "remaining_time": "4:25:12", "throughput": 2312.45, "total_tokens": 1959744} {"current_steps": 3400, "total_steps": 67140, "loss": 0.8029, "lr": 2.5312779267202864e-05, "epoch": 0.506404527852249, "percentage": 5.06, "elapsed_time": "0:14:08", "remaining_time": "4:25:09", "throughput": 2312.81, "total_tokens": 1962688} {"current_steps": 3405, "total_steps": 67140, "loss": 0.7834, "lr": 2.5350014894250824e-05, "epoch": 0.5071492403932082, "percentage": 5.07, "elapsed_time": "0:14:09", "remaining_time": "4:25:05", "throughput": 2313.0, "total_tokens": 1965440} {"current_steps": 3410, "total_steps": 67140, "loss": 0.8122, "lr": 2.5387250521298777e-05, "epoch": 0.5078939529341674, "percentage": 5.08, "elapsed_time": "0:14:10", "remaining_time": "4:25:01", "throughput": 2313.2, "total_tokens": 1968192} {"current_steps": 3415, "total_steps": 67140, "loss": 0.8081, "lr": 2.5424486148346737e-05, "epoch": 0.5086386654751266, "percentage": 5.09, "elapsed_time": "0:14:11", "remaining_time": "4:24:57", "throughput": 2313.39, "total_tokens": 1970912} {"current_steps": 3420, "total_steps": 67140, "loss": 0.809, "lr": 2.5461721775394697e-05, "epoch": 0.5093833780160858, "percentage": 5.09, "elapsed_time": "0:14:13", "remaining_time": "4:24:54", "throughput": 2313.85, "total_tokens": 1973984} {"current_steps": 3425, "total_steps": 67140, "loss": 0.7974, "lr": 2.5498957402442656e-05, "epoch": 0.510128090557045, "percentage": 5.1, "elapsed_time": "0:14:14", "remaining_time": "4:24:51", "throughput": 2314.11, "total_tokens": 1976800} {"current_steps": 3430, "total_steps": 67140, "loss": 0.8135, "lr": 2.553619302949062e-05, "epoch": 0.5108728030980042, "percentage": 5.11, "elapsed_time": "0:14:15", "remaining_time": "4:24:48", "throughput": 2314.47, "total_tokens": 1979776} {"current_steps": 3435, "total_steps": 67140, "loss": 0.8615, "lr": 2.557342865653858e-05, "epoch": 0.5116175156389634, "percentage": 5.12, "elapsed_time": "0:14:16", "remaining_time": "4:24:44", "throughput": 2314.78, "total_tokens": 1982656} {"current_steps": 3440, "total_steps": 67140, "loss": 0.8901, "lr": 2.561066428358654e-05, "epoch": 0.5123622281799225, "percentage": 5.12, "elapsed_time": "0:14:17", "remaining_time": "4:24:40", "throughput": 2314.93, "total_tokens": 1985312} {"current_steps": 3445, "total_steps": 67140, "loss": 0.7952, "lr": 2.56478999106345e-05, "epoch": 0.5131069407208817, "percentage": 5.13, "elapsed_time": "0:14:18", "remaining_time": "4:24:37", "throughput": 2315.38, "total_tokens": 1988384} {"current_steps": 3450, "total_steps": 67140, "loss": 0.8241, "lr": 2.5685135537682452e-05, "epoch": 0.5138516532618409, "percentage": 5.14, "elapsed_time": "0:14:19", "remaining_time": "4:24:34", "throughput": 2315.7, "total_tokens": 1991296} {"current_steps": 3455, "total_steps": 67140, "loss": 0.8016, "lr": 2.5722371164730412e-05, "epoch": 0.5145963658028001, "percentage": 5.15, "elapsed_time": "0:14:21", "remaining_time": "4:24:30", "throughput": 2315.81, "total_tokens": 1993952} {"current_steps": 3460, "total_steps": 67140, "loss": 0.8226, "lr": 2.5759606791778372e-05, "epoch": 0.5153410783437593, "percentage": 5.15, "elapsed_time": "0:14:22", "remaining_time": "4:24:28", "throughput": 2316.23, "total_tokens": 1997024} {"current_steps": 3465, "total_steps": 67140, "loss": 0.8071, "lr": 2.5796842418826332e-05, "epoch": 0.5160857908847185, "percentage": 5.16, "elapsed_time": "0:14:23", "remaining_time": "4:24:24", "throughput": 2316.41, "total_tokens": 1999776} {"current_steps": 3470, "total_steps": 67140, "loss": 0.8023, "lr": 2.5834078045874295e-05, "epoch": 0.5168305034256777, "percentage": 5.17, "elapsed_time": "0:14:24", "remaining_time": "4:24:21", "throughput": 2316.79, "total_tokens": 2002752} {"current_steps": 3475, "total_steps": 67140, "loss": 0.817, "lr": 2.5871313672922255e-05, "epoch": 0.5175752159666369, "percentage": 5.18, "elapsed_time": "0:14:25", "remaining_time": "4:24:17", "throughput": 2316.92, "total_tokens": 2005408} {"current_steps": 3480, "total_steps": 67140, "loss": 0.8045, "lr": 2.5908549299970215e-05, "epoch": 0.5183199285075961, "percentage": 5.18, "elapsed_time": "0:14:26", "remaining_time": "4:24:14", "throughput": 2317.23, "total_tokens": 2008320} {"current_steps": 3485, "total_steps": 67140, "loss": 0.8066, "lr": 2.5945784927018175e-05, "epoch": 0.5190646410485552, "percentage": 5.19, "elapsed_time": "0:14:27", "remaining_time": "4:24:10", "throughput": 2317.38, "total_tokens": 2011040} {"current_steps": 3490, "total_steps": 67140, "loss": 0.7889, "lr": 2.5983020554066135e-05, "epoch": 0.5198093535895144, "percentage": 5.2, "elapsed_time": "0:14:28", "remaining_time": "4:24:07", "throughput": 2317.65, "total_tokens": 2013888} {"current_steps": 3495, "total_steps": 67140, "loss": 0.8211, "lr": 2.6020256181114088e-05, "epoch": 0.5205540661304736, "percentage": 5.21, "elapsed_time": "0:14:30", "remaining_time": "4:24:04", "throughput": 2318.14, "total_tokens": 2017024} {"current_steps": 3500, "total_steps": 67140, "loss": 0.829, "lr": 2.6057491808162047e-05, "epoch": 0.5212987786714328, "percentage": 5.21, "elapsed_time": "0:14:31", "remaining_time": "4:24:01", "throughput": 2318.47, "total_tokens": 2019968} {"current_steps": 3505, "total_steps": 67140, "loss": 0.803, "lr": 2.609472743521001e-05, "epoch": 0.522043491212392, "percentage": 5.22, "elapsed_time": "0:14:32", "remaining_time": "4:23:59", "throughput": 2318.96, "total_tokens": 2023104} {"current_steps": 3510, "total_steps": 67140, "loss": 0.8072, "lr": 2.613196306225797e-05, "epoch": 0.5227882037533512, "percentage": 5.23, "elapsed_time": "0:14:33", "remaining_time": "4:23:56", "throughput": 2319.25, "total_tokens": 2026016} {"current_steps": 3515, "total_steps": 67140, "loss": 0.7893, "lr": 2.616919868930593e-05, "epoch": 0.5235329162943104, "percentage": 5.24, "elapsed_time": "0:14:34", "remaining_time": "4:23:53", "throughput": 2319.59, "total_tokens": 2028960} {"current_steps": 3520, "total_steps": 67140, "loss": 0.8002, "lr": 2.620643431635389e-05, "epoch": 0.5242776288352696, "percentage": 5.24, "elapsed_time": "0:14:35", "remaining_time": "4:23:50", "throughput": 2320.08, "total_tokens": 2032096} {"current_steps": 3525, "total_steps": 67140, "loss": 0.8123, "lr": 2.624366994340185e-05, "epoch": 0.5250223413762288, "percentage": 5.25, "elapsed_time": "0:14:36", "remaining_time": "4:23:46", "throughput": 2320.1, "total_tokens": 2034656} {"current_steps": 3530, "total_steps": 67140, "loss": 0.8248, "lr": 2.628090557044981e-05, "epoch": 0.5257670539171879, "percentage": 5.26, "elapsed_time": "0:14:38", "remaining_time": "4:23:43", "throughput": 2320.56, "total_tokens": 2037760} {"current_steps": 3535, "total_steps": 67140, "loss": 0.8127, "lr": 2.631814119749777e-05, "epoch": 0.5265117664581471, "percentage": 5.27, "elapsed_time": "0:14:39", "remaining_time": "4:23:42", "throughput": 2321.24, "total_tokens": 2041248} {"current_steps": 3540, "total_steps": 67140, "loss": 2.403, "lr": 2.6355376824545723e-05, "epoch": 0.5272564789991063, "percentage": 5.27, "elapsed_time": "0:14:40", "remaining_time": "4:23:40", "throughput": 2321.71, "total_tokens": 2044384} {"current_steps": 3545, "total_steps": 67140, "loss": 1.2059, "lr": 2.6392612451593686e-05, "epoch": 0.5280011915400655, "percentage": 5.28, "elapsed_time": "0:14:41", "remaining_time": "4:23:36", "throughput": 2321.73, "total_tokens": 2046944} {"current_steps": 3550, "total_steps": 67140, "loss": 0.809, "lr": 2.6429848078641646e-05, "epoch": 0.5287459040810247, "percentage": 5.29, "elapsed_time": "0:14:42", "remaining_time": "4:23:32", "throughput": 2322.0, "total_tokens": 2049792} {"current_steps": 3555, "total_steps": 67140, "loss": 0.8107, "lr": 2.6467083705689606e-05, "epoch": 0.5294906166219839, "percentage": 5.29, "elapsed_time": "0:14:43", "remaining_time": "4:23:29", "throughput": 2322.31, "total_tokens": 2052736} {"current_steps": 3560, "total_steps": 67140, "loss": 0.7782, "lr": 2.6504319332737566e-05, "epoch": 0.5302353291629431, "percentage": 5.3, "elapsed_time": "0:14:45", "remaining_time": "4:23:26", "throughput": 2322.57, "total_tokens": 2055616} {"current_steps": 3565, "total_steps": 67140, "loss": 0.7957, "lr": 2.6541554959785526e-05, "epoch": 0.5309800417039023, "percentage": 5.31, "elapsed_time": "0:14:46", "remaining_time": "4:23:23", "throughput": 2322.81, "total_tokens": 2058464} {"current_steps": 3570, "total_steps": 67140, "loss": 0.789, "lr": 2.6578790586833485e-05, "epoch": 0.5317247542448614, "percentage": 5.32, "elapsed_time": "0:14:47", "remaining_time": "4:23:20", "throughput": 2322.91, "total_tokens": 2061152} {"current_steps": 3575, "total_steps": 67140, "loss": 0.7702, "lr": 2.6616026213881445e-05, "epoch": 0.5324694667858206, "percentage": 5.32, "elapsed_time": "0:14:48", "remaining_time": "4:23:16", "throughput": 2323.12, "total_tokens": 2063936} {"current_steps": 3580, "total_steps": 67140, "loss": 0.9007, "lr": 2.66532618409294e-05, "epoch": 0.5332141793267798, "percentage": 5.33, "elapsed_time": "0:14:49", "remaining_time": "4:23:13", "throughput": 2323.28, "total_tokens": 2066688} {"current_steps": 3585, "total_steps": 67140, "loss": 0.8206, "lr": 2.669049746797736e-05, "epoch": 0.533958891867739, "percentage": 5.34, "elapsed_time": "0:14:50", "remaining_time": "4:23:10", "throughput": 2323.64, "total_tokens": 2069664} {"current_steps": 3590, "total_steps": 67140, "loss": 0.7621, "lr": 2.672773309502532e-05, "epoch": 0.5347036044086982, "percentage": 5.35, "elapsed_time": "0:14:51", "remaining_time": "4:23:07", "throughput": 2324.01, "total_tokens": 2072672} {"current_steps": 3595, "total_steps": 67140, "loss": 0.8719, "lr": 2.676496872207328e-05, "epoch": 0.5354483169496574, "percentage": 5.35, "elapsed_time": "0:14:53", "remaining_time": "4:23:04", "throughput": 2324.44, "total_tokens": 2075776} {"current_steps": 3600, "total_steps": 67140, "loss": 0.7907, "lr": 2.680220434912124e-05, "epoch": 0.5361930294906166, "percentage": 5.36, "elapsed_time": "0:14:54", "remaining_time": "4:23:01", "throughput": 2324.7, "total_tokens": 2078656} {"current_steps": 3605, "total_steps": 67140, "loss": 0.8467, "lr": 2.68394399761692e-05, "epoch": 0.5369377420315758, "percentage": 5.37, "elapsed_time": "0:14:55", "remaining_time": "4:22:59", "throughput": 2325.2, "total_tokens": 2081824} {"current_steps": 3610, "total_steps": 67140, "loss": 0.8335, "lr": 2.687667560321716e-05, "epoch": 0.537682454572535, "percentage": 5.38, "elapsed_time": "0:14:56", "remaining_time": "4:22:56", "throughput": 2325.45, "total_tokens": 2084672} {"current_steps": 3615, "total_steps": 67140, "loss": 0.8306, "lr": 2.691391123026512e-05, "epoch": 0.5384271671134941, "percentage": 5.38, "elapsed_time": "0:14:57", "remaining_time": "4:22:52", "throughput": 2325.53, "total_tokens": 2087296} {"current_steps": 3620, "total_steps": 67140, "loss": 0.798, "lr": 2.695114685731308e-05, "epoch": 0.5391718796544533, "percentage": 5.39, "elapsed_time": "0:14:58", "remaining_time": "4:22:49", "throughput": 2325.85, "total_tokens": 2090272} {"current_steps": 3625, "total_steps": 67140, "loss": 0.7542, "lr": 2.6988382484361037e-05, "epoch": 0.5399165921954125, "percentage": 5.4, "elapsed_time": "0:14:59", "remaining_time": "4:22:46", "throughput": 2326.13, "total_tokens": 2093152} {"current_steps": 3630, "total_steps": 67140, "loss": 0.7307, "lr": 2.7025618111408997e-05, "epoch": 0.5406613047363718, "percentage": 5.41, "elapsed_time": "0:15:00", "remaining_time": "4:22:43", "throughput": 2326.51, "total_tokens": 2096160} {"current_steps": 3635, "total_steps": 67140, "loss": 0.9703, "lr": 2.7062853738456957e-05, "epoch": 0.541406017277331, "percentage": 5.41, "elapsed_time": "0:15:02", "remaining_time": "4:22:39", "throughput": 2326.61, "total_tokens": 2098784} {"current_steps": 3640, "total_steps": 67140, "loss": 0.7715, "lr": 2.7100089365504917e-05, "epoch": 0.5421507298182902, "percentage": 5.42, "elapsed_time": "0:15:03", "remaining_time": "4:22:35", "throughput": 2326.72, "total_tokens": 2101440} {"current_steps": 3645, "total_steps": 67140, "loss": 0.7876, "lr": 2.7137324992552876e-05, "epoch": 0.5428954423592494, "percentage": 5.43, "elapsed_time": "0:15:04", "remaining_time": "4:22:33", "throughput": 2327.04, "total_tokens": 2104448} {"current_steps": 3650, "total_steps": 67140, "loss": 0.8206, "lr": 2.7174560619600836e-05, "epoch": 0.5436401549002086, "percentage": 5.44, "elapsed_time": "0:15:05", "remaining_time": "4:22:30", "throughput": 2327.26, "total_tokens": 2107232} {"current_steps": 3655, "total_steps": 67140, "loss": 0.7931, "lr": 2.7211796246648796e-05, "epoch": 0.5443848674411678, "percentage": 5.44, "elapsed_time": "0:15:06", "remaining_time": "4:22:27", "throughput": 2327.67, "total_tokens": 2110336} {"current_steps": 3660, "total_steps": 67140, "loss": 0.8454, "lr": 2.7249031873696756e-05, "epoch": 0.5451295799821269, "percentage": 5.45, "elapsed_time": "0:15:07", "remaining_time": "4:22:25", "throughput": 2328.1, "total_tokens": 2113472} {"current_steps": 3665, "total_steps": 67140, "loss": 0.7812, "lr": 2.7286267500744716e-05, "epoch": 0.5458742925230861, "percentage": 5.46, "elapsed_time": "0:15:09", "remaining_time": "4:22:25", "throughput": 2328.87, "total_tokens": 2117216} {"current_steps": 3670, "total_steps": 67140, "loss": 0.7273, "lr": 2.7323503127792672e-05, "epoch": 0.5466190050640453, "percentage": 5.47, "elapsed_time": "0:15:10", "remaining_time": "4:22:22", "throughput": 2329.18, "total_tokens": 2120128} {"current_steps": 3675, "total_steps": 67140, "loss": 0.7772, "lr": 2.7360738754840632e-05, "epoch": 0.5473637176050045, "percentage": 5.47, "elapsed_time": "0:15:11", "remaining_time": "4:22:19", "throughput": 2329.68, "total_tokens": 2123328} {"current_steps": 3680, "total_steps": 67140, "loss": 0.6639, "lr": 2.7397974381888592e-05, "epoch": 0.5481084301459637, "percentage": 5.48, "elapsed_time": "0:15:12", "remaining_time": "4:22:17", "throughput": 2330.2, "total_tokens": 2126528} {"current_steps": 3685, "total_steps": 67140, "loss": 0.9772, "lr": 2.7435210008936552e-05, "epoch": 0.5488531426869229, "percentage": 5.49, "elapsed_time": "0:15:13", "remaining_time": "4:22:13", "throughput": 2330.34, "total_tokens": 2129248} {"current_steps": 3690, "total_steps": 67140, "loss": 0.7476, "lr": 2.7472445635984512e-05, "epoch": 0.5495978552278821, "percentage": 5.5, "elapsed_time": "0:15:14", "remaining_time": "4:22:11", "throughput": 2330.62, "total_tokens": 2132192} {"current_steps": 3695, "total_steps": 67140, "loss": 0.7049, "lr": 2.750968126303247e-05, "epoch": 0.5503425677688413, "percentage": 5.5, "elapsed_time": "0:15:15", "remaining_time": "4:22:08", "throughput": 2330.93, "total_tokens": 2135104} {"current_steps": 3700, "total_steps": 67140, "loss": 0.7679, "lr": 2.754691689008043e-05, "epoch": 0.5510872803098004, "percentage": 5.51, "elapsed_time": "0:15:17", "remaining_time": "4:22:04", "throughput": 2331.08, "total_tokens": 2137824} {"current_steps": 3705, "total_steps": 67140, "loss": 0.7013, "lr": 2.758415251712839e-05, "epoch": 0.5518319928507596, "percentage": 5.52, "elapsed_time": "0:15:18", "remaining_time": "4:22:01", "throughput": 2331.23, "total_tokens": 2140608} {"current_steps": 3710, "total_steps": 67140, "loss": 0.8018, "lr": 2.7621388144176348e-05, "epoch": 0.5525767053917188, "percentage": 5.53, "elapsed_time": "0:15:19", "remaining_time": "4:21:58", "throughput": 2331.42, "total_tokens": 2143392} {"current_steps": 3715, "total_steps": 67140, "loss": 0.732, "lr": 2.7658623771224308e-05, "epoch": 0.553321417932678, "percentage": 5.53, "elapsed_time": "0:15:20", "remaining_time": "4:21:55", "throughput": 2331.78, "total_tokens": 2146432} {"current_steps": 3720, "total_steps": 67140, "loss": 0.7096, "lr": 2.7695859398272267e-05, "epoch": 0.5540661304736372, "percentage": 5.54, "elapsed_time": "0:15:21", "remaining_time": "4:21:52", "throughput": 2331.99, "total_tokens": 2149248} {"current_steps": 3725, "total_steps": 67140, "loss": 0.8367, "lr": 2.7733095025320227e-05, "epoch": 0.5548108430145964, "percentage": 5.55, "elapsed_time": "0:15:22", "remaining_time": "4:21:50", "throughput": 2332.39, "total_tokens": 2152352} {"current_steps": 3730, "total_steps": 67140, "loss": 0.7197, "lr": 2.7770330652368187e-05, "epoch": 0.5555555555555556, "percentage": 5.56, "elapsed_time": "0:15:23", "remaining_time": "4:21:47", "throughput": 2332.67, "total_tokens": 2155264} {"current_steps": 3735, "total_steps": 67140, "loss": 0.8037, "lr": 2.7807566279416147e-05, "epoch": 0.5563002680965148, "percentage": 5.56, "elapsed_time": "0:15:25", "remaining_time": "4:21:44", "throughput": 2333.03, "total_tokens": 2158336} {"current_steps": 3740, "total_steps": 67140, "loss": 0.7423, "lr": 2.7844801906464107e-05, "epoch": 0.557044980637474, "percentage": 5.57, "elapsed_time": "0:15:26", "remaining_time": "4:21:42", "throughput": 2333.38, "total_tokens": 2161344} {"current_steps": 3745, "total_steps": 67140, "loss": 0.5675, "lr": 2.7882037533512067e-05, "epoch": 0.5577896931784331, "percentage": 5.58, "elapsed_time": "0:15:27", "remaining_time": "4:21:38", "throughput": 2333.49, "total_tokens": 2164032} {"current_steps": 3750, "total_steps": 67140, "loss": 0.8706, "lr": 2.7919273160560027e-05, "epoch": 0.5585344057193923, "percentage": 5.59, "elapsed_time": "0:15:28", "remaining_time": "4:21:35", "throughput": 2333.76, "total_tokens": 2166912} {"current_steps": 3755, "total_steps": 67140, "loss": 0.6318, "lr": 2.7956508787607983e-05, "epoch": 0.5592791182603515, "percentage": 5.59, "elapsed_time": "0:15:29", "remaining_time": "4:21:33", "throughput": 2334.17, "total_tokens": 2170016} {"current_steps": 3760, "total_steps": 67140, "loss": 0.8313, "lr": 2.7993744414655943e-05, "epoch": 0.5600238308013107, "percentage": 5.6, "elapsed_time": "0:15:30", "remaining_time": "4:21:28", "throughput": 2334.12, "total_tokens": 2172448} {"current_steps": 3765, "total_steps": 67140, "loss": 0.8923, "lr": 2.8030980041703903e-05, "epoch": 0.5607685433422699, "percentage": 5.61, "elapsed_time": "0:15:31", "remaining_time": "4:21:26", "throughput": 2334.69, "total_tokens": 2175776} {"current_steps": 3770, "total_steps": 67140, "loss": 0.8054, "lr": 2.8068215668751863e-05, "epoch": 0.5615132558832291, "percentage": 5.62, "elapsed_time": "0:15:33", "remaining_time": "4:21:23", "throughput": 2334.87, "total_tokens": 2178560} {"current_steps": 3775, "total_steps": 67140, "loss": 0.7923, "lr": 2.8105451295799822e-05, "epoch": 0.5622579684241883, "percentage": 5.62, "elapsed_time": "0:15:34", "remaining_time": "4:21:21", "throughput": 2335.25, "total_tokens": 2181600} {"current_steps": 3780, "total_steps": 67140, "loss": 0.6438, "lr": 2.8142686922847782e-05, "epoch": 0.5630026809651475, "percentage": 5.63, "elapsed_time": "0:15:35", "remaining_time": "4:21:18", "throughput": 2335.45, "total_tokens": 2184448} {"current_steps": 3785, "total_steps": 67140, "loss": 0.6635, "lr": 2.8179922549895742e-05, "epoch": 0.5637473935061067, "percentage": 5.64, "elapsed_time": "0:15:36", "remaining_time": "4:21:15", "throughput": 2335.75, "total_tokens": 2187424} {"current_steps": 3790, "total_steps": 67140, "loss": 0.6552, "lr": 2.8217158176943702e-05, "epoch": 0.5644921060470658, "percentage": 5.64, "elapsed_time": "0:15:37", "remaining_time": "4:21:12", "throughput": 2335.82, "total_tokens": 2190080} {"current_steps": 3795, "total_steps": 67140, "loss": 0.7144, "lr": 2.825439380399166e-05, "epoch": 0.565236818588025, "percentage": 5.65, "elapsed_time": "0:15:38", "remaining_time": "4:21:08", "throughput": 2335.96, "total_tokens": 2192800} {"current_steps": 3800, "total_steps": 67140, "loss": 0.668, "lr": 2.8291629431039618e-05, "epoch": 0.5659815311289842, "percentage": 5.66, "elapsed_time": "0:15:39", "remaining_time": "4:21:06", "throughput": 2336.33, "total_tokens": 2195840} {"current_steps": 3805, "total_steps": 67140, "loss": 0.6981, "lr": 2.8328865058087578e-05, "epoch": 0.5667262436699434, "percentage": 5.67, "elapsed_time": "0:15:41", "remaining_time": "4:21:05", "throughput": 2337.03, "total_tokens": 2199424} {"current_steps": 3810, "total_steps": 67140, "loss": 0.8038, "lr": 2.8366100685135538e-05, "epoch": 0.5674709562109026, "percentage": 5.67, "elapsed_time": "0:15:42", "remaining_time": "4:21:01", "throughput": 2337.22, "total_tokens": 2202208} {"current_steps": 3815, "total_steps": 67140, "loss": 0.7356, "lr": 2.8403336312183498e-05, "epoch": 0.5682156687518618, "percentage": 5.68, "elapsed_time": "0:15:43", "remaining_time": "4:20:59", "throughput": 2337.49, "total_tokens": 2205152} {"current_steps": 3820, "total_steps": 67140, "loss": 0.7182, "lr": 2.8440571939231458e-05, "epoch": 0.568960381292821, "percentage": 5.69, "elapsed_time": "0:15:44", "remaining_time": "4:20:56", "throughput": 2337.86, "total_tokens": 2208224} {"current_steps": 3825, "total_steps": 67140, "loss": 0.6459, "lr": 2.8477807566279418e-05, "epoch": 0.5697050938337802, "percentage": 5.7, "elapsed_time": "0:15:45", "remaining_time": "4:20:54", "throughput": 2338.24, "total_tokens": 2211296} {"current_steps": 3830, "total_steps": 67140, "loss": 0.6414, "lr": 2.8515043193327377e-05, "epoch": 0.5704498063747393, "percentage": 5.7, "elapsed_time": "0:15:46", "remaining_time": "4:20:51", "throughput": 2338.48, "total_tokens": 2214176} {"current_steps": 3835, "total_steps": 67140, "loss": 0.6803, "lr": 2.8552278820375337e-05, "epoch": 0.5711945189156985, "percentage": 5.71, "elapsed_time": "0:15:47", "remaining_time": "4:20:47", "throughput": 2338.34, "total_tokens": 2216512} {"current_steps": 3840, "total_steps": 67140, "loss": 0.627, "lr": 2.8589514447423294e-05, "epoch": 0.5719392314566577, "percentage": 5.72, "elapsed_time": "0:15:49", "remaining_time": "4:20:44", "throughput": 2338.56, "total_tokens": 2219392} {"current_steps": 3845, "total_steps": 67140, "loss": 0.8507, "lr": 2.8626750074471254e-05, "epoch": 0.5726839439976169, "percentage": 5.73, "elapsed_time": "0:15:50", "remaining_time": "4:20:41", "throughput": 2338.86, "total_tokens": 2222368} {"current_steps": 3850, "total_steps": 67140, "loss": 0.6506, "lr": 2.8663985701519213e-05, "epoch": 0.5734286565385761, "percentage": 5.73, "elapsed_time": "0:15:51", "remaining_time": "4:20:39", "throughput": 2339.25, "total_tokens": 2225472} {"current_steps": 3855, "total_steps": 67140, "loss": 0.8723, "lr": 2.8701221328567173e-05, "epoch": 0.5741733690795353, "percentage": 5.74, "elapsed_time": "0:15:52", "remaining_time": "4:20:36", "throughput": 2339.57, "total_tokens": 2228416} {"current_steps": 3860, "total_steps": 67140, "loss": 0.7261, "lr": 2.8738456955615133e-05, "epoch": 0.5749180816204945, "percentage": 5.75, "elapsed_time": "0:15:53", "remaining_time": "4:20:32", "throughput": 2339.69, "total_tokens": 2231104} {"current_steps": 3865, "total_steps": 67140, "loss": 0.7642, "lr": 2.8775692582663093e-05, "epoch": 0.5756627941614537, "percentage": 5.76, "elapsed_time": "0:15:54", "remaining_time": "4:20:29", "throughput": 2339.8, "total_tokens": 2233760} {"current_steps": 3870, "total_steps": 67140, "loss": 0.7142, "lr": 2.8812928209711053e-05, "epoch": 0.5764075067024129, "percentage": 5.76, "elapsed_time": "0:15:55", "remaining_time": "4:20:26", "throughput": 2340.03, "total_tokens": 2236608} {"current_steps": 3875, "total_steps": 67140, "loss": 0.7366, "lr": 2.8850163836759013e-05, "epoch": 0.577152219243372, "percentage": 5.77, "elapsed_time": "0:15:56", "remaining_time": "4:20:22", "throughput": 2340.26, "total_tokens": 2239424} {"current_steps": 3880, "total_steps": 67140, "loss": 0.8853, "lr": 2.8887399463806976e-05, "epoch": 0.5778969317843312, "percentage": 5.78, "elapsed_time": "0:15:58", "remaining_time": "4:20:20", "throughput": 2340.46, "total_tokens": 2242272} {"current_steps": 3885, "total_steps": 67140, "loss": 0.9069, "lr": 2.892463509085493e-05, "epoch": 0.5786416443252904, "percentage": 5.79, "elapsed_time": "0:15:59", "remaining_time": "4:20:17", "throughput": 2340.75, "total_tokens": 2245216} {"current_steps": 3890, "total_steps": 67140, "loss": 0.5945, "lr": 2.896187071790289e-05, "epoch": 0.5793863568662496, "percentage": 5.79, "elapsed_time": "0:16:00", "remaining_time": "4:20:15", "throughput": 2341.16, "total_tokens": 2248352} {"current_steps": 3895, "total_steps": 67140, "loss": 0.7678, "lr": 2.899910634495085e-05, "epoch": 0.5801310694072088, "percentage": 5.8, "elapsed_time": "0:16:01", "remaining_time": "4:20:11", "throughput": 2341.22, "total_tokens": 2251008} {"current_steps": 3900, "total_steps": 67140, "loss": 0.6608, "lr": 2.903634197199881e-05, "epoch": 0.580875781948168, "percentage": 5.81, "elapsed_time": "0:16:02", "remaining_time": "4:20:09", "throughput": 2341.54, "total_tokens": 2254048} {"current_steps": 3905, "total_steps": 67140, "loss": 0.7443, "lr": 2.907357759904677e-05, "epoch": 0.5816204944891272, "percentage": 5.82, "elapsed_time": "0:16:03", "remaining_time": "4:20:07", "throughput": 2341.88, "total_tokens": 2257088} {"current_steps": 3910, "total_steps": 67140, "loss": 0.6792, "lr": 2.9110813226094728e-05, "epoch": 0.5823652070300864, "percentage": 5.82, "elapsed_time": "0:16:04", "remaining_time": "4:20:04", "throughput": 2342.13, "total_tokens": 2260000} {"current_steps": 3915, "total_steps": 67140, "loss": 0.7799, "lr": 2.914804885314269e-05, "epoch": 0.5831099195710456, "percentage": 5.83, "elapsed_time": "0:16:06", "remaining_time": "4:20:00", "throughput": 2342.24, "total_tokens": 2262688} {"current_steps": 3920, "total_steps": 67140, "loss": 0.8205, "lr": 2.918528448019065e-05, "epoch": 0.5838546321120047, "percentage": 5.84, "elapsed_time": "0:16:07", "remaining_time": "4:19:57", "throughput": 2342.46, "total_tokens": 2265536} {"current_steps": 3925, "total_steps": 67140, "loss": 0.6774, "lr": 2.9222520107238604e-05, "epoch": 0.5845993446529639, "percentage": 5.85, "elapsed_time": "0:16:08", "remaining_time": "4:19:55", "throughput": 2342.73, "total_tokens": 2268512} {"current_steps": 3930, "total_steps": 67140, "loss": 0.6587, "lr": 2.9259755734286564e-05, "epoch": 0.5853440571939231, "percentage": 5.85, "elapsed_time": "0:16:09", "remaining_time": "4:19:53", "throughput": 2343.16, "total_tokens": 2271712} {"current_steps": 3935, "total_steps": 67140, "loss": 0.8712, "lr": 2.9296991361334524e-05, "epoch": 0.5860887697348823, "percentage": 5.86, "elapsed_time": "0:16:10", "remaining_time": "4:19:50", "throughput": 2343.37, "total_tokens": 2274560} {"current_steps": 3940, "total_steps": 67140, "loss": 0.6763, "lr": 2.9334226988382484e-05, "epoch": 0.5868334822758415, "percentage": 5.87, "elapsed_time": "0:16:11", "remaining_time": "4:19:47", "throughput": 2343.54, "total_tokens": 2277376} {"current_steps": 3945, "total_steps": 67140, "loss": 0.6969, "lr": 2.9371462615430444e-05, "epoch": 0.5875781948168007, "percentage": 5.88, "elapsed_time": "0:16:12", "remaining_time": "4:19:43", "throughput": 2343.49, "total_tokens": 2279840} {"current_steps": 3950, "total_steps": 67140, "loss": 0.8504, "lr": 2.9408698242478404e-05, "epoch": 0.5883229073577599, "percentage": 5.88, "elapsed_time": "0:16:13", "remaining_time": "4:19:40", "throughput": 2343.66, "total_tokens": 2282560} {"current_steps": 3955, "total_steps": 67140, "loss": 0.6501, "lr": 2.9445933869526367e-05, "epoch": 0.5890676198987191, "percentage": 5.89, "elapsed_time": "0:16:15", "remaining_time": "4:19:37", "throughput": 2343.96, "total_tokens": 2285536} {"current_steps": 3960, "total_steps": 67140, "loss": 0.651, "lr": 2.9483169496574327e-05, "epoch": 0.5898123324396782, "percentage": 5.9, "elapsed_time": "0:16:16", "remaining_time": "4:19:34", "throughput": 2344.12, "total_tokens": 2288288} {"current_steps": 3965, "total_steps": 67140, "loss": 0.7228, "lr": 2.9520405123622287e-05, "epoch": 0.5905570449806374, "percentage": 5.91, "elapsed_time": "0:16:17", "remaining_time": "4:19:31", "throughput": 2344.23, "total_tokens": 2291040} {"current_steps": 3970, "total_steps": 67140, "loss": 0.6424, "lr": 2.955764075067024e-05, "epoch": 0.5913017575215966, "percentage": 5.91, "elapsed_time": "0:16:18", "remaining_time": "4:19:28", "throughput": 2344.38, "total_tokens": 2293792} {"current_steps": 3975, "total_steps": 67140, "loss": 0.7633, "lr": 2.95948763777182e-05, "epoch": 0.5920464700625558, "percentage": 5.92, "elapsed_time": "0:16:19", "remaining_time": "4:19:25", "throughput": 2344.69, "total_tokens": 2296800} {"current_steps": 3980, "total_steps": 67140, "loss": 0.7857, "lr": 2.963211200476616e-05, "epoch": 0.592791182603515, "percentage": 5.93, "elapsed_time": "0:16:20", "remaining_time": "4:19:23", "throughput": 2344.98, "total_tokens": 2299744} {"current_steps": 3985, "total_steps": 67140, "loss": 0.6181, "lr": 2.966934763181412e-05, "epoch": 0.5935358951444742, "percentage": 5.94, "elapsed_time": "0:16:21", "remaining_time": "4:19:20", "throughput": 2345.31, "total_tokens": 2302784} {"current_steps": 3990, "total_steps": 67140, "loss": 0.6188, "lr": 2.970658325886208e-05, "epoch": 0.5942806076854334, "percentage": 5.94, "elapsed_time": "0:16:22", "remaining_time": "4:19:17", "throughput": 2345.52, "total_tokens": 2305632} {"current_steps": 3995, "total_steps": 67140, "loss": 0.8434, "lr": 2.9743818885910042e-05, "epoch": 0.5950253202263927, "percentage": 5.95, "elapsed_time": "0:16:24", "remaining_time": "4:19:15", "throughput": 2345.78, "total_tokens": 2308576} {"current_steps": 4000, "total_steps": 67140, "loss": 0.7794, "lr": 2.9781054512958002e-05, "epoch": 0.5957700327673519, "percentage": 5.96, "elapsed_time": "0:16:25", "remaining_time": "4:19:12", "throughput": 2346.06, "total_tokens": 2311552} {"current_steps": 4005, "total_steps": 67140, "loss": 0.7391, "lr": 2.9818290140005962e-05, "epoch": 0.596514745308311, "percentage": 5.97, "elapsed_time": "0:16:26", "remaining_time": "4:19:10", "throughput": 2346.24, "total_tokens": 2314400} {"current_steps": 4010, "total_steps": 67140, "loss": 0.9084, "lr": 2.9855525767053922e-05, "epoch": 0.5972594578492701, "percentage": 5.97, "elapsed_time": "0:16:27", "remaining_time": "4:19:07", "throughput": 2346.38, "total_tokens": 2317184} {"current_steps": 4015, "total_steps": 67140, "loss": 0.7568, "lr": 2.9892761394101875e-05, "epoch": 0.5980041703902294, "percentage": 5.98, "elapsed_time": "0:16:28", "remaining_time": "4:19:04", "throughput": 2346.68, "total_tokens": 2320160} {"current_steps": 4020, "total_steps": 67140, "loss": 0.8545, "lr": 2.9929997021149835e-05, "epoch": 0.5987488829311886, "percentage": 5.99, "elapsed_time": "0:16:29", "remaining_time": "4:19:01", "throughput": 2346.84, "total_tokens": 2322976} {"current_steps": 4025, "total_steps": 67140, "loss": 0.6787, "lr": 2.9967232648197795e-05, "epoch": 0.5994935954721478, "percentage": 5.99, "elapsed_time": "0:16:30", "remaining_time": "4:18:59", "throughput": 2347.07, "total_tokens": 2325888} {"current_steps": 4030, "total_steps": 67140, "loss": 0.7274, "lr": 3.0004468275245755e-05, "epoch": 0.600238308013107, "percentage": 6.0, "elapsed_time": "0:16:32", "remaining_time": "4:18:56", "throughput": 2347.23, "total_tokens": 2328672} {"current_steps": 4035, "total_steps": 67140, "loss": 0.7174, "lr": 3.0041703902293718e-05, "epoch": 0.6009830205540662, "percentage": 6.01, "elapsed_time": "0:16:33", "remaining_time": "4:18:53", "throughput": 2347.52, "total_tokens": 2331680} {"current_steps": 4040, "total_steps": 67140, "loss": 0.7083, "lr": 3.0078939529341678e-05, "epoch": 0.6017277330950254, "percentage": 6.02, "elapsed_time": "0:16:34", "remaining_time": "4:18:50", "throughput": 2347.56, "total_tokens": 2334272} {"current_steps": 4045, "total_steps": 67140, "loss": 0.7861, "lr": 3.0116175156389638e-05, "epoch": 0.6024724456359845, "percentage": 6.02, "elapsed_time": "0:16:35", "remaining_time": "4:18:47", "throughput": 2347.63, "total_tokens": 2336928} {"current_steps": 4050, "total_steps": 67140, "loss": 0.5679, "lr": 3.0153410783437597e-05, "epoch": 0.6032171581769437, "percentage": 6.03, "elapsed_time": "0:16:36", "remaining_time": "4:18:44", "throughput": 2347.96, "total_tokens": 2340000} {"current_steps": 4055, "total_steps": 67140, "loss": 0.6866, "lr": 3.019064641048555e-05, "epoch": 0.6039618707179029, "percentage": 6.04, "elapsed_time": "0:16:37", "remaining_time": "4:18:41", "throughput": 2348.12, "total_tokens": 2342784} {"current_steps": 4060, "total_steps": 67140, "loss": 0.8483, "lr": 3.022788203753351e-05, "epoch": 0.6047065832588621, "percentage": 6.05, "elapsed_time": "0:16:38", "remaining_time": "4:18:39", "throughput": 2348.22, "total_tokens": 2345504} {"current_steps": 4065, "total_steps": 67140, "loss": 0.5815, "lr": 3.026511766458147e-05, "epoch": 0.6054512957998213, "percentage": 6.05, "elapsed_time": "0:16:39", "remaining_time": "4:18:36", "throughput": 2348.48, "total_tokens": 2348448} {"current_steps": 4070, "total_steps": 67140, "loss": 0.7463, "lr": 3.030235329162943e-05, "epoch": 0.6061960083407805, "percentage": 6.06, "elapsed_time": "0:16:41", "remaining_time": "4:18:33", "throughput": 2348.65, "total_tokens": 2351264} {"current_steps": 4075, "total_steps": 67140, "loss": 0.7816, "lr": 3.0339588918677393e-05, "epoch": 0.6069407208817397, "percentage": 6.07, "elapsed_time": "0:16:42", "remaining_time": "4:18:30", "throughput": 2348.74, "total_tokens": 2353920} {"current_steps": 4080, "total_steps": 67140, "loss": 0.5994, "lr": 3.0376824545725353e-05, "epoch": 0.6076854334226989, "percentage": 6.08, "elapsed_time": "0:16:43", "remaining_time": "4:18:27", "throughput": 2348.83, "total_tokens": 2356608} {"current_steps": 4085, "total_steps": 67140, "loss": 0.6605, "lr": 3.0414060172773313e-05, "epoch": 0.6084301459636581, "percentage": 6.08, "elapsed_time": "0:16:44", "remaining_time": "4:18:24", "throughput": 2348.97, "total_tokens": 2359392} {"current_steps": 4090, "total_steps": 67140, "loss": 0.7971, "lr": 3.0451295799821273e-05, "epoch": 0.6091748585046172, "percentage": 6.09, "elapsed_time": "0:16:45", "remaining_time": "4:18:22", "throughput": 2349.34, "total_tokens": 2362528} {"current_steps": 4095, "total_steps": 67140, "loss": 0.6758, "lr": 3.0488531426869233e-05, "epoch": 0.6099195710455764, "percentage": 6.1, "elapsed_time": "0:16:46", "remaining_time": "4:18:19", "throughput": 2349.47, "total_tokens": 2365280} {"current_steps": 4100, "total_steps": 67140, "loss": 0.6738, "lr": 3.0525767053917186e-05, "epoch": 0.6106642835865356, "percentage": 6.11, "elapsed_time": "0:16:47", "remaining_time": "4:18:16", "throughput": 2349.65, "total_tokens": 2368096} {"current_steps": 4105, "total_steps": 67140, "loss": 0.6434, "lr": 3.056300268096515e-05, "epoch": 0.6114089961274948, "percentage": 6.11, "elapsed_time": "0:16:48", "remaining_time": "4:18:13", "throughput": 2349.9, "total_tokens": 2370976} {"current_steps": 4110, "total_steps": 67140, "loss": 0.8909, "lr": 3.0600238308013105e-05, "epoch": 0.612153708668454, "percentage": 6.12, "elapsed_time": "0:16:50", "remaining_time": "4:18:10", "throughput": 2350.13, "total_tokens": 2373888} {"current_steps": 4115, "total_steps": 67140, "loss": 0.7431, "lr": 3.063747393506107e-05, "epoch": 0.6128984212094132, "percentage": 6.13, "elapsed_time": "0:16:51", "remaining_time": "4:18:07", "throughput": 2350.31, "total_tokens": 2376704} {"current_steps": 4120, "total_steps": 67140, "loss": 0.6988, "lr": 3.0674709562109025e-05, "epoch": 0.6136431337503724, "percentage": 6.14, "elapsed_time": "0:16:52", "remaining_time": "4:18:05", "throughput": 2350.43, "total_tokens": 2379456} {"current_steps": 4125, "total_steps": 67140, "loss": 0.7473, "lr": 3.071194518915699e-05, "epoch": 0.6143878462913316, "percentage": 6.14, "elapsed_time": "0:16:53", "remaining_time": "4:18:03", "throughput": 2350.81, "total_tokens": 2382624} {"current_steps": 4130, "total_steps": 67140, "loss": 0.7691, "lr": 3.0749180816204945e-05, "epoch": 0.6151325588322908, "percentage": 6.15, "elapsed_time": "0:16:54", "remaining_time": "4:18:00", "throughput": 2351.02, "total_tokens": 2385472} {"current_steps": 4135, "total_steps": 67140, "loss": 0.821, "lr": 3.078641644325291e-05, "epoch": 0.6158772713732499, "percentage": 6.16, "elapsed_time": "0:16:55", "remaining_time": "4:17:57", "throughput": 2351.24, "total_tokens": 2388384} {"current_steps": 4140, "total_steps": 67140, "loss": 0.6293, "lr": 3.082365207030087e-05, "epoch": 0.6166219839142091, "percentage": 6.17, "elapsed_time": "0:16:56", "remaining_time": "4:17:54", "throughput": 2351.38, "total_tokens": 2391136} {"current_steps": 4145, "total_steps": 67140, "loss": 0.7287, "lr": 3.086088769734882e-05, "epoch": 0.6173666964551683, "percentage": 6.17, "elapsed_time": "0:16:58", "remaining_time": "4:17:52", "throughput": 2351.68, "total_tokens": 2394144} {"current_steps": 4150, "total_steps": 67140, "loss": 0.6347, "lr": 3.0898123324396784e-05, "epoch": 0.6181114089961275, "percentage": 6.18, "elapsed_time": "0:16:59", "remaining_time": "4:17:49", "throughput": 2351.84, "total_tokens": 2396992} {"current_steps": 4155, "total_steps": 67140, "loss": 0.6367, "lr": 3.093535895144474e-05, "epoch": 0.6188561215370867, "percentage": 6.19, "elapsed_time": "0:17:00", "remaining_time": "4:17:46", "throughput": 2351.9, "total_tokens": 2399616} {"current_steps": 4160, "total_steps": 67140, "loss": 0.9083, "lr": 3.0972594578492704e-05, "epoch": 0.6196008340780459, "percentage": 6.2, "elapsed_time": "0:17:01", "remaining_time": "4:17:43", "throughput": 2351.96, "total_tokens": 2402272} {"current_steps": 4165, "total_steps": 67140, "loss": 0.7163, "lr": 3.100983020554066e-05, "epoch": 0.6203455466190051, "percentage": 6.2, "elapsed_time": "0:17:02", "remaining_time": "4:17:40", "throughput": 2352.16, "total_tokens": 2405120} {"current_steps": 4170, "total_steps": 67140, "loss": 0.6848, "lr": 3.1047065832588624e-05, "epoch": 0.6210902591599643, "percentage": 6.21, "elapsed_time": "0:17:03", "remaining_time": "4:17:37", "throughput": 2352.44, "total_tokens": 2408096} {"current_steps": 4175, "total_steps": 67140, "loss": 0.6581, "lr": 3.108430145963658e-05, "epoch": 0.6218349717009234, "percentage": 6.22, "elapsed_time": "0:17:04", "remaining_time": "4:17:35", "throughput": 2352.71, "total_tokens": 2411072} {"current_steps": 4180, "total_steps": 67140, "loss": 0.6703, "lr": 3.1121537086684543e-05, "epoch": 0.6225796842418826, "percentage": 6.23, "elapsed_time": "0:17:05", "remaining_time": "4:17:33", "throughput": 2352.99, "total_tokens": 2414080} {"current_steps": 4185, "total_steps": 67140, "loss": 0.702, "lr": 3.11587727137325e-05, "epoch": 0.6233243967828418, "percentage": 6.23, "elapsed_time": "0:17:07", "remaining_time": "4:17:31", "throughput": 2353.39, "total_tokens": 2417280} {"current_steps": 4190, "total_steps": 67140, "loss": 0.7883, "lr": 3.1196008340780456e-05, "epoch": 0.624069109323801, "percentage": 6.24, "elapsed_time": "0:17:08", "remaining_time": "4:17:28", "throughput": 2353.56, "total_tokens": 2420128} {"current_steps": 4195, "total_steps": 67140, "loss": 0.8329, "lr": 3.123324396782842e-05, "epoch": 0.6248138218647602, "percentage": 6.25, "elapsed_time": "0:17:09", "remaining_time": "4:17:26", "throughput": 2353.87, "total_tokens": 2423136} {"current_steps": 4200, "total_steps": 67140, "loss": 0.777, "lr": 3.1270479594876376e-05, "epoch": 0.6255585344057194, "percentage": 6.26, "elapsed_time": "0:17:10", "remaining_time": "4:17:23", "throughput": 2354.17, "total_tokens": 2426144} {"current_steps": 4205, "total_steps": 67140, "loss": 0.6705, "lr": 3.130771522192434e-05, "epoch": 0.6263032469466786, "percentage": 6.26, "elapsed_time": "0:17:11", "remaining_time": "4:17:21", "throughput": 2354.56, "total_tokens": 2429280} {"current_steps": 4210, "total_steps": 67140, "loss": 0.7299, "lr": 3.1344950848972296e-05, "epoch": 0.6270479594876378, "percentage": 6.27, "elapsed_time": "0:17:12", "remaining_time": "4:17:18", "throughput": 2354.64, "total_tokens": 2432000} {"current_steps": 4215, "total_steps": 67140, "loss": 0.6771, "lr": 3.138218647602026e-05, "epoch": 0.627792672028597, "percentage": 6.28, "elapsed_time": "0:17:14", "remaining_time": "4:17:17", "throughput": 2354.97, "total_tokens": 2435136} {"current_steps": 4220, "total_steps": 67140, "loss": 0.7533, "lr": 3.141942210306822e-05, "epoch": 0.6285373845695561, "percentage": 6.29, "elapsed_time": "0:17:15", "remaining_time": "4:17:14", "throughput": 2355.14, "total_tokens": 2437952} {"current_steps": 4225, "total_steps": 67140, "loss": 0.8902, "lr": 3.145665773011618e-05, "epoch": 0.6292820971105153, "percentage": 6.29, "elapsed_time": "0:17:16", "remaining_time": "4:17:12", "throughput": 2355.37, "total_tokens": 2440928} {"current_steps": 4230, "total_steps": 67140, "loss": 0.7494, "lr": 3.1493893357164135e-05, "epoch": 0.6300268096514745, "percentage": 6.3, "elapsed_time": "0:17:17", "remaining_time": "4:17:09", "throughput": 2355.6, "total_tokens": 2443808} {"current_steps": 4235, "total_steps": 67140, "loss": 0.5257, "lr": 3.153112898421209e-05, "epoch": 0.6307715221924337, "percentage": 6.31, "elapsed_time": "0:17:18", "remaining_time": "4:17:06", "throughput": 2355.6, "total_tokens": 2446400} {"current_steps": 4240, "total_steps": 67140, "loss": 0.7604, "lr": 3.1568364611260055e-05, "epoch": 0.6315162347333929, "percentage": 6.32, "elapsed_time": "0:17:19", "remaining_time": "4:17:03", "throughput": 2355.84, "total_tokens": 2449376} {"current_steps": 4245, "total_steps": 67140, "loss": 0.6765, "lr": 3.160560023830801e-05, "epoch": 0.6322609472743521, "percentage": 6.32, "elapsed_time": "0:17:20", "remaining_time": "4:17:01", "throughput": 2356.03, "total_tokens": 2452256} {"current_steps": 4250, "total_steps": 67140, "loss": 0.7117, "lr": 3.1642835865355975e-05, "epoch": 0.6330056598153113, "percentage": 6.33, "elapsed_time": "0:17:21", "remaining_time": "4:16:58", "throughput": 2356.15, "total_tokens": 2455040} {"current_steps": 4255, "total_steps": 67140, "loss": 0.9111, "lr": 3.168007149240393e-05, "epoch": 0.6337503723562705, "percentage": 6.34, "elapsed_time": "0:17:23", "remaining_time": "4:16:56", "throughput": 2356.38, "total_tokens": 2457952} {"current_steps": 4260, "total_steps": 67140, "loss": 0.6411, "lr": 3.1717307119451894e-05, "epoch": 0.6344950848972297, "percentage": 6.34, "elapsed_time": "0:17:24", "remaining_time": "4:16:54", "throughput": 2356.82, "total_tokens": 2461216} {"current_steps": 4265, "total_steps": 67140, "loss": 0.7378, "lr": 3.175454274649986e-05, "epoch": 0.6352397974381888, "percentage": 6.35, "elapsed_time": "0:17:25", "remaining_time": "4:16:52", "throughput": 2357.29, "total_tokens": 2464544} {"current_steps": 4270, "total_steps": 67140, "loss": 0.6937, "lr": 3.1791778373547814e-05, "epoch": 0.635984509979148, "percentage": 6.36, "elapsed_time": "0:17:26", "remaining_time": "4:16:50", "throughput": 2357.47, "total_tokens": 2467392} {"current_steps": 4275, "total_steps": 67140, "loss": 0.6715, "lr": 3.182901400059577e-05, "epoch": 0.6367292225201072, "percentage": 6.37, "elapsed_time": "0:17:27", "remaining_time": "4:16:47", "throughput": 2357.56, "total_tokens": 2470112} {"current_steps": 4280, "total_steps": 67140, "loss": 0.7028, "lr": 3.186624962764373e-05, "epoch": 0.6374739350610664, "percentage": 6.37, "elapsed_time": "0:17:28", "remaining_time": "4:16:44", "throughput": 2357.76, "total_tokens": 2472992} {"current_steps": 4285, "total_steps": 67140, "loss": 0.539, "lr": 3.190348525469169e-05, "epoch": 0.6382186476020256, "percentage": 6.38, "elapsed_time": "0:17:29", "remaining_time": "4:16:41", "throughput": 2357.93, "total_tokens": 2475808} {"current_steps": 4290, "total_steps": 67140, "loss": 0.7001, "lr": 3.1940720881739647e-05, "epoch": 0.6389633601429848, "percentage": 6.39, "elapsed_time": "0:17:31", "remaining_time": "4:16:39", "throughput": 2358.13, "total_tokens": 2478688} {"current_steps": 4295, "total_steps": 67140, "loss": 0.7709, "lr": 3.197795650878761e-05, "epoch": 0.639708072683944, "percentage": 6.4, "elapsed_time": "0:17:32", "remaining_time": "4:16:36", "throughput": 2358.19, "total_tokens": 2481344} {"current_steps": 4300, "total_steps": 67140, "loss": 0.7577, "lr": 3.201519213583557e-05, "epoch": 0.6404527852249032, "percentage": 6.4, "elapsed_time": "0:17:33", "remaining_time": "4:16:33", "throughput": 2358.27, "total_tokens": 2484064} {"current_steps": 4305, "total_steps": 67140, "loss": 0.7709, "lr": 3.205242776288353e-05, "epoch": 0.6411974977658623, "percentage": 6.41, "elapsed_time": "0:17:34", "remaining_time": "4:16:30", "throughput": 2358.38, "total_tokens": 2486784} {"current_steps": 4310, "total_steps": 67140, "loss": 0.5875, "lr": 3.208966338993149e-05, "epoch": 0.6419422103068215, "percentage": 6.42, "elapsed_time": "0:17:35", "remaining_time": "4:16:27", "throughput": 2358.53, "total_tokens": 2489568} {"current_steps": 4315, "total_steps": 67140, "loss": 0.8013, "lr": 3.212689901697944e-05, "epoch": 0.6426869228477807, "percentage": 6.43, "elapsed_time": "0:17:36", "remaining_time": "4:16:25", "throughput": 2358.74, "total_tokens": 2492512} {"current_steps": 4320, "total_steps": 67140, "loss": 0.6744, "lr": 3.2164134644027406e-05, "epoch": 0.6434316353887399, "percentage": 6.43, "elapsed_time": "0:17:37", "remaining_time": "4:16:22", "throughput": 2358.87, "total_tokens": 2495296} {"current_steps": 4325, "total_steps": 67140, "loss": 0.7392, "lr": 3.220137027107536e-05, "epoch": 0.6441763479296991, "percentage": 6.44, "elapsed_time": "0:17:38", "remaining_time": "4:16:20", "throughput": 2359.09, "total_tokens": 2498208} {"current_steps": 4330, "total_steps": 67140, "loss": 0.7204, "lr": 3.2238605898123325e-05, "epoch": 0.6449210604706583, "percentage": 6.45, "elapsed_time": "0:17:40", "remaining_time": "4:16:16", "throughput": 2359.11, "total_tokens": 2500800} {"current_steps": 4335, "total_steps": 67140, "loss": 0.715, "lr": 3.227584152517129e-05, "epoch": 0.6456657730116175, "percentage": 6.46, "elapsed_time": "0:17:41", "remaining_time": "4:16:14", "throughput": 2359.17, "total_tokens": 2503488} {"current_steps": 4340, "total_steps": 67140, "loss": 0.7227, "lr": 3.2313077152219245e-05, "epoch": 0.6464104855525767, "percentage": 6.46, "elapsed_time": "0:17:42", "remaining_time": "4:16:11", "throughput": 2359.34, "total_tokens": 2506272} {"current_steps": 4345, "total_steps": 67140, "loss": 0.5788, "lr": 3.235031277926721e-05, "epoch": 0.6471551980935359, "percentage": 6.47, "elapsed_time": "0:17:43", "remaining_time": "4:16:08", "throughput": 2359.43, "total_tokens": 2508992} {"current_steps": 4350, "total_steps": 67140, "loss": 0.7894, "lr": 3.2387548406315165e-05, "epoch": 0.647899910634495, "percentage": 6.48, "elapsed_time": "0:17:44", "remaining_time": "4:16:05", "throughput": 2359.38, "total_tokens": 2511488} {"current_steps": 4355, "total_steps": 67140, "loss": 0.6593, "lr": 3.242478403336313e-05, "epoch": 0.6486446231754542, "percentage": 6.49, "elapsed_time": "0:17:45", "remaining_time": "4:16:02", "throughput": 2359.61, "total_tokens": 2514432} {"current_steps": 4360, "total_steps": 67140, "loss": 0.7786, "lr": 3.246201966041108e-05, "epoch": 0.6493893357164134, "percentage": 6.49, "elapsed_time": "0:17:46", "remaining_time": "4:16:00", "throughput": 2360.03, "total_tokens": 2517664} {"current_steps": 4365, "total_steps": 67140, "loss": 0.7205, "lr": 3.249925528745904e-05, "epoch": 0.6501340482573726, "percentage": 6.5, "elapsed_time": "0:17:47", "remaining_time": "4:15:58", "throughput": 2360.29, "total_tokens": 2520608} {"current_steps": 4370, "total_steps": 67140, "loss": 0.7379, "lr": 3.2536490914507e-05, "epoch": 0.6508787607983318, "percentage": 6.51, "elapsed_time": "0:17:49", "remaining_time": "4:15:55", "throughput": 2360.51, "total_tokens": 2523520} {"current_steps": 4375, "total_steps": 67140, "loss": 0.7312, "lr": 3.257372654155496e-05, "epoch": 0.651623473339291, "percentage": 6.52, "elapsed_time": "0:17:50", "remaining_time": "4:15:53", "throughput": 2360.82, "total_tokens": 2526592} {"current_steps": 4380, "total_steps": 67140, "loss": 0.7325, "lr": 3.2610962168602924e-05, "epoch": 0.6523681858802503, "percentage": 6.52, "elapsed_time": "0:17:51", "remaining_time": "4:15:51", "throughput": 2361.15, "total_tokens": 2529728} {"current_steps": 4385, "total_steps": 67140, "loss": 0.7858, "lr": 3.264819779565088e-05, "epoch": 0.6531128984212095, "percentage": 6.53, "elapsed_time": "0:17:52", "remaining_time": "4:15:49", "throughput": 2361.29, "total_tokens": 2532544} {"current_steps": 4390, "total_steps": 67140, "loss": 0.7766, "lr": 3.2685433422698844e-05, "epoch": 0.6538576109621687, "percentage": 6.54, "elapsed_time": "0:17:53", "remaining_time": "4:15:46", "throughput": 2361.44, "total_tokens": 2535328} {"current_steps": 4395, "total_steps": 67140, "loss": 0.7692, "lr": 3.27226690497468e-05, "epoch": 0.6546023235031277, "percentage": 6.55, "elapsed_time": "0:17:54", "remaining_time": "4:15:44", "throughput": 2361.64, "total_tokens": 2538240} {"current_steps": 4400, "total_steps": 67140, "loss": 0.7203, "lr": 3.275990467679476e-05, "epoch": 0.655347036044087, "percentage": 6.55, "elapsed_time": "0:17:55", "remaining_time": "4:15:41", "throughput": 2361.72, "total_tokens": 2540960} {"current_steps": 4405, "total_steps": 67140, "loss": 0.7368, "lr": 3.279714030384271e-05, "epoch": 0.6560917485850462, "percentage": 6.56, "elapsed_time": "0:17:57", "remaining_time": "4:15:38", "throughput": 2361.89, "total_tokens": 2543776} {"current_steps": 4410, "total_steps": 67140, "loss": 0.7714, "lr": 3.2834375930890676e-05, "epoch": 0.6568364611260054, "percentage": 6.57, "elapsed_time": "0:17:58", "remaining_time": "4:15:35", "throughput": 2362.06, "total_tokens": 2546624} {"current_steps": 4415, "total_steps": 67140, "loss": 0.685, "lr": 3.287161155793864e-05, "epoch": 0.6575811736669646, "percentage": 6.58, "elapsed_time": "0:17:59", "remaining_time": "4:15:33", "throughput": 2362.2, "total_tokens": 2549408} {"current_steps": 4420, "total_steps": 67140, "loss": 0.691, "lr": 3.2908847184986596e-05, "epoch": 0.6583258862079238, "percentage": 6.58, "elapsed_time": "0:18:00", "remaining_time": "4:15:30", "throughput": 2362.45, "total_tokens": 2552384} {"current_steps": 4425, "total_steps": 67140, "loss": 0.8017, "lr": 3.294608281203456e-05, "epoch": 0.659070598748883, "percentage": 6.59, "elapsed_time": "0:18:01", "remaining_time": "4:15:28", "throughput": 2362.6, "total_tokens": 2555200} {"current_steps": 4430, "total_steps": 67140, "loss": 0.7271, "lr": 3.2983318439082516e-05, "epoch": 0.6598153112898422, "percentage": 6.6, "elapsed_time": "0:18:02", "remaining_time": "4:15:25", "throughput": 2362.86, "total_tokens": 2558176} {"current_steps": 4435, "total_steps": 67140, "loss": 0.7585, "lr": 3.302055406613048e-05, "epoch": 0.6605600238308013, "percentage": 6.61, "elapsed_time": "0:18:03", "remaining_time": "4:15:23", "throughput": 2363.16, "total_tokens": 2561248} {"current_steps": 4440, "total_steps": 67140, "loss": 0.7144, "lr": 3.3057789693178435e-05, "epoch": 0.6613047363717605, "percentage": 6.61, "elapsed_time": "0:18:05", "remaining_time": "4:15:22", "throughput": 2363.46, "total_tokens": 2564384} {"current_steps": 4445, "total_steps": 67140, "loss": 0.6774, "lr": 3.309502532022639e-05, "epoch": 0.6620494489127197, "percentage": 6.62, "elapsed_time": "0:18:06", "remaining_time": "4:15:19", "throughput": 2363.48, "total_tokens": 2567008} {"current_steps": 4450, "total_steps": 67140, "loss": 0.8689, "lr": 3.313226094727435e-05, "epoch": 0.6627941614536789, "percentage": 6.63, "elapsed_time": "0:18:07", "remaining_time": "4:15:16", "throughput": 2363.7, "total_tokens": 2569952} {"current_steps": 4455, "total_steps": 67140, "loss": 0.706, "lr": 3.316949657432231e-05, "epoch": 0.6635388739946381, "percentage": 6.64, "elapsed_time": "0:18:08", "remaining_time": "4:15:14", "throughput": 2363.88, "total_tokens": 2572832} {"current_steps": 4460, "total_steps": 67140, "loss": 0.6171, "lr": 3.3206732201370275e-05, "epoch": 0.6642835865355973, "percentage": 6.64, "elapsed_time": "0:18:09", "remaining_time": "4:15:11", "throughput": 2363.98, "total_tokens": 2575584} {"current_steps": 4465, "total_steps": 67140, "loss": 0.7488, "lr": 3.324396782841823e-05, "epoch": 0.6650282990765565, "percentage": 6.65, "elapsed_time": "0:18:10", "remaining_time": "4:15:09", "throughput": 2364.26, "total_tokens": 2578656} {"current_steps": 4470, "total_steps": 67140, "loss": 0.6083, "lr": 3.3281203455466195e-05, "epoch": 0.6657730116175157, "percentage": 6.66, "elapsed_time": "0:18:11", "remaining_time": "4:15:07", "throughput": 2364.41, "total_tokens": 2581472} {"current_steps": 4475, "total_steps": 67140, "loss": 0.7682, "lr": 3.331843908251415e-05, "epoch": 0.6665177241584749, "percentage": 6.67, "elapsed_time": "0:18:12", "remaining_time": "4:15:05", "throughput": 2364.58, "total_tokens": 2584384} {"current_steps": 4480, "total_steps": 67140, "loss": 0.6685, "lr": 3.3355674709562114e-05, "epoch": 0.667262436699434, "percentage": 6.67, "elapsed_time": "0:18:14", "remaining_time": "4:15:02", "throughput": 2364.7, "total_tokens": 2587136} {"current_steps": 4485, "total_steps": 67140, "loss": 0.8553, "lr": 3.339291033661007e-05, "epoch": 0.6680071492403932, "percentage": 6.68, "elapsed_time": "0:18:15", "remaining_time": "4:15:00", "throughput": 2364.97, "total_tokens": 2590176} {"current_steps": 4490, "total_steps": 67140, "loss": 0.7288, "lr": 3.343014596365803e-05, "epoch": 0.6687518617813524, "percentage": 6.69, "elapsed_time": "0:18:16", "remaining_time": "4:14:57", "throughput": 2365.06, "total_tokens": 2592896} {"current_steps": 4495, "total_steps": 67140, "loss": 0.6581, "lr": 3.346738159070599e-05, "epoch": 0.6694965743223116, "percentage": 6.69, "elapsed_time": "0:18:17", "remaining_time": "4:14:54", "throughput": 2365.13, "total_tokens": 2595616} {"current_steps": 4500, "total_steps": 67140, "loss": 0.8386, "lr": 3.350461721775395e-05, "epoch": 0.6702412868632708, "percentage": 6.7, "elapsed_time": "0:18:18", "remaining_time": "4:14:52", "throughput": 2365.33, "total_tokens": 2598528} {"current_steps": 4505, "total_steps": 67140, "loss": 0.8396, "lr": 3.354185284480191e-05, "epoch": 0.67098599940423, "percentage": 6.71, "elapsed_time": "0:18:19", "remaining_time": "4:14:49", "throughput": 2365.54, "total_tokens": 2601440} {"current_steps": 4510, "total_steps": 67140, "loss": 0.7021, "lr": 3.3579088471849867e-05, "epoch": 0.6717307119451892, "percentage": 6.72, "elapsed_time": "0:18:20", "remaining_time": "4:14:47", "throughput": 2365.81, "total_tokens": 2604480} {"current_steps": 4515, "total_steps": 67140, "loss": 0.7315, "lr": 3.361632409889783e-05, "epoch": 0.6724754244861484, "percentage": 6.72, "elapsed_time": "0:18:22", "remaining_time": "4:14:45", "throughput": 2366.06, "total_tokens": 2607456} {"current_steps": 4520, "total_steps": 67140, "loss": 0.7012, "lr": 3.3653559725945786e-05, "epoch": 0.6732201370271076, "percentage": 6.73, "elapsed_time": "0:18:23", "remaining_time": "4:14:43", "throughput": 2366.19, "total_tokens": 2610304} {"current_steps": 4525, "total_steps": 67140, "loss": 0.6915, "lr": 3.369079535299375e-05, "epoch": 0.6739648495680667, "percentage": 6.74, "elapsed_time": "0:18:24", "remaining_time": "4:14:40", "throughput": 2366.24, "total_tokens": 2612960} {"current_steps": 4530, "total_steps": 67140, "loss": 0.6026, "lr": 3.3728030980041706e-05, "epoch": 0.6747095621090259, "percentage": 6.75, "elapsed_time": "0:18:25", "remaining_time": "4:14:36", "throughput": 2366.2, "total_tokens": 2615424} {"current_steps": 4535, "total_steps": 67140, "loss": 0.7894, "lr": 3.376526660708966e-05, "epoch": 0.6754542746499851, "percentage": 6.75, "elapsed_time": "0:18:26", "remaining_time": "4:14:34", "throughput": 2366.48, "total_tokens": 2618496} {"current_steps": 4540, "total_steps": 67140, "loss": 0.7653, "lr": 3.3802502234137626e-05, "epoch": 0.6761989871909443, "percentage": 6.76, "elapsed_time": "0:18:27", "remaining_time": "4:14:32", "throughput": 2366.6, "total_tokens": 2621280} {"current_steps": 4545, "total_steps": 67140, "loss": 0.7211, "lr": 3.383973786118558e-05, "epoch": 0.6769436997319035, "percentage": 6.77, "elapsed_time": "0:18:28", "remaining_time": "4:14:29", "throughput": 2366.71, "total_tokens": 2624000} {"current_steps": 4550, "total_steps": 67140, "loss": 0.6447, "lr": 3.3876973488233545e-05, "epoch": 0.6776884122728627, "percentage": 6.78, "elapsed_time": "0:18:29", "remaining_time": "4:14:27", "throughput": 2366.94, "total_tokens": 2626976} {"current_steps": 4555, "total_steps": 67140, "loss": 0.6497, "lr": 3.39142091152815e-05, "epoch": 0.6784331248138219, "percentage": 6.78, "elapsed_time": "0:18:31", "remaining_time": "4:14:25", "throughput": 2367.07, "total_tokens": 2629824} {"current_steps": 4560, "total_steps": 67140, "loss": 0.7676, "lr": 3.3951444742329465e-05, "epoch": 0.6791778373547811, "percentage": 6.79, "elapsed_time": "0:18:32", "remaining_time": "4:14:22", "throughput": 2367.19, "total_tokens": 2632608} {"current_steps": 4565, "total_steps": 67140, "loss": 0.6547, "lr": 3.398868036937742e-05, "epoch": 0.6799225498957402, "percentage": 6.8, "elapsed_time": "0:18:33", "remaining_time": "4:14:20", "throughput": 2367.44, "total_tokens": 2635616} {"current_steps": 4570, "total_steps": 67140, "loss": 0.742, "lr": 3.4025915996425385e-05, "epoch": 0.6806672624366994, "percentage": 6.81, "elapsed_time": "0:18:34", "remaining_time": "4:14:18", "throughput": 2367.81, "total_tokens": 2638848} {"current_steps": 4575, "total_steps": 67140, "loss": 0.7296, "lr": 3.406315162347334e-05, "epoch": 0.6814119749776586, "percentage": 6.81, "elapsed_time": "0:18:35", "remaining_time": "4:14:16", "throughput": 2367.95, "total_tokens": 2641664} {"current_steps": 4580, "total_steps": 67140, "loss": 0.8011, "lr": 3.41003872505213e-05, "epoch": 0.6821566875186178, "percentage": 6.82, "elapsed_time": "0:18:36", "remaining_time": "4:14:14", "throughput": 2368.34, "total_tokens": 2644864} {"current_steps": 4585, "total_steps": 67140, "loss": 0.8507, "lr": 3.413762287756926e-05, "epoch": 0.682901400059577, "percentage": 6.83, "elapsed_time": "0:18:37", "remaining_time": "4:14:11", "throughput": 2368.58, "total_tokens": 2647840} {"current_steps": 4590, "total_steps": 67140, "loss": 0.7155, "lr": 3.417485850461722e-05, "epoch": 0.6836461126005362, "percentage": 6.84, "elapsed_time": "0:18:39", "remaining_time": "4:14:09", "throughput": 2368.85, "total_tokens": 2650848} {"current_steps": 4595, "total_steps": 67140, "loss": 0.716, "lr": 3.421209413166518e-05, "epoch": 0.6843908251414954, "percentage": 6.84, "elapsed_time": "0:18:40", "remaining_time": "4:14:06", "throughput": 2368.91, "total_tokens": 2653536} {"current_steps": 4600, "total_steps": 67140, "loss": 0.6634, "lr": 3.424932975871314e-05, "epoch": 0.6851355376824546, "percentage": 6.85, "elapsed_time": "0:18:41", "remaining_time": "4:14:04", "throughput": 2369.17, "total_tokens": 2656576} {"current_steps": 4605, "total_steps": 67140, "loss": 0.7074, "lr": 3.42865653857611e-05, "epoch": 0.6858802502234138, "percentage": 6.86, "elapsed_time": "0:18:42", "remaining_time": "4:14:03", "throughput": 2369.55, "total_tokens": 2659776} {"current_steps": 4610, "total_steps": 67140, "loss": 0.7506, "lr": 3.432380101280906e-05, "epoch": 0.6866249627643729, "percentage": 6.87, "elapsed_time": "0:18:43", "remaining_time": "4:14:00", "throughput": 2369.76, "total_tokens": 2662720} {"current_steps": 4615, "total_steps": 67140, "loss": 0.6584, "lr": 3.436103663985702e-05, "epoch": 0.6873696753053321, "percentage": 6.87, "elapsed_time": "0:18:44", "remaining_time": "4:13:58", "throughput": 2369.83, "total_tokens": 2665440} {"current_steps": 4620, "total_steps": 67140, "loss": 0.7512, "lr": 3.4398272266904977e-05, "epoch": 0.6881143878462913, "percentage": 6.88, "elapsed_time": "0:18:45", "remaining_time": "4:13:55", "throughput": 2369.95, "total_tokens": 2668224} {"current_steps": 4625, "total_steps": 67140, "loss": 0.6636, "lr": 3.443550789395293e-05, "epoch": 0.6888591003872505, "percentage": 6.89, "elapsed_time": "0:18:46", "remaining_time": "4:13:53", "throughput": 2370.09, "total_tokens": 2671040} {"current_steps": 4630, "total_steps": 67140, "loss": 0.8123, "lr": 3.4472743521000896e-05, "epoch": 0.6896038129282097, "percentage": 6.9, "elapsed_time": "0:18:48", "remaining_time": "4:13:50", "throughput": 2370.2, "total_tokens": 2673792} {"current_steps": 4635, "total_steps": 67140, "loss": 0.741, "lr": 3.450997914804885e-05, "epoch": 0.6903485254691689, "percentage": 6.9, "elapsed_time": "0:18:49", "remaining_time": "4:13:47", "throughput": 2370.39, "total_tokens": 2676672} {"current_steps": 4640, "total_steps": 67140, "loss": 0.5918, "lr": 3.4547214775096816e-05, "epoch": 0.6910932380101281, "percentage": 6.91, "elapsed_time": "0:18:50", "remaining_time": "4:13:45", "throughput": 2370.5, "total_tokens": 2679424} {"current_steps": 4645, "total_steps": 67140, "loss": 0.8578, "lr": 3.458445040214477e-05, "epoch": 0.6918379505510873, "percentage": 6.92, "elapsed_time": "0:18:51", "remaining_time": "4:13:42", "throughput": 2370.62, "total_tokens": 2682240} {"current_steps": 4650, "total_steps": 67140, "loss": 0.8188, "lr": 3.4621686029192736e-05, "epoch": 0.6925826630920465, "percentage": 6.93, "elapsed_time": "0:18:52", "remaining_time": "4:13:41", "throughput": 2370.91, "total_tokens": 2685376} {"current_steps": 4655, "total_steps": 67140, "loss": 0.6689, "lr": 3.465892165624069e-05, "epoch": 0.6933273756330056, "percentage": 6.93, "elapsed_time": "0:18:53", "remaining_time": "4:13:38", "throughput": 2370.92, "total_tokens": 2687968} {"current_steps": 4660, "total_steps": 67140, "loss": 0.7532, "lr": 3.4696157283288655e-05, "epoch": 0.6940720881739648, "percentage": 6.94, "elapsed_time": "0:18:54", "remaining_time": "4:13:35", "throughput": 2370.96, "total_tokens": 2690624} {"current_steps": 4665, "total_steps": 67140, "loss": 0.7169, "lr": 3.473339291033661e-05, "epoch": 0.694816800714924, "percentage": 6.95, "elapsed_time": "0:18:55", "remaining_time": "4:13:33", "throughput": 2371.21, "total_tokens": 2693664} {"current_steps": 4670, "total_steps": 67140, "loss": 0.7857, "lr": 3.477062853738457e-05, "epoch": 0.6955615132558832, "percentage": 6.96, "elapsed_time": "0:18:57", "remaining_time": "4:13:31", "throughput": 2371.38, "total_tokens": 2696576} {"current_steps": 4675, "total_steps": 67140, "loss": 0.7027, "lr": 3.480786416443253e-05, "epoch": 0.6963062257968424, "percentage": 6.96, "elapsed_time": "0:18:58", "remaining_time": "4:13:29", "throughput": 2371.56, "total_tokens": 2699488} {"current_steps": 4680, "total_steps": 67140, "loss": 0.7812, "lr": 3.484509979148049e-05, "epoch": 0.6970509383378016, "percentage": 6.97, "elapsed_time": "0:18:59", "remaining_time": "4:13:26", "throughput": 2371.72, "total_tokens": 2702336} {"current_steps": 4685, "total_steps": 67140, "loss": 0.7525, "lr": 3.488233541852845e-05, "epoch": 0.6977956508787608, "percentage": 6.98, "elapsed_time": "0:19:00", "remaining_time": "4:13:24", "throughput": 2371.85, "total_tokens": 2705152} {"current_steps": 4690, "total_steps": 67140, "loss": 0.7198, "lr": 3.491957104557641e-05, "epoch": 0.69854036341972, "percentage": 6.99, "elapsed_time": "0:19:01", "remaining_time": "4:13:21", "throughput": 2372.05, "total_tokens": 2708096} {"current_steps": 4695, "total_steps": 67140, "loss": 0.6827, "lr": 3.495680667262437e-05, "epoch": 0.6992850759606791, "percentage": 6.99, "elapsed_time": "0:19:02", "remaining_time": "4:13:19", "throughput": 2372.21, "total_tokens": 2710944} {"current_steps": 4700, "total_steps": 67140, "loss": 0.7331, "lr": 3.499404229967233e-05, "epoch": 0.7000297885016383, "percentage": 7.0, "elapsed_time": "0:19:03", "remaining_time": "4:13:16", "throughput": 2372.27, "total_tokens": 2713664} {"current_steps": 4705, "total_steps": 67140, "loss": 0.6231, "lr": 3.5031277926720284e-05, "epoch": 0.7007745010425975, "percentage": 7.01, "elapsed_time": "0:19:05", "remaining_time": "4:13:15", "throughput": 2372.61, "total_tokens": 2716896} {"current_steps": 4710, "total_steps": 67140, "loss": 0.5415, "lr": 3.506851355376825e-05, "epoch": 0.7015192135835567, "percentage": 7.02, "elapsed_time": "0:19:06", "remaining_time": "4:13:12", "throughput": 2372.69, "total_tokens": 2719584} {"current_steps": 4715, "total_steps": 67140, "loss": 0.7384, "lr": 3.5105749180816204e-05, "epoch": 0.7022639261245159, "percentage": 7.02, "elapsed_time": "0:19:07", "remaining_time": "4:13:09", "throughput": 2372.77, "total_tokens": 2722304} {"current_steps": 4720, "total_steps": 67140, "loss": 0.7865, "lr": 3.514298480786417e-05, "epoch": 0.7030086386654751, "percentage": 7.03, "elapsed_time": "0:19:08", "remaining_time": "4:13:07", "throughput": 2372.85, "total_tokens": 2724992} {"current_steps": 4725, "total_steps": 67140, "loss": 0.8204, "lr": 3.518022043491212e-05, "epoch": 0.7037533512064343, "percentage": 7.04, "elapsed_time": "0:19:09", "remaining_time": "4:13:04", "throughput": 2372.87, "total_tokens": 2727648} {"current_steps": 4730, "total_steps": 67140, "loss": 0.7808, "lr": 3.5217456061960087e-05, "epoch": 0.7044980637473935, "percentage": 7.04, "elapsed_time": "0:19:10", "remaining_time": "4:13:02", "throughput": 2373.05, "total_tokens": 2730560} {"current_steps": 4735, "total_steps": 67140, "loss": 0.7229, "lr": 3.525469168900804e-05, "epoch": 0.7052427762883527, "percentage": 7.05, "elapsed_time": "0:19:11", "remaining_time": "4:13:00", "throughput": 2373.21, "total_tokens": 2733440} {"current_steps": 4740, "total_steps": 67140, "loss": 0.7768, "lr": 3.5291927316056006e-05, "epoch": 0.7059874888293118, "percentage": 7.06, "elapsed_time": "0:19:12", "remaining_time": "4:12:57", "throughput": 2373.39, "total_tokens": 2736320} {"current_steps": 4745, "total_steps": 67140, "loss": 0.801, "lr": 3.532916294310397e-05, "epoch": 0.706732201370271, "percentage": 7.07, "elapsed_time": "0:19:14", "remaining_time": "4:12:55", "throughput": 2373.51, "total_tokens": 2739136} {"current_steps": 4750, "total_steps": 67140, "loss": 0.7386, "lr": 3.536639857015192e-05, "epoch": 0.7074769139112302, "percentage": 7.07, "elapsed_time": "0:19:15", "remaining_time": "4:12:53", "throughput": 2373.75, "total_tokens": 2742176} {"current_steps": 4755, "total_steps": 67140, "loss": 0.6704, "lr": 3.540363419719988e-05, "epoch": 0.7082216264521894, "percentage": 7.08, "elapsed_time": "0:19:16", "remaining_time": "4:12:50", "throughput": 2373.93, "total_tokens": 2745056} {"current_steps": 4760, "total_steps": 67140, "loss": 0.7491, "lr": 3.544086982424784e-05, "epoch": 0.7089663389931486, "percentage": 7.09, "elapsed_time": "0:19:17", "remaining_time": "4:12:49", "throughput": 2374.17, "total_tokens": 2748128} {"current_steps": 4765, "total_steps": 67140, "loss": 0.7492, "lr": 3.54781054512958e-05, "epoch": 0.7097110515341079, "percentage": 7.1, "elapsed_time": "0:19:18", "remaining_time": "4:12:46", "throughput": 2374.35, "total_tokens": 2751008} {"current_steps": 4770, "total_steps": 67140, "loss": 0.5936, "lr": 3.551534107834376e-05, "epoch": 0.710455764075067, "percentage": 7.1, "elapsed_time": "0:19:19", "remaining_time": "4:12:44", "throughput": 2374.58, "total_tokens": 2754016} {"current_steps": 4775, "total_steps": 67140, "loss": 0.6392, "lr": 3.555257670539172e-05, "epoch": 0.7112004766160263, "percentage": 7.11, "elapsed_time": "0:19:20", "remaining_time": "4:12:43", "throughput": 2374.97, "total_tokens": 2757248} {"current_steps": 4780, "total_steps": 67140, "loss": 0.7411, "lr": 3.558981233243968e-05, "epoch": 0.7119451891569855, "percentage": 7.12, "elapsed_time": "0:19:22", "remaining_time": "4:12:40", "throughput": 2375.14, "total_tokens": 2760128} {"current_steps": 4785, "total_steps": 67140, "loss": 0.8021, "lr": 3.562704795948764e-05, "epoch": 0.7126899016979446, "percentage": 7.13, "elapsed_time": "0:19:23", "remaining_time": "4:12:38", "throughput": 2375.36, "total_tokens": 2763136} {"current_steps": 4790, "total_steps": 67140, "loss": 0.733, "lr": 3.56642835865356e-05, "epoch": 0.7134346142389038, "percentage": 7.13, "elapsed_time": "0:19:24", "remaining_time": "4:12:36", "throughput": 2375.43, "total_tokens": 2765856} {"current_steps": 4795, "total_steps": 67140, "loss": 0.5814, "lr": 3.5701519213583554e-05, "epoch": 0.714179326779863, "percentage": 7.14, "elapsed_time": "0:19:25", "remaining_time": "4:12:34", "throughput": 2375.65, "total_tokens": 2768864} {"current_steps": 4800, "total_steps": 67140, "loss": 0.5802, "lr": 3.573875484063152e-05, "epoch": 0.7149240393208222, "percentage": 7.15, "elapsed_time": "0:19:26", "remaining_time": "4:12:31", "throughput": 2375.67, "total_tokens": 2771520} {"current_steps": 4805, "total_steps": 67140, "loss": 0.6339, "lr": 3.5775990467679474e-05, "epoch": 0.7156687518617814, "percentage": 7.16, "elapsed_time": "0:19:27", "remaining_time": "4:12:29", "throughput": 2375.91, "total_tokens": 2774560} {"current_steps": 4810, "total_steps": 67140, "loss": 0.7092, "lr": 3.581322609472744e-05, "epoch": 0.7164134644027406, "percentage": 7.16, "elapsed_time": "0:19:28", "remaining_time": "4:12:27", "throughput": 2375.99, "total_tokens": 2777312} {"current_steps": 4815, "total_steps": 67140, "loss": 0.6708, "lr": 3.5850461721775394e-05, "epoch": 0.7171581769436998, "percentage": 7.17, "elapsed_time": "0:19:30", "remaining_time": "4:12:24", "throughput": 2376.09, "total_tokens": 2780128} {"current_steps": 4820, "total_steps": 67140, "loss": 0.697, "lr": 3.588769734882336e-05, "epoch": 0.717902889484659, "percentage": 7.18, "elapsed_time": "0:19:31", "remaining_time": "4:12:23", "throughput": 2376.36, "total_tokens": 2783200} {"current_steps": 4825, "total_steps": 67140, "loss": 0.6567, "lr": 3.592493297587132e-05, "epoch": 0.7186476020256181, "percentage": 7.19, "elapsed_time": "0:19:32", "remaining_time": "4:12:20", "throughput": 2376.48, "total_tokens": 2786048} {"current_steps": 4830, "total_steps": 67140, "loss": 0.788, "lr": 3.596216860291928e-05, "epoch": 0.7193923145665773, "percentage": 7.19, "elapsed_time": "0:19:33", "remaining_time": "4:12:18", "throughput": 2376.61, "total_tokens": 2788864} {"current_steps": 4835, "total_steps": 67140, "loss": 0.8028, "lr": 3.599940422996723e-05, "epoch": 0.7201370271075365, "percentage": 7.2, "elapsed_time": "0:19:34", "remaining_time": "4:12:15", "throughput": 2376.66, "total_tokens": 2791552} {"current_steps": 4840, "total_steps": 67140, "loss": 0.6403, "lr": 3.603663985701519e-05, "epoch": 0.7208817396484957, "percentage": 7.21, "elapsed_time": "0:19:35", "remaining_time": "4:12:13", "throughput": 2376.86, "total_tokens": 2794528} {"current_steps": 4845, "total_steps": 67140, "loss": 0.697, "lr": 3.607387548406315e-05, "epoch": 0.7216264521894549, "percentage": 7.22, "elapsed_time": "0:19:36", "remaining_time": "4:12:11", "throughput": 2376.96, "total_tokens": 2797280} {"current_steps": 4850, "total_steps": 67140, "loss": 0.7504, "lr": 3.611111111111111e-05, "epoch": 0.7223711647304141, "percentage": 7.22, "elapsed_time": "0:19:37", "remaining_time": "4:12:08", "throughput": 2376.96, "total_tokens": 2799872} {"current_steps": 4855, "total_steps": 67140, "loss": 0.7559, "lr": 3.614834673815907e-05, "epoch": 0.7231158772713733, "percentage": 7.23, "elapsed_time": "0:19:39", "remaining_time": "4:12:05", "throughput": 2377.02, "total_tokens": 2802560} {"current_steps": 4860, "total_steps": 67140, "loss": 0.7494, "lr": 3.618558236520703e-05, "epoch": 0.7238605898123325, "percentage": 7.24, "elapsed_time": "0:19:40", "remaining_time": "4:12:03", "throughput": 2377.23, "total_tokens": 2805536} {"current_steps": 4865, "total_steps": 67140, "loss": 0.8183, "lr": 3.622281799225499e-05, "epoch": 0.7246053023532917, "percentage": 7.25, "elapsed_time": "0:19:41", "remaining_time": "4:12:01", "throughput": 2377.47, "total_tokens": 2808576} {"current_steps": 4870, "total_steps": 67140, "loss": 0.6468, "lr": 3.6260053619302956e-05, "epoch": 0.7253500148942508, "percentage": 7.25, "elapsed_time": "0:19:42", "remaining_time": "4:11:59", "throughput": 2377.74, "total_tokens": 2811680} {"current_steps": 4875, "total_steps": 67140, "loss": 0.6152, "lr": 3.629728924635091e-05, "epoch": 0.72609472743521, "percentage": 7.26, "elapsed_time": "0:19:43", "remaining_time": "4:11:57", "throughput": 2377.88, "total_tokens": 2814528} {"current_steps": 4880, "total_steps": 67140, "loss": 0.7942, "lr": 3.633452487339887e-05, "epoch": 0.7268394399761692, "percentage": 7.27, "elapsed_time": "0:19:44", "remaining_time": "4:11:54", "throughput": 2377.86, "total_tokens": 2817056} {"current_steps": 4885, "total_steps": 67140, "loss": 0.6934, "lr": 3.6371760500446825e-05, "epoch": 0.7275841525171284, "percentage": 7.28, "elapsed_time": "0:19:45", "remaining_time": "4:11:52", "throughput": 2378.08, "total_tokens": 2820032} {"current_steps": 4890, "total_steps": 67140, "loss": 0.8595, "lr": 3.640899612749479e-05, "epoch": 0.7283288650580876, "percentage": 7.28, "elapsed_time": "0:19:46", "remaining_time": "4:11:50", "throughput": 2378.13, "total_tokens": 2822752} {"current_steps": 4895, "total_steps": 67140, "loss": 0.5606, "lr": 3.6446231754542745e-05, "epoch": 0.7290735775990468, "percentage": 7.29, "elapsed_time": "0:19:48", "remaining_time": "4:11:47", "throughput": 2378.27, "total_tokens": 2825568} {"current_steps": 4900, "total_steps": 67140, "loss": 0.5269, "lr": 3.648346738159071e-05, "epoch": 0.729818290140006, "percentage": 7.3, "elapsed_time": "0:19:49", "remaining_time": "4:11:45", "throughput": 2378.48, "total_tokens": 2828576} {"current_steps": 4905, "total_steps": 67140, "loss": 0.7011, "lr": 3.652070300863867e-05, "epoch": 0.7305630026809652, "percentage": 7.31, "elapsed_time": "0:19:50", "remaining_time": "4:11:43", "throughput": 2378.6, "total_tokens": 2831360} {"current_steps": 4910, "total_steps": 67140, "loss": 1.099, "lr": 3.655793863568663e-05, "epoch": 0.7313077152219244, "percentage": 7.31, "elapsed_time": "0:19:51", "remaining_time": "4:11:40", "throughput": 2378.59, "total_tokens": 2833952} {"current_steps": 4915, "total_steps": 67140, "loss": 0.7857, "lr": 3.659517426273459e-05, "epoch": 0.7320524277628835, "percentage": 7.32, "elapsed_time": "0:19:52", "remaining_time": "4:11:39", "throughput": 2378.98, "total_tokens": 2837280} {"current_steps": 4920, "total_steps": 67140, "loss": 0.7273, "lr": 3.663240988978254e-05, "epoch": 0.7327971403038427, "percentage": 7.33, "elapsed_time": "0:19:53", "remaining_time": "4:11:36", "throughput": 2379.05, "total_tokens": 2840000} {"current_steps": 4925, "total_steps": 67140, "loss": 0.7457, "lr": 3.6669645516830504e-05, "epoch": 0.7335418528448019, "percentage": 7.34, "elapsed_time": "0:19:54", "remaining_time": "4:11:34", "throughput": 2379.22, "total_tokens": 2842912} {"current_steps": 4930, "total_steps": 67140, "loss": 0.8084, "lr": 3.670688114387846e-05, "epoch": 0.7342865653857611, "percentage": 7.34, "elapsed_time": "0:19:56", "remaining_time": "4:11:32", "throughput": 2379.46, "total_tokens": 2845952} {"current_steps": 4935, "total_steps": 67140, "loss": 0.7172, "lr": 3.6744116770926424e-05, "epoch": 0.7350312779267203, "percentage": 7.35, "elapsed_time": "0:19:57", "remaining_time": "4:11:30", "throughput": 2379.54, "total_tokens": 2848736} {"current_steps": 4940, "total_steps": 67140, "loss": 0.614, "lr": 3.678135239797439e-05, "epoch": 0.7357759904676795, "percentage": 7.36, "elapsed_time": "0:19:58", "remaining_time": "4:11:28", "throughput": 2379.68, "total_tokens": 2851616} {"current_steps": 4945, "total_steps": 67140, "loss": 0.8591, "lr": 3.681858802502234e-05, "epoch": 0.7365207030086387, "percentage": 7.37, "elapsed_time": "0:19:59", "remaining_time": "4:11:25", "throughput": 2379.75, "total_tokens": 2854368} {"current_steps": 4950, "total_steps": 67140, "loss": 0.789, "lr": 3.6855823652070307e-05, "epoch": 0.7372654155495979, "percentage": 7.37, "elapsed_time": "0:20:00", "remaining_time": "4:11:23", "throughput": 2379.96, "total_tokens": 2857312} {"current_steps": 4955, "total_steps": 67140, "loss": 0.6065, "lr": 3.689305927911826e-05, "epoch": 0.738010128090557, "percentage": 7.38, "elapsed_time": "0:20:01", "remaining_time": "4:11:21", "throughput": 2380.17, "total_tokens": 2860320} {"current_steps": 4960, "total_steps": 67140, "loss": 0.6358, "lr": 3.6930294906166226e-05, "epoch": 0.7387548406315162, "percentage": 7.39, "elapsed_time": "0:20:02", "remaining_time": "4:11:19", "throughput": 2380.26, "total_tokens": 2863072} {"current_steps": 4965, "total_steps": 67140, "loss": 0.7943, "lr": 3.6967530533214176e-05, "epoch": 0.7394995531724754, "percentage": 7.39, "elapsed_time": "0:20:03", "remaining_time": "4:11:17", "throughput": 2380.5, "total_tokens": 2866112} {"current_steps": 4970, "total_steps": 67140, "loss": 0.8172, "lr": 3.700476616026214e-05, "epoch": 0.7402442657134346, "percentage": 7.4, "elapsed_time": "0:20:05", "remaining_time": "4:11:14", "throughput": 2380.64, "total_tokens": 2868960} {"current_steps": 4975, "total_steps": 67140, "loss": 0.8055, "lr": 3.7042001787310096e-05, "epoch": 0.7409889782543938, "percentage": 7.41, "elapsed_time": "0:20:06", "remaining_time": "4:11:12", "throughput": 2380.71, "total_tokens": 2871680} {"current_steps": 4980, "total_steps": 67140, "loss": 0.7117, "lr": 3.707923741435806e-05, "epoch": 0.741733690795353, "percentage": 7.42, "elapsed_time": "0:20:07", "remaining_time": "4:11:10", "throughput": 2380.82, "total_tokens": 2874496} {"current_steps": 4985, "total_steps": 67140, "loss": 0.8237, "lr": 3.711647304140602e-05, "epoch": 0.7424784033363122, "percentage": 7.42, "elapsed_time": "0:20:08", "remaining_time": "4:11:08", "throughput": 2381.04, "total_tokens": 2877536} {"current_steps": 4990, "total_steps": 67140, "loss": 0.8033, "lr": 3.715370866845398e-05, "epoch": 0.7432231158772714, "percentage": 7.43, "elapsed_time": "0:20:09", "remaining_time": "4:11:06", "throughput": 2381.2, "total_tokens": 2880480} {"current_steps": 4995, "total_steps": 67140, "loss": 0.6877, "lr": 3.719094429550194e-05, "epoch": 0.7439678284182306, "percentage": 7.44, "elapsed_time": "0:20:10", "remaining_time": "4:11:04", "throughput": 2381.31, "total_tokens": 2883296} {"current_steps": 5000, "total_steps": 67140, "loss": 0.7637, "lr": 3.72281799225499e-05, "epoch": 0.7447125409591897, "percentage": 7.45, "elapsed_time": "0:20:11", "remaining_time": "4:11:01", "throughput": 2381.27, "total_tokens": 2885824} {"current_steps": 5005, "total_steps": 67140, "loss": 0.8025, "lr": 3.726541554959786e-05, "epoch": 0.7454572535001489, "percentage": 7.45, "elapsed_time": "0:20:12", "remaining_time": "4:10:58", "throughput": 2381.29, "total_tokens": 2888448} {"current_steps": 5010, "total_steps": 67140, "loss": 0.8559, "lr": 3.730265117664581e-05, "epoch": 0.7462019660411081, "percentage": 7.46, "elapsed_time": "0:20:14", "remaining_time": "4:10:56", "throughput": 2381.31, "total_tokens": 2891104} {"current_steps": 5015, "total_steps": 67140, "loss": 0.7513, "lr": 3.7339886803693774e-05, "epoch": 0.7469466785820673, "percentage": 7.47, "elapsed_time": "0:20:15", "remaining_time": "4:10:53", "throughput": 2381.4, "total_tokens": 2893888} {"current_steps": 5020, "total_steps": 67140, "loss": 0.661, "lr": 3.737712243074174e-05, "epoch": 0.7476913911230265, "percentage": 7.48, "elapsed_time": "0:20:16", "remaining_time": "4:10:50", "throughput": 2381.27, "total_tokens": 2896192} {"current_steps": 5025, "total_steps": 67140, "loss": 0.707, "lr": 3.7414358057789694e-05, "epoch": 0.7484361036639857, "percentage": 7.48, "elapsed_time": "0:20:17", "remaining_time": "4:10:48", "throughput": 2381.38, "total_tokens": 2899008} {"current_steps": 5030, "total_steps": 67140, "loss": 0.7126, "lr": 3.745159368483766e-05, "epoch": 0.7491808162049449, "percentage": 7.49, "elapsed_time": "0:20:18", "remaining_time": "4:10:46", "throughput": 2381.54, "total_tokens": 2901920} {"current_steps": 5035, "total_steps": 67140, "loss": 0.7446, "lr": 3.7488829311885614e-05, "epoch": 0.7499255287459041, "percentage": 7.5, "elapsed_time": "0:20:19", "remaining_time": "4:10:44", "throughput": 2381.87, "total_tokens": 2905184} {"current_steps": 5040, "total_steps": 67140, "loss": 0.6707, "lr": 3.752606493893358e-05, "epoch": 0.7506702412868632, "percentage": 7.51, "elapsed_time": "0:20:20", "remaining_time": "4:10:42", "throughput": 2381.99, "total_tokens": 2908000} {"current_steps": 5045, "total_steps": 67140, "loss": 0.6768, "lr": 3.7563300565981534e-05, "epoch": 0.7514149538278224, "percentage": 7.51, "elapsed_time": "0:20:21", "remaining_time": "4:10:39", "throughput": 2382.05, "total_tokens": 2910720} {"current_steps": 5050, "total_steps": 67140, "loss": 0.793, "lr": 3.760053619302949e-05, "epoch": 0.7521596663687816, "percentage": 7.52, "elapsed_time": "0:20:23", "remaining_time": "4:10:38", "throughput": 2382.25, "total_tokens": 2913728} {"current_steps": 5055, "total_steps": 67140, "loss": 0.7528, "lr": 3.7637771820077446e-05, "epoch": 0.7529043789097408, "percentage": 7.53, "elapsed_time": "0:20:24", "remaining_time": "4:10:35", "throughput": 2382.25, "total_tokens": 2916352} {"current_steps": 5060, "total_steps": 67140, "loss": 0.7118, "lr": 3.767500744712541e-05, "epoch": 0.7536490914507, "percentage": 7.54, "elapsed_time": "0:20:25", "remaining_time": "4:10:33", "throughput": 2382.38, "total_tokens": 2919168} {"current_steps": 5065, "total_steps": 67140, "loss": 0.6968, "lr": 3.771224307417337e-05, "epoch": 0.7543938039916592, "percentage": 7.54, "elapsed_time": "0:20:26", "remaining_time": "4:10:30", "throughput": 2382.32, "total_tokens": 2921696} {"current_steps": 5070, "total_steps": 67140, "loss": 0.7294, "lr": 3.774947870122133e-05, "epoch": 0.7551385165326184, "percentage": 7.55, "elapsed_time": "0:20:27", "remaining_time": "4:10:28", "throughput": 2382.44, "total_tokens": 2924544} {"current_steps": 5075, "total_steps": 67140, "loss": 1.0311, "lr": 3.778671432826929e-05, "epoch": 0.7558832290735776, "percentage": 7.56, "elapsed_time": "0:20:28", "remaining_time": "4:10:26", "throughput": 2382.61, "total_tokens": 2927520} {"current_steps": 5080, "total_steps": 67140, "loss": 0.6987, "lr": 3.782394995531725e-05, "epoch": 0.7566279416145368, "percentage": 7.57, "elapsed_time": "0:20:29", "remaining_time": "4:10:24", "throughput": 2382.84, "total_tokens": 2930560} {"current_steps": 5085, "total_steps": 67140, "loss": 0.7144, "lr": 3.786118558236521e-05, "epoch": 0.7573726541554959, "percentage": 7.57, "elapsed_time": "0:20:30", "remaining_time": "4:10:21", "throughput": 2382.8, "total_tokens": 2933088} {"current_steps": 5090, "total_steps": 67140, "loss": 0.6084, "lr": 3.789842120941317e-05, "epoch": 0.7581173666964551, "percentage": 7.58, "elapsed_time": "0:20:32", "remaining_time": "4:10:19", "throughput": 2382.87, "total_tokens": 2935808} {"current_steps": 5095, "total_steps": 67140, "loss": 0.7404, "lr": 3.7935656836461125e-05, "epoch": 0.7588620792374143, "percentage": 7.59, "elapsed_time": "0:20:33", "remaining_time": "4:10:17", "throughput": 2382.99, "total_tokens": 2938624} {"current_steps": 5100, "total_steps": 67140, "loss": 0.6206, "lr": 3.797289246350909e-05, "epoch": 0.7596067917783735, "percentage": 7.6, "elapsed_time": "0:20:34", "remaining_time": "4:10:14", "throughput": 2383.21, "total_tokens": 2941600} {"current_steps": 5105, "total_steps": 67140, "loss": 0.7126, "lr": 3.8010128090557045e-05, "epoch": 0.7603515043193327, "percentage": 7.6, "elapsed_time": "0:20:35", "remaining_time": "4:10:12", "throughput": 2383.41, "total_tokens": 2944576} {"current_steps": 5110, "total_steps": 67140, "loss": 0.664, "lr": 3.804736371760501e-05, "epoch": 0.7610962168602919, "percentage": 7.61, "elapsed_time": "0:20:36", "remaining_time": "4:10:10", "throughput": 2383.52, "total_tokens": 2947424} {"current_steps": 5115, "total_steps": 67140, "loss": 0.7014, "lr": 3.8084599344652965e-05, "epoch": 0.7618409294012511, "percentage": 7.62, "elapsed_time": "0:20:37", "remaining_time": "4:10:08", "throughput": 2383.69, "total_tokens": 2950336} {"current_steps": 5120, "total_steps": 67140, "loss": 0.7266, "lr": 3.812183497170093e-05, "epoch": 0.7625856419422103, "percentage": 7.63, "elapsed_time": "0:20:38", "remaining_time": "4:10:06", "throughput": 2383.72, "total_tokens": 2952992} {"current_steps": 5125, "total_steps": 67140, "loss": 0.7142, "lr": 3.8159070598748884e-05, "epoch": 0.7633303544831695, "percentage": 7.63, "elapsed_time": "0:20:39", "remaining_time": "4:10:03", "throughput": 2383.8, "total_tokens": 2955776} {"current_steps": 5130, "total_steps": 67140, "loss": 0.6775, "lr": 3.819630622579685e-05, "epoch": 0.7640750670241286, "percentage": 7.64, "elapsed_time": "0:20:41", "remaining_time": "4:10:01", "throughput": 2383.89, "total_tokens": 2958592} {"current_steps": 5135, "total_steps": 67140, "loss": 0.5605, "lr": 3.8233541852844804e-05, "epoch": 0.7648197795650878, "percentage": 7.65, "elapsed_time": "0:20:42", "remaining_time": "4:09:59", "throughput": 2384.03, "total_tokens": 2961408} {"current_steps": 5140, "total_steps": 67140, "loss": 0.7916, "lr": 3.827077747989276e-05, "epoch": 0.765564492106047, "percentage": 7.66, "elapsed_time": "0:20:43", "remaining_time": "4:09:56", "throughput": 2384.06, "total_tokens": 2964064} {"current_steps": 5145, "total_steps": 67140, "loss": 0.6055, "lr": 3.8308013106940724e-05, "epoch": 0.7663092046470062, "percentage": 7.66, "elapsed_time": "0:20:44", "remaining_time": "4:09:53", "throughput": 2384.01, "total_tokens": 2966560} {"current_steps": 5150, "total_steps": 67140, "loss": 0.8349, "lr": 3.834524873398868e-05, "epoch": 0.7670539171879655, "percentage": 7.67, "elapsed_time": "0:20:45", "remaining_time": "4:09:51", "throughput": 2384.09, "total_tokens": 2969344} {"current_steps": 5155, "total_steps": 67140, "loss": 0.7006, "lr": 3.8382484361036644e-05, "epoch": 0.7677986297289247, "percentage": 7.68, "elapsed_time": "0:20:46", "remaining_time": "4:09:49", "throughput": 2384.24, "total_tokens": 2972224} {"current_steps": 5160, "total_steps": 67140, "loss": 0.659, "lr": 3.84197199880846e-05, "epoch": 0.7685433422698839, "percentage": 7.69, "elapsed_time": "0:20:47", "remaining_time": "4:09:47", "throughput": 2384.46, "total_tokens": 2975296} {"current_steps": 5165, "total_steps": 67140, "loss": 0.807, "lr": 3.845695561513256e-05, "epoch": 0.7692880548108431, "percentage": 7.69, "elapsed_time": "0:20:48", "remaining_time": "4:09:45", "throughput": 2384.59, "total_tokens": 2978144} {"current_steps": 5170, "total_steps": 67140, "loss": 0.6607, "lr": 3.849419124218052e-05, "epoch": 0.7700327673518021, "percentage": 7.7, "elapsed_time": "0:20:50", "remaining_time": "4:09:43", "throughput": 2384.67, "total_tokens": 2980864} {"current_steps": 5175, "total_steps": 67140, "loss": 0.7456, "lr": 3.853142686922848e-05, "epoch": 0.7707774798927614, "percentage": 7.71, "elapsed_time": "0:20:51", "remaining_time": "4:09:40", "throughput": 2384.69, "total_tokens": 2983488} {"current_steps": 5180, "total_steps": 67140, "loss": 0.7176, "lr": 3.856866249627644e-05, "epoch": 0.7715221924337206, "percentage": 7.72, "elapsed_time": "0:20:52", "remaining_time": "4:09:38", "throughput": 2384.78, "total_tokens": 2986304} {"current_steps": 5185, "total_steps": 67140, "loss": 0.7121, "lr": 3.8605898123324396e-05, "epoch": 0.7722669049746798, "percentage": 7.72, "elapsed_time": "0:20:53", "remaining_time": "4:09:36", "throughput": 2384.9, "total_tokens": 2989120} {"current_steps": 5190, "total_steps": 67140, "loss": 0.7255, "lr": 3.864313375037236e-05, "epoch": 0.773011617515639, "percentage": 7.73, "elapsed_time": "0:20:54", "remaining_time": "4:09:33", "throughput": 2384.98, "total_tokens": 2991904} {"current_steps": 5195, "total_steps": 67140, "loss": 0.7763, "lr": 3.8680369377420316e-05, "epoch": 0.7737563300565982, "percentage": 7.74, "elapsed_time": "0:20:55", "remaining_time": "4:09:31", "throughput": 2385.05, "total_tokens": 2994624} {"current_steps": 5200, "total_steps": 67140, "loss": 0.7826, "lr": 3.871760500446828e-05, "epoch": 0.7745010425975574, "percentage": 7.75, "elapsed_time": "0:20:56", "remaining_time": "4:09:29", "throughput": 2385.2, "total_tokens": 2997568} {"current_steps": 5205, "total_steps": 67140, "loss": 0.9045, "lr": 3.8754840631516235e-05, "epoch": 0.7752457551385166, "percentage": 7.75, "elapsed_time": "0:20:57", "remaining_time": "4:09:27", "throughput": 2385.35, "total_tokens": 3000448} {"current_steps": 5210, "total_steps": 67140, "loss": 0.8687, "lr": 3.87920762585642e-05, "epoch": 0.7759904676794758, "percentage": 7.76, "elapsed_time": "0:20:59", "remaining_time": "4:09:25", "throughput": 2385.49, "total_tokens": 3003392} {"current_steps": 5215, "total_steps": 67140, "loss": 0.7714, "lr": 3.8829311885612155e-05, "epoch": 0.7767351802204349, "percentage": 7.77, "elapsed_time": "0:21:00", "remaining_time": "4:09:23", "throughput": 2385.53, "total_tokens": 3006080} {"current_steps": 5220, "total_steps": 67140, "loss": 0.7147, "lr": 3.886654751266012e-05, "epoch": 0.7774798927613941, "percentage": 7.77, "elapsed_time": "0:21:01", "remaining_time": "4:09:21", "throughput": 2385.69, "total_tokens": 3008992} {"current_steps": 5225, "total_steps": 67140, "loss": 0.6045, "lr": 3.8903783139708075e-05, "epoch": 0.7782246053023533, "percentage": 7.78, "elapsed_time": "0:21:02", "remaining_time": "4:09:18", "throughput": 2385.67, "total_tokens": 3011552} {"current_steps": 5230, "total_steps": 67140, "loss": 0.8235, "lr": 3.894101876675603e-05, "epoch": 0.7789693178433125, "percentage": 7.79, "elapsed_time": "0:21:03", "remaining_time": "4:09:16", "throughput": 2385.79, "total_tokens": 3014400} {"current_steps": 5235, "total_steps": 67140, "loss": 0.6894, "lr": 3.8978254393803994e-05, "epoch": 0.7797140303842717, "percentage": 7.8, "elapsed_time": "0:21:04", "remaining_time": "4:09:14", "throughput": 2385.93, "total_tokens": 3017280} {"current_steps": 5240, "total_steps": 67140, "loss": 0.7822, "lr": 3.901549002085195e-05, "epoch": 0.7804587429252309, "percentage": 7.8, "elapsed_time": "0:21:05", "remaining_time": "4:09:12", "throughput": 2386.02, "total_tokens": 3020064} {"current_steps": 5245, "total_steps": 67140, "loss": 0.7685, "lr": 3.9052725647899914e-05, "epoch": 0.7812034554661901, "percentage": 7.81, "elapsed_time": "0:21:06", "remaining_time": "4:09:10", "throughput": 2386.21, "total_tokens": 3023072} {"current_steps": 5250, "total_steps": 67140, "loss": 0.686, "lr": 3.908996127494787e-05, "epoch": 0.7819481680071493, "percentage": 7.82, "elapsed_time": "0:21:08", "remaining_time": "4:09:08", "throughput": 2386.3, "total_tokens": 3025856} {"current_steps": 5255, "total_steps": 67140, "loss": 0.7592, "lr": 3.9127196901995834e-05, "epoch": 0.7826928805481085, "percentage": 7.83, "elapsed_time": "0:21:09", "remaining_time": "4:09:06", "throughput": 2386.64, "total_tokens": 3029152} {"current_steps": 5260, "total_steps": 67140, "loss": 0.7286, "lr": 3.916443252904379e-05, "epoch": 0.7834375930890676, "percentage": 7.83, "elapsed_time": "0:21:10", "remaining_time": "4:09:04", "throughput": 2386.7, "total_tokens": 3031904} {"current_steps": 5265, "total_steps": 67140, "loss": 0.6242, "lr": 3.9201668156091754e-05, "epoch": 0.7841823056300268, "percentage": 7.84, "elapsed_time": "0:21:11", "remaining_time": "4:09:02", "throughput": 2386.87, "total_tokens": 3034848} {"current_steps": 5270, "total_steps": 67140, "loss": 0.7729, "lr": 3.923890378313971e-05, "epoch": 0.784927018170986, "percentage": 7.85, "elapsed_time": "0:21:12", "remaining_time": "4:09:00", "throughput": 2387.08, "total_tokens": 3037888} {"current_steps": 5275, "total_steps": 67140, "loss": 0.6597, "lr": 3.9276139410187666e-05, "epoch": 0.7856717307119452, "percentage": 7.86, "elapsed_time": "0:21:13", "remaining_time": "4:08:58", "throughput": 2387.29, "total_tokens": 3040896} {"current_steps": 5280, "total_steps": 67140, "loss": 0.8254, "lr": 3.931337503723563e-05, "epoch": 0.7864164432529044, "percentage": 7.86, "elapsed_time": "0:21:14", "remaining_time": "4:08:56", "throughput": 2387.46, "total_tokens": 3043840} {"current_steps": 5285, "total_steps": 67140, "loss": 0.7491, "lr": 3.9350610664283586e-05, "epoch": 0.7871611557938636, "percentage": 7.87, "elapsed_time": "0:21:16", "remaining_time": "4:08:54", "throughput": 2387.55, "total_tokens": 3046624} {"current_steps": 5290, "total_steps": 67140, "loss": 0.6797, "lr": 3.938784629133155e-05, "epoch": 0.7879058683348228, "percentage": 7.88, "elapsed_time": "0:21:17", "remaining_time": "4:08:52", "throughput": 2387.68, "total_tokens": 3049472} {"current_steps": 5295, "total_steps": 67140, "loss": 0.7185, "lr": 3.9425081918379506e-05, "epoch": 0.788650580875782, "percentage": 7.89, "elapsed_time": "0:21:18", "remaining_time": "4:08:50", "throughput": 2387.85, "total_tokens": 3052416} {"current_steps": 5300, "total_steps": 67140, "loss": 0.6726, "lr": 3.946231754542747e-05, "epoch": 0.7893952934167411, "percentage": 7.89, "elapsed_time": "0:21:19", "remaining_time": "4:08:48", "throughput": 2387.93, "total_tokens": 3055232} {"current_steps": 5305, "total_steps": 67140, "loss": 0.7165, "lr": 3.9499553172475426e-05, "epoch": 0.7901400059577003, "percentage": 7.9, "elapsed_time": "0:21:20", "remaining_time": "4:08:46", "throughput": 2388.16, "total_tokens": 3058272} {"current_steps": 5310, "total_steps": 67140, "loss": 0.6962, "lr": 3.953678879952338e-05, "epoch": 0.7908847184986595, "percentage": 7.91, "elapsed_time": "0:21:21", "remaining_time": "4:08:44", "throughput": 2388.35, "total_tokens": 3061280} {"current_steps": 5315, "total_steps": 67140, "loss": 0.7928, "lr": 3.9574024426571345e-05, "epoch": 0.7916294310396187, "percentage": 7.92, "elapsed_time": "0:21:22", "remaining_time": "4:08:43", "throughput": 2388.56, "total_tokens": 3064320} {"current_steps": 5320, "total_steps": 67140, "loss": 0.727, "lr": 3.96112600536193e-05, "epoch": 0.7923741435805779, "percentage": 7.92, "elapsed_time": "0:21:24", "remaining_time": "4:08:40", "throughput": 2388.56, "total_tokens": 3066912} {"current_steps": 5325, "total_steps": 67140, "loss": 0.7111, "lr": 3.9648495680667265e-05, "epoch": 0.7931188561215371, "percentage": 7.93, "elapsed_time": "0:21:25", "remaining_time": "4:08:38", "throughput": 2388.7, "total_tokens": 3069856} {"current_steps": 5330, "total_steps": 67140, "loss": 0.6898, "lr": 3.968573130771522e-05, "epoch": 0.7938635686624963, "percentage": 7.94, "elapsed_time": "0:21:26", "remaining_time": "4:08:36", "throughput": 2388.83, "total_tokens": 3072672} {"current_steps": 5335, "total_steps": 67140, "loss": 0.699, "lr": 3.9722966934763185e-05, "epoch": 0.7946082812034555, "percentage": 7.95, "elapsed_time": "0:21:27", "remaining_time": "4:08:34", "throughput": 2389.08, "total_tokens": 3075776} {"current_steps": 5340, "total_steps": 67140, "loss": 0.6921, "lr": 3.976020256181114e-05, "epoch": 0.7953529937444147, "percentage": 7.95, "elapsed_time": "0:21:28", "remaining_time": "4:08:32", "throughput": 2389.2, "total_tokens": 3078624} {"current_steps": 5345, "total_steps": 67140, "loss": 0.6888, "lr": 3.9797438188859104e-05, "epoch": 0.7960977062853738, "percentage": 7.96, "elapsed_time": "0:21:29", "remaining_time": "4:08:30", "throughput": 2389.44, "total_tokens": 3081728} {"current_steps": 5350, "total_steps": 67140, "loss": 0.5783, "lr": 3.983467381590707e-05, "epoch": 0.796842418826333, "percentage": 7.97, "elapsed_time": "0:21:30", "remaining_time": "4:08:28", "throughput": 2389.54, "total_tokens": 3084512} {"current_steps": 5355, "total_steps": 67140, "loss": 0.8793, "lr": 3.987190944295502e-05, "epoch": 0.7975871313672922, "percentage": 7.98, "elapsed_time": "0:21:31", "remaining_time": "4:08:26", "throughput": 2389.71, "total_tokens": 3087488} {"current_steps": 5360, "total_steps": 67140, "loss": 0.7538, "lr": 3.990914507000298e-05, "epoch": 0.7983318439082514, "percentage": 7.98, "elapsed_time": "0:21:33", "remaining_time": "4:08:23", "throughput": 2389.69, "total_tokens": 3089984} {"current_steps": 5365, "total_steps": 67140, "loss": 0.6577, "lr": 3.994638069705094e-05, "epoch": 0.7990765564492106, "percentage": 7.99, "elapsed_time": "0:21:34", "remaining_time": "4:08:21", "throughput": 2389.83, "total_tokens": 3092896} {"current_steps": 5370, "total_steps": 67140, "loss": 0.7877, "lr": 3.99836163240989e-05, "epoch": 0.7998212689901698, "percentage": 8.0, "elapsed_time": "0:21:35", "remaining_time": "4:08:20", "throughput": 2390.0, "total_tokens": 3095872} {"current_steps": 5375, "total_steps": 67140, "loss": 0.7956, "lr": 4.002085195114686e-05, "epoch": 0.800565981531129, "percentage": 8.01, "elapsed_time": "0:21:36", "remaining_time": "4:08:17", "throughput": 2390.07, "total_tokens": 3098624} {"current_steps": 5380, "total_steps": 67140, "loss": 0.7553, "lr": 4.005808757819482e-05, "epoch": 0.8013106940720882, "percentage": 8.01, "elapsed_time": "0:21:37", "remaining_time": "4:08:16", "throughput": 2390.31, "total_tokens": 3101760} {"current_steps": 5385, "total_steps": 67140, "loss": 0.6778, "lr": 4.0095323205242776e-05, "epoch": 0.8020554066130474, "percentage": 8.02, "elapsed_time": "0:21:38", "remaining_time": "4:08:14", "throughput": 2390.53, "total_tokens": 3104800} {"current_steps": 5390, "total_steps": 67140, "loss": 0.5562, "lr": 4.013255883229074e-05, "epoch": 0.8028001191540065, "percentage": 8.03, "elapsed_time": "0:21:39", "remaining_time": "4:08:12", "throughput": 2390.65, "total_tokens": 3107712} {"current_steps": 5395, "total_steps": 67140, "loss": 0.8035, "lr": 4.01697944593387e-05, "epoch": 0.8035448316949657, "percentage": 8.04, "elapsed_time": "0:21:41", "remaining_time": "4:08:10", "throughput": 2390.83, "total_tokens": 3110720} {"current_steps": 5400, "total_steps": 67140, "loss": 0.6448, "lr": 4.020703008638665e-05, "epoch": 0.8042895442359249, "percentage": 8.04, "elapsed_time": "0:21:42", "remaining_time": "4:08:09", "throughput": 2391.06, "total_tokens": 3113792} {"current_steps": 5405, "total_steps": 67140, "loss": 0.6972, "lr": 4.0244265713434616e-05, "epoch": 0.8050342567768841, "percentage": 8.05, "elapsed_time": "0:21:43", "remaining_time": "4:08:07", "throughput": 2391.2, "total_tokens": 3116736} {"current_steps": 5410, "total_steps": 67140, "loss": 0.7024, "lr": 4.028150134048257e-05, "epoch": 0.8057789693178433, "percentage": 8.06, "elapsed_time": "0:21:44", "remaining_time": "4:08:05", "throughput": 2391.31, "total_tokens": 3119584} {"current_steps": 5415, "total_steps": 67140, "loss": 0.6762, "lr": 4.0318736967530536e-05, "epoch": 0.8065236818588025, "percentage": 8.07, "elapsed_time": "0:21:45", "remaining_time": "4:08:03", "throughput": 2391.43, "total_tokens": 3122432} {"current_steps": 5420, "total_steps": 67140, "loss": 0.8177, "lr": 4.035597259457849e-05, "epoch": 0.8072683943997617, "percentage": 8.07, "elapsed_time": "0:21:46", "remaining_time": "4:08:00", "throughput": 2391.51, "total_tokens": 3125184} {"current_steps": 5425, "total_steps": 67140, "loss": 0.698, "lr": 4.0393208221626455e-05, "epoch": 0.8080131069407209, "percentage": 8.08, "elapsed_time": "0:21:47", "remaining_time": "4:07:58", "throughput": 2391.59, "total_tokens": 3128000} {"current_steps": 5430, "total_steps": 67140, "loss": 0.8117, "lr": 4.043044384867442e-05, "epoch": 0.80875781948168, "percentage": 8.09, "elapsed_time": "0:21:49", "remaining_time": "4:07:56", "throughput": 2391.76, "total_tokens": 3130944} {"current_steps": 5435, "total_steps": 67140, "loss": 0.6658, "lr": 4.0467679475722375e-05, "epoch": 0.8095025320226392, "percentage": 8.1, "elapsed_time": "0:21:50", "remaining_time": "4:07:55", "throughput": 2391.97, "total_tokens": 3133984} {"current_steps": 5440, "total_steps": 67140, "loss": 0.6867, "lr": 4.050491510277033e-05, "epoch": 0.8102472445635984, "percentage": 8.1, "elapsed_time": "0:21:51", "remaining_time": "4:07:53", "throughput": 2392.21, "total_tokens": 3137120} {"current_steps": 5445, "total_steps": 67140, "loss": 0.7955, "lr": 4.054215072981829e-05, "epoch": 0.8109919571045576, "percentage": 8.11, "elapsed_time": "0:21:52", "remaining_time": "4:07:51", "throughput": 2392.25, "total_tokens": 3139840} {"current_steps": 5450, "total_steps": 67140, "loss": 0.6886, "lr": 4.057938635686625e-05, "epoch": 0.8117366696455168, "percentage": 8.12, "elapsed_time": "0:21:53", "remaining_time": "4:07:49", "throughput": 2392.3, "total_tokens": 3142592} {"current_steps": 5455, "total_steps": 67140, "loss": 0.6599, "lr": 4.061662198391421e-05, "epoch": 0.812481382186476, "percentage": 8.12, "elapsed_time": "0:21:54", "remaining_time": "4:07:46", "throughput": 2392.33, "total_tokens": 3145248} {"current_steps": 5460, "total_steps": 67140, "loss": 0.6783, "lr": 4.065385761096217e-05, "epoch": 0.8132260947274352, "percentage": 8.13, "elapsed_time": "0:21:55", "remaining_time": "4:07:44", "throughput": 2392.45, "total_tokens": 3148096} {"current_steps": 5465, "total_steps": 67140, "loss": 0.7515, "lr": 4.069109323801013e-05, "epoch": 0.8139708072683944, "percentage": 8.14, "elapsed_time": "0:21:56", "remaining_time": "4:07:42", "throughput": 2392.59, "total_tokens": 3151008} {"current_steps": 5470, "total_steps": 67140, "loss": 0.6232, "lr": 4.072832886505809e-05, "epoch": 0.8147155198093536, "percentage": 8.15, "elapsed_time": "0:21:58", "remaining_time": "4:07:40", "throughput": 2392.75, "total_tokens": 3153920} {"current_steps": 5475, "total_steps": 67140, "loss": 0.9276, "lr": 4.0765564492106054e-05, "epoch": 0.8154602323503127, "percentage": 8.15, "elapsed_time": "0:21:59", "remaining_time": "4:07:38", "throughput": 2392.72, "total_tokens": 3156448} {"current_steps": 5480, "total_steps": 67140, "loss": 0.8717, "lr": 4.080280011915401e-05, "epoch": 0.8162049448912719, "percentage": 8.16, "elapsed_time": "0:22:00", "remaining_time": "4:07:36", "throughput": 2392.97, "total_tokens": 3159552} {"current_steps": 5485, "total_steps": 67140, "loss": 0.6846, "lr": 4.084003574620197e-05, "epoch": 0.8169496574322311, "percentage": 8.17, "elapsed_time": "0:22:01", "remaining_time": "4:07:33", "throughput": 2393.0, "total_tokens": 3162240} {"current_steps": 5490, "total_steps": 67140, "loss": 0.6737, "lr": 4.087727137324992e-05, "epoch": 0.8176943699731903, "percentage": 8.18, "elapsed_time": "0:22:02", "remaining_time": "4:07:31", "throughput": 2392.9, "total_tokens": 3164608} {"current_steps": 5495, "total_steps": 67140, "loss": 0.6261, "lr": 4.0914507000297886e-05, "epoch": 0.8184390825141495, "percentage": 8.18, "elapsed_time": "0:22:03", "remaining_time": "4:07:29", "throughput": 2393.04, "total_tokens": 3167520} {"current_steps": 5500, "total_steps": 67140, "loss": 0.6099, "lr": 4.095174262734584e-05, "epoch": 0.8191837950551087, "percentage": 8.19, "elapsed_time": "0:22:04", "remaining_time": "4:07:27", "throughput": 2393.18, "total_tokens": 3170400} {"current_steps": 5505, "total_steps": 67140, "loss": 0.7205, "lr": 4.0988978254393806e-05, "epoch": 0.819928507596068, "percentage": 8.2, "elapsed_time": "0:22:05", "remaining_time": "4:07:25", "throughput": 2393.34, "total_tokens": 3173376} {"current_steps": 5510, "total_steps": 67140, "loss": 0.6595, "lr": 4.102621388144177e-05, "epoch": 0.8206732201370271, "percentage": 8.21, "elapsed_time": "0:22:07", "remaining_time": "4:07:23", "throughput": 2393.47, "total_tokens": 3176256} {"current_steps": 5515, "total_steps": 67140, "loss": 0.7819, "lr": 4.1063449508489726e-05, "epoch": 0.8214179326779864, "percentage": 8.21, "elapsed_time": "0:22:08", "remaining_time": "4:07:21", "throughput": 2393.59, "total_tokens": 3179136} {"current_steps": 5520, "total_steps": 67140, "loss": 0.6203, "lr": 4.110068513553769e-05, "epoch": 0.8221626452189454, "percentage": 8.22, "elapsed_time": "0:22:09", "remaining_time": "4:07:19", "throughput": 2393.66, "total_tokens": 3181920} {"current_steps": 5525, "total_steps": 67140, "loss": 0.719, "lr": 4.1137920762585646e-05, "epoch": 0.8229073577599046, "percentage": 8.23, "elapsed_time": "0:22:10", "remaining_time": "4:07:17", "throughput": 2393.76, "total_tokens": 3184736} {"current_steps": 5530, "total_steps": 67140, "loss": 0.6831, "lr": 4.11751563896336e-05, "epoch": 0.8236520703008638, "percentage": 8.24, "elapsed_time": "0:22:11", "remaining_time": "4:07:14", "throughput": 2393.81, "total_tokens": 3187456} {"current_steps": 5535, "total_steps": 67140, "loss": 0.6919, "lr": 4.121239201668156e-05, "epoch": 0.824396782841823, "percentage": 8.24, "elapsed_time": "0:22:12", "remaining_time": "4:07:12", "throughput": 2393.9, "total_tokens": 3190240} {"current_steps": 5540, "total_steps": 67140, "loss": 0.7122, "lr": 4.124962764372952e-05, "epoch": 0.8251414953827823, "percentage": 8.25, "elapsed_time": "0:22:13", "remaining_time": "4:07:10", "throughput": 2393.9, "total_tokens": 3192864} {"current_steps": 5545, "total_steps": 67140, "loss": 0.6447, "lr": 4.1286863270777485e-05, "epoch": 0.8258862079237415, "percentage": 8.26, "elapsed_time": "0:22:14", "remaining_time": "4:07:07", "throughput": 2393.85, "total_tokens": 3195392} {"current_steps": 5550, "total_steps": 67140, "loss": 0.6736, "lr": 4.132409889782544e-05, "epoch": 0.8266309204647007, "percentage": 8.27, "elapsed_time": "0:22:15", "remaining_time": "4:07:05", "throughput": 2393.93, "total_tokens": 3198176} {"current_steps": 5555, "total_steps": 67140, "loss": 0.7417, "lr": 4.1361334524873405e-05, "epoch": 0.8273756330056599, "percentage": 8.27, "elapsed_time": "0:22:17", "remaining_time": "4:07:03", "throughput": 2394.08, "total_tokens": 3201152} {"current_steps": 5560, "total_steps": 67140, "loss": 0.5735, "lr": 4.139857015192136e-05, "epoch": 0.828120345546619, "percentage": 8.28, "elapsed_time": "0:22:18", "remaining_time": "4:07:02", "throughput": 2394.29, "total_tokens": 3204320} {"current_steps": 5565, "total_steps": 67140, "loss": 0.626, "lr": 4.1435805778969324e-05, "epoch": 0.8288650580875782, "percentage": 8.29, "elapsed_time": "0:22:19", "remaining_time": "4:07:00", "throughput": 2394.31, "total_tokens": 3207008} {"current_steps": 5570, "total_steps": 67140, "loss": 0.7157, "lr": 4.1473041406017274e-05, "epoch": 0.8296097706285374, "percentage": 8.3, "elapsed_time": "0:22:20", "remaining_time": "4:06:58", "throughput": 2394.39, "total_tokens": 3209760} {"current_steps": 5575, "total_steps": 67140, "loss": 0.9369, "lr": 4.151027703306524e-05, "epoch": 0.8303544831694966, "percentage": 8.3, "elapsed_time": "0:22:21", "remaining_time": "4:06:56", "throughput": 2394.61, "total_tokens": 3212864} {"current_steps": 5580, "total_steps": 67140, "loss": 0.7527, "lr": 4.1547512660113194e-05, "epoch": 0.8310991957104558, "percentage": 8.31, "elapsed_time": "0:22:22", "remaining_time": "4:06:54", "throughput": 2394.72, "total_tokens": 3215744} {"current_steps": 5585, "total_steps": 67140, "loss": 0.7979, "lr": 4.158474828716116e-05, "epoch": 0.831843908251415, "percentage": 8.32, "elapsed_time": "0:22:23", "remaining_time": "4:06:52", "throughput": 2394.74, "total_tokens": 3218400} {"current_steps": 5590, "total_steps": 67140, "loss": 0.5457, "lr": 4.162198391420912e-05, "epoch": 0.8325886207923742, "percentage": 8.33, "elapsed_time": "0:22:25", "remaining_time": "4:06:49", "throughput": 2394.7, "total_tokens": 3220960} {"current_steps": 5595, "total_steps": 67140, "loss": 0.7779, "lr": 4.165921954125708e-05, "epoch": 0.8333333333333334, "percentage": 8.33, "elapsed_time": "0:22:26", "remaining_time": "4:06:47", "throughput": 2394.85, "total_tokens": 3223872} {"current_steps": 5600, "total_steps": 67140, "loss": 0.6108, "lr": 4.169645516830504e-05, "epoch": 0.8340780458742926, "percentage": 8.34, "elapsed_time": "0:22:27", "remaining_time": "4:06:46", "throughput": 2395.02, "total_tokens": 3226880} {"current_steps": 5605, "total_steps": 67140, "loss": 0.86, "lr": 4.1733690795352996e-05, "epoch": 0.8348227584152517, "percentage": 8.35, "elapsed_time": "0:22:28", "remaining_time": "4:06:44", "throughput": 2395.23, "total_tokens": 3229920} {"current_steps": 5610, "total_steps": 67140, "loss": 0.7648, "lr": 4.177092642240096e-05, "epoch": 0.8355674709562109, "percentage": 8.36, "elapsed_time": "0:22:29", "remaining_time": "4:06:42", "throughput": 2395.35, "total_tokens": 3232768} {"current_steps": 5615, "total_steps": 67140, "loss": 0.7214, "lr": 4.180816204944891e-05, "epoch": 0.8363121834971701, "percentage": 8.36, "elapsed_time": "0:22:30", "remaining_time": "4:06:40", "throughput": 2395.57, "total_tokens": 3235808} {"current_steps": 5620, "total_steps": 67140, "loss": 0.6522, "lr": 4.184539767649687e-05, "epoch": 0.8370568960381293, "percentage": 8.37, "elapsed_time": "0:22:31", "remaining_time": "4:06:38", "throughput": 2395.55, "total_tokens": 3238400} {"current_steps": 5625, "total_steps": 67140, "loss": 0.5898, "lr": 4.1882633303544836e-05, "epoch": 0.8378016085790885, "percentage": 8.38, "elapsed_time": "0:22:32", "remaining_time": "4:06:35", "throughput": 2395.65, "total_tokens": 3241216} {"current_steps": 5630, "total_steps": 67140, "loss": 0.7482, "lr": 4.191986893059279e-05, "epoch": 0.8385463211200477, "percentage": 8.39, "elapsed_time": "0:22:34", "remaining_time": "4:06:34", "throughput": 2395.88, "total_tokens": 3244320} {"current_steps": 5635, "total_steps": 67140, "loss": 0.656, "lr": 4.1957104557640756e-05, "epoch": 0.8392910336610069, "percentage": 8.39, "elapsed_time": "0:22:35", "remaining_time": "4:06:32", "throughput": 2395.99, "total_tokens": 3247200} {"current_steps": 5640, "total_steps": 67140, "loss": 0.689, "lr": 4.199434018468871e-05, "epoch": 0.8400357462019661, "percentage": 8.4, "elapsed_time": "0:22:36", "remaining_time": "4:06:30", "throughput": 2396.14, "total_tokens": 3250144} {"current_steps": 5645, "total_steps": 67140, "loss": 0.6606, "lr": 4.2031575811736675e-05, "epoch": 0.8407804587429253, "percentage": 8.41, "elapsed_time": "0:22:37", "remaining_time": "4:06:28", "throughput": 2396.23, "total_tokens": 3252928} {"current_steps": 5650, "total_steps": 67140, "loss": 0.6333, "lr": 4.206881143878463e-05, "epoch": 0.8415251712838844, "percentage": 8.42, "elapsed_time": "0:22:38", "remaining_time": "4:06:27", "throughput": 2396.52, "total_tokens": 3256160} {"current_steps": 5655, "total_steps": 67140, "loss": 0.823, "lr": 4.2106047065832595e-05, "epoch": 0.8422698838248436, "percentage": 8.42, "elapsed_time": "0:22:39", "remaining_time": "4:06:25", "throughput": 2396.63, "total_tokens": 3259008} {"current_steps": 5660, "total_steps": 67140, "loss": 0.8863, "lr": 4.2143282692880545e-05, "epoch": 0.8430145963658028, "percentage": 8.43, "elapsed_time": "0:22:40", "remaining_time": "4:06:22", "throughput": 2396.72, "total_tokens": 3261824} {"current_steps": 5665, "total_steps": 67140, "loss": 0.6926, "lr": 4.218051831992851e-05, "epoch": 0.843759308906762, "percentage": 8.44, "elapsed_time": "0:22:42", "remaining_time": "4:06:21", "throughput": 2396.98, "total_tokens": 3264992} {"current_steps": 5670, "total_steps": 67140, "loss": 0.7855, "lr": 4.221775394697647e-05, "epoch": 0.8445040214477212, "percentage": 8.45, "elapsed_time": "0:22:43", "remaining_time": "4:06:19", "throughput": 2397.17, "total_tokens": 3268032} {"current_steps": 5675, "total_steps": 67140, "loss": 0.627, "lr": 4.225498957402443e-05, "epoch": 0.8452487339886804, "percentage": 8.45, "elapsed_time": "0:22:44", "remaining_time": "4:06:18", "throughput": 2397.32, "total_tokens": 3271008} {"current_steps": 5680, "total_steps": 67140, "loss": 0.7459, "lr": 4.229222520107239e-05, "epoch": 0.8459934465296396, "percentage": 8.46, "elapsed_time": "0:22:45", "remaining_time": "4:06:16", "throughput": 2397.52, "total_tokens": 3274080} {"current_steps": 5685, "total_steps": 67140, "loss": 0.7522, "lr": 4.232946082812035e-05, "epoch": 0.8467381590705988, "percentage": 8.47, "elapsed_time": "0:22:46", "remaining_time": "4:06:14", "throughput": 2397.56, "total_tokens": 3276768} {"current_steps": 5690, "total_steps": 67140, "loss": 0.7951, "lr": 4.236669645516831e-05, "epoch": 0.8474828716115579, "percentage": 8.47, "elapsed_time": "0:22:47", "remaining_time": "4:06:11", "throughput": 2397.65, "total_tokens": 3279552} {"current_steps": 5695, "total_steps": 67140, "loss": 3.6469, "lr": 4.240393208221627e-05, "epoch": 0.8482275841525171, "percentage": 8.48, "elapsed_time": "0:22:48", "remaining_time": "4:06:09", "throughput": 2397.63, "total_tokens": 3282112} {"current_steps": 5700, "total_steps": 67140, "loss": 0.6203, "lr": 4.2441167709264223e-05, "epoch": 0.8489722966934763, "percentage": 8.49, "elapsed_time": "0:22:50", "remaining_time": "4:06:07", "throughput": 2397.67, "total_tokens": 3284832} {"current_steps": 5705, "total_steps": 67140, "loss": 0.8438, "lr": 4.247840333631219e-05, "epoch": 0.8497170092344355, "percentage": 8.5, "elapsed_time": "0:22:51", "remaining_time": "4:06:05", "throughput": 2397.78, "total_tokens": 3287680} {"current_steps": 5710, "total_steps": 67140, "loss": 0.7666, "lr": 4.251563896336014e-05, "epoch": 0.8504617217753947, "percentage": 8.5, "elapsed_time": "0:22:52", "remaining_time": "4:06:03", "throughput": 2398.01, "total_tokens": 3290752} {"current_steps": 5715, "total_steps": 67140, "loss": 0.6858, "lr": 4.2552874590408106e-05, "epoch": 0.8512064343163539, "percentage": 8.51, "elapsed_time": "0:22:53", "remaining_time": "4:06:01", "throughput": 2398.03, "total_tokens": 3293440} {"current_steps": 5720, "total_steps": 67140, "loss": 0.7002, "lr": 4.259011021745606e-05, "epoch": 0.8519511468573131, "percentage": 8.52, "elapsed_time": "0:22:54", "remaining_time": "4:05:59", "throughput": 2398.16, "total_tokens": 3296320} {"current_steps": 5725, "total_steps": 67140, "loss": 0.7687, "lr": 4.2627345844504026e-05, "epoch": 0.8526958593982723, "percentage": 8.53, "elapsed_time": "0:22:55", "remaining_time": "4:05:57", "throughput": 2398.34, "total_tokens": 3299296} {"current_steps": 5730, "total_steps": 67140, "loss": 0.6234, "lr": 4.266458147155198e-05, "epoch": 0.8534405719392315, "percentage": 8.53, "elapsed_time": "0:22:56", "remaining_time": "4:05:55", "throughput": 2398.47, "total_tokens": 3302176} {"current_steps": 5735, "total_steps": 67140, "loss": 0.6438, "lr": 4.2701817098599946e-05, "epoch": 0.8541852844801906, "percentage": 8.54, "elapsed_time": "0:22:57", "remaining_time": "4:05:53", "throughput": 2398.55, "total_tokens": 3304992} {"current_steps": 5740, "total_steps": 67140, "loss": 0.7043, "lr": 4.27390527256479e-05, "epoch": 0.8549299970211498, "percentage": 8.55, "elapsed_time": "0:22:59", "remaining_time": "4:05:51", "throughput": 2398.71, "total_tokens": 3307968} {"current_steps": 5745, "total_steps": 67140, "loss": 0.6086, "lr": 4.277628835269586e-05, "epoch": 0.855674709562109, "percentage": 8.56, "elapsed_time": "0:23:00", "remaining_time": "4:05:49", "throughput": 2398.87, "total_tokens": 3310944} {"current_steps": 5750, "total_steps": 67140, "loss": 0.6075, "lr": 4.281352397974382e-05, "epoch": 0.8564194221030682, "percentage": 8.56, "elapsed_time": "0:23:01", "remaining_time": "4:05:47", "throughput": 2399.01, "total_tokens": 3313856} {"current_steps": 5755, "total_steps": 67140, "loss": 0.7799, "lr": 4.285075960679178e-05, "epoch": 0.8571641346440274, "percentage": 8.57, "elapsed_time": "0:23:02", "remaining_time": "4:05:45", "throughput": 2399.08, "total_tokens": 3316640} {"current_steps": 5760, "total_steps": 67140, "loss": 0.6047, "lr": 4.288799523383974e-05, "epoch": 0.8579088471849866, "percentage": 8.58, "elapsed_time": "0:23:03", "remaining_time": "4:05:43", "throughput": 2399.21, "total_tokens": 3319520} {"current_steps": 5765, "total_steps": 67140, "loss": 0.8377, "lr": 4.29252308608877e-05, "epoch": 0.8586535597259458, "percentage": 8.59, "elapsed_time": "0:23:04", "remaining_time": "4:05:41", "throughput": 2399.2, "total_tokens": 3322144} {"current_steps": 5770, "total_steps": 67140, "loss": 0.7336, "lr": 4.296246648793566e-05, "epoch": 0.859398272266905, "percentage": 8.59, "elapsed_time": "0:23:05", "remaining_time": "4:05:39", "throughput": 2399.26, "total_tokens": 3324864} {"current_steps": 5775, "total_steps": 67140, "loss": 0.7268, "lr": 4.299970211498362e-05, "epoch": 0.8601429848078642, "percentage": 8.6, "elapsed_time": "0:23:06", "remaining_time": "4:05:37", "throughput": 2399.36, "total_tokens": 3327712} {"current_steps": 5780, "total_steps": 67140, "loss": 0.6996, "lr": 4.303693774203158e-05, "epoch": 0.8608876973488233, "percentage": 8.61, "elapsed_time": "0:23:08", "remaining_time": "4:05:35", "throughput": 2399.49, "total_tokens": 3330592} {"current_steps": 5785, "total_steps": 67140, "loss": 0.7177, "lr": 4.307417336907954e-05, "epoch": 0.8616324098897825, "percentage": 8.62, "elapsed_time": "0:23:09", "remaining_time": "4:05:33", "throughput": 2399.7, "total_tokens": 3333632} {"current_steps": 5790, "total_steps": 67140, "loss": 0.656, "lr": 4.3111408996127494e-05, "epoch": 0.8623771224307417, "percentage": 8.62, "elapsed_time": "0:23:10", "remaining_time": "4:05:31", "throughput": 2399.74, "total_tokens": 3336384} {"current_steps": 5795, "total_steps": 67140, "loss": 0.6437, "lr": 4.314864462317546e-05, "epoch": 0.8631218349717009, "percentage": 8.63, "elapsed_time": "0:23:11", "remaining_time": "4:05:29", "throughput": 2399.93, "total_tokens": 3339424} {"current_steps": 5800, "total_steps": 67140, "loss": 0.5996, "lr": 4.3185880250223414e-05, "epoch": 0.8638665475126601, "percentage": 8.64, "elapsed_time": "0:23:12", "remaining_time": "4:05:27", "throughput": 2399.98, "total_tokens": 3342176} {"current_steps": 5805, "total_steps": 67140, "loss": 0.5872, "lr": 4.322311587727138e-05, "epoch": 0.8646112600536193, "percentage": 8.65, "elapsed_time": "0:23:13", "remaining_time": "4:05:26", "throughput": 2400.13, "total_tokens": 3345152} {"current_steps": 5810, "total_steps": 67140, "loss": 0.6196, "lr": 4.3260351504319333e-05, "epoch": 0.8653559725945785, "percentage": 8.65, "elapsed_time": "0:23:14", "remaining_time": "4:05:24", "throughput": 2400.25, "total_tokens": 3348032} {"current_steps": 5815, "total_steps": 67140, "loss": 0.7121, "lr": 4.32975871313673e-05, "epoch": 0.8661006851355377, "percentage": 8.66, "elapsed_time": "0:23:16", "remaining_time": "4:05:22", "throughput": 2400.39, "total_tokens": 3351008} {"current_steps": 5820, "total_steps": 67140, "loss": 0.6463, "lr": 4.333482275841525e-05, "epoch": 0.8668453976764968, "percentage": 8.67, "elapsed_time": "0:23:17", "remaining_time": "4:05:21", "throughput": 2400.62, "total_tokens": 3354176} {"current_steps": 5825, "total_steps": 67140, "loss": 0.6423, "lr": 4.3372058385463216e-05, "epoch": 0.867590110217456, "percentage": 8.68, "elapsed_time": "0:23:18", "remaining_time": "4:05:19", "throughput": 2400.81, "total_tokens": 3357248} {"current_steps": 5830, "total_steps": 67140, "loss": 0.6608, "lr": 4.340929401251117e-05, "epoch": 0.8683348227584152, "percentage": 8.68, "elapsed_time": "0:23:19", "remaining_time": "4:05:17", "throughput": 2400.94, "total_tokens": 3360160} {"current_steps": 5835, "total_steps": 67140, "loss": 0.5775, "lr": 4.344652963955913e-05, "epoch": 0.8690795352993744, "percentage": 8.69, "elapsed_time": "0:23:20", "remaining_time": "4:05:15", "throughput": 2400.99, "total_tokens": 3362944} {"current_steps": 5840, "total_steps": 67140, "loss": 0.6896, "lr": 4.348376526660709e-05, "epoch": 0.8698242478403336, "percentage": 8.7, "elapsed_time": "0:23:21", "remaining_time": "4:05:14", "throughput": 2401.19, "total_tokens": 3365984} {"current_steps": 5845, "total_steps": 67140, "loss": 0.7076, "lr": 4.352100089365505e-05, "epoch": 0.8705689603812928, "percentage": 8.71, "elapsed_time": "0:23:22", "remaining_time": "4:05:12", "throughput": 2401.32, "total_tokens": 3368864} {"current_steps": 5850, "total_steps": 67140, "loss": 0.6879, "lr": 4.355823652070301e-05, "epoch": 0.871313672922252, "percentage": 8.71, "elapsed_time": "0:23:24", "remaining_time": "4:05:10", "throughput": 2401.44, "total_tokens": 3371776} {"current_steps": 5855, "total_steps": 67140, "loss": 0.6639, "lr": 4.359547214775097e-05, "epoch": 0.8720583854632112, "percentage": 8.72, "elapsed_time": "0:23:25", "remaining_time": "4:05:08", "throughput": 2401.65, "total_tokens": 3374816} {"current_steps": 5860, "total_steps": 67140, "loss": 0.5651, "lr": 4.363270777479893e-05, "epoch": 0.8728030980041704, "percentage": 8.73, "elapsed_time": "0:23:26", "remaining_time": "4:05:06", "throughput": 2401.75, "total_tokens": 3377664} {"current_steps": 5865, "total_steps": 67140, "loss": 0.7148, "lr": 4.366994340184689e-05, "epoch": 0.8735478105451295, "percentage": 8.74, "elapsed_time": "0:23:27", "remaining_time": "4:05:04", "throughput": 2401.75, "total_tokens": 3380288} {"current_steps": 5870, "total_steps": 67140, "loss": 0.6903, "lr": 4.370717902889485e-05, "epoch": 0.8742925230860887, "percentage": 8.74, "elapsed_time": "0:23:28", "remaining_time": "4:05:02", "throughput": 2401.93, "total_tokens": 3383328} {"current_steps": 5875, "total_steps": 67140, "loss": 0.6803, "lr": 4.374441465594281e-05, "epoch": 0.8750372356270479, "percentage": 8.75, "elapsed_time": "0:23:29", "remaining_time": "4:05:00", "throughput": 2402.05, "total_tokens": 3386240} {"current_steps": 5880, "total_steps": 67140, "loss": 0.6721, "lr": 4.3781650282990765e-05, "epoch": 0.8757819481680071, "percentage": 8.76, "elapsed_time": "0:23:30", "remaining_time": "4:04:58", "throughput": 2402.1, "total_tokens": 3388960} {"current_steps": 5885, "total_steps": 67140, "loss": 0.6035, "lr": 4.381888591003873e-05, "epoch": 0.8765266607089663, "percentage": 8.77, "elapsed_time": "0:23:31", "remaining_time": "4:04:56", "throughput": 2402.19, "total_tokens": 3391744} {"current_steps": 5890, "total_steps": 67140, "loss": 0.7935, "lr": 4.3856121537086684e-05, "epoch": 0.8772713732499255, "percentage": 8.77, "elapsed_time": "0:23:33", "remaining_time": "4:04:54", "throughput": 2402.18, "total_tokens": 3394400} {"current_steps": 5895, "total_steps": 67140, "loss": 0.8589, "lr": 4.389335716413465e-05, "epoch": 0.8780160857908847, "percentage": 8.78, "elapsed_time": "0:23:34", "remaining_time": "4:04:52", "throughput": 2402.28, "total_tokens": 3397280} {"current_steps": 5900, "total_steps": 67140, "loss": 0.7975, "lr": 4.3930592791182604e-05, "epoch": 0.878760798331844, "percentage": 8.79, "elapsed_time": "0:23:35", "remaining_time": "4:04:50", "throughput": 2402.35, "total_tokens": 3400160} {"current_steps": 5905, "total_steps": 67140, "loss": 0.7266, "lr": 4.396782841823057e-05, "epoch": 0.8795055108728032, "percentage": 8.8, "elapsed_time": "0:23:36", "remaining_time": "4:04:49", "throughput": 2402.58, "total_tokens": 3403392} {"current_steps": 5910, "total_steps": 67140, "loss": 0.7834, "lr": 4.4005064045278524e-05, "epoch": 0.8802502234137622, "percentage": 8.8, "elapsed_time": "0:23:37", "remaining_time": "4:04:48", "throughput": 2402.77, "total_tokens": 3406432} {"current_steps": 5915, "total_steps": 67140, "loss": 0.6892, "lr": 4.404229967232648e-05, "epoch": 0.8809949359547214, "percentage": 8.81, "elapsed_time": "0:23:38", "remaining_time": "4:04:46", "throughput": 2402.84, "total_tokens": 3409248} {"current_steps": 5920, "total_steps": 67140, "loss": 0.6784, "lr": 4.4079535299374443e-05, "epoch": 0.8817396484956807, "percentage": 8.82, "elapsed_time": "0:23:39", "remaining_time": "4:04:44", "throughput": 2402.92, "total_tokens": 3412064} {"current_steps": 5925, "total_steps": 67140, "loss": 0.6719, "lr": 4.41167709264224e-05, "epoch": 0.8824843610366399, "percentage": 8.82, "elapsed_time": "0:23:41", "remaining_time": "4:04:42", "throughput": 2402.98, "total_tokens": 3414816} {"current_steps": 5930, "total_steps": 67140, "loss": 0.7784, "lr": 4.415400655347036e-05, "epoch": 0.883229073577599, "percentage": 8.83, "elapsed_time": "0:23:42", "remaining_time": "4:04:40", "throughput": 2403.08, "total_tokens": 3417664} {"current_steps": 5935, "total_steps": 67140, "loss": 0.861, "lr": 4.419124218051832e-05, "epoch": 0.8839737861185583, "percentage": 8.84, "elapsed_time": "0:23:43", "remaining_time": "4:04:38", "throughput": 2403.15, "total_tokens": 3420448} {"current_steps": 5940, "total_steps": 67140, "loss": 0.6302, "lr": 4.422847780756628e-05, "epoch": 0.8847184986595175, "percentage": 8.85, "elapsed_time": "0:23:44", "remaining_time": "4:04:35", "throughput": 2403.16, "total_tokens": 3423136} {"current_steps": 5945, "total_steps": 67140, "loss": 0.594, "lr": 4.426571343461424e-05, "epoch": 0.8854632112004767, "percentage": 8.85, "elapsed_time": "0:23:45", "remaining_time": "4:04:33", "throughput": 2403.16, "total_tokens": 3425792} {"current_steps": 5950, "total_steps": 67140, "loss": 0.6339, "lr": 4.43029490616622e-05, "epoch": 0.8862079237414358, "percentage": 8.86, "elapsed_time": "0:23:46", "remaining_time": "4:04:31", "throughput": 2403.19, "total_tokens": 3428544} {"current_steps": 5955, "total_steps": 67140, "loss": 0.6014, "lr": 4.4340184688710166e-05, "epoch": 0.886952636282395, "percentage": 8.87, "elapsed_time": "0:23:47", "remaining_time": "4:04:29", "throughput": 2403.2, "total_tokens": 3431200} {"current_steps": 5960, "total_steps": 67140, "loss": 0.7535, "lr": 4.4377420315758115e-05, "epoch": 0.8876973488233542, "percentage": 8.88, "elapsed_time": "0:23:48", "remaining_time": "4:04:27", "throughput": 2403.18, "total_tokens": 3433760} {"current_steps": 5965, "total_steps": 67140, "loss": 0.6332, "lr": 4.441465594280608e-05, "epoch": 0.8884420613643134, "percentage": 8.88, "elapsed_time": "0:23:50", "remaining_time": "4:04:25", "throughput": 2403.37, "total_tokens": 3436896} {"current_steps": 5970, "total_steps": 67140, "loss": 0.6805, "lr": 4.4451891569854035e-05, "epoch": 0.8891867739052726, "percentage": 8.89, "elapsed_time": "0:23:51", "remaining_time": "4:04:24", "throughput": 2403.64, "total_tokens": 3440128} {"current_steps": 5975, "total_steps": 67140, "loss": 0.7024, "lr": 4.4489127196902e-05, "epoch": 0.8899314864462318, "percentage": 8.9, "elapsed_time": "0:23:52", "remaining_time": "4:04:22", "throughput": 2403.78, "total_tokens": 3443072} {"current_steps": 5980, "total_steps": 67140, "loss": 0.7194, "lr": 4.4526362823949955e-05, "epoch": 0.890676198987191, "percentage": 8.91, "elapsed_time": "0:23:53", "remaining_time": "4:04:20", "throughput": 2403.85, "total_tokens": 3445888} {"current_steps": 5985, "total_steps": 67140, "loss": 0.7793, "lr": 4.456359845099792e-05, "epoch": 0.8914209115281502, "percentage": 8.91, "elapsed_time": "0:23:54", "remaining_time": "4:04:18", "throughput": 2403.92, "total_tokens": 3448672} {"current_steps": 5990, "total_steps": 67140, "loss": 0.9145, "lr": 4.4600834078045875e-05, "epoch": 0.8921656240691094, "percentage": 8.92, "elapsed_time": "0:23:55", "remaining_time": "4:04:17", "throughput": 2404.06, "total_tokens": 3451648} {"current_steps": 5995, "total_steps": 67140, "loss": 0.5987, "lr": 4.463806970509384e-05, "epoch": 0.8929103366100685, "percentage": 8.93, "elapsed_time": "0:23:56", "remaining_time": "4:04:15", "throughput": 2404.18, "total_tokens": 3454592} {"current_steps": 6000, "total_steps": 67140, "loss": 0.6858, "lr": 4.46753053321418e-05, "epoch": 0.8936550491510277, "percentage": 8.94, "elapsed_time": "0:23:57", "remaining_time": "4:04:13", "throughput": 2404.12, "total_tokens": 3457120} {"current_steps": 6005, "total_steps": 67140, "loss": 0.7994, "lr": 4.471254095918975e-05, "epoch": 0.8943997616919869, "percentage": 8.94, "elapsed_time": "0:23:59", "remaining_time": "4:04:12", "throughput": 2404.47, "total_tokens": 3460608} {"current_steps": 6010, "total_steps": 67140, "loss": 0.909, "lr": 4.4749776586237714e-05, "epoch": 0.8951444742329461, "percentage": 8.95, "elapsed_time": "0:24:00", "remaining_time": "4:04:10", "throughput": 2404.69, "total_tokens": 3463744} {"current_steps": 6015, "total_steps": 67140, "loss": 0.7573, "lr": 4.478701221328567e-05, "epoch": 0.8958891867739053, "percentage": 8.96, "elapsed_time": "0:24:01", "remaining_time": "4:04:09", "throughput": 2404.76, "total_tokens": 3466560} {"current_steps": 6020, "total_steps": 67140, "loss": 0.8163, "lr": 4.4824247840333634e-05, "epoch": 0.8966338993148645, "percentage": 8.97, "elapsed_time": "0:24:02", "remaining_time": "4:04:07", "throughput": 2404.83, "total_tokens": 3469376} {"current_steps": 6025, "total_steps": 67140, "loss": 0.6355, "lr": 4.486148346738159e-05, "epoch": 0.8973786118558237, "percentage": 8.97, "elapsed_time": "0:24:03", "remaining_time": "4:04:05", "throughput": 2404.95, "total_tokens": 3472288} {"current_steps": 6030, "total_steps": 67140, "loss": 0.8251, "lr": 4.4898719094429553e-05, "epoch": 0.8981233243967829, "percentage": 8.98, "elapsed_time": "0:24:04", "remaining_time": "4:04:03", "throughput": 2404.96, "total_tokens": 3474944} {"current_steps": 6035, "total_steps": 67140, "loss": 0.8086, "lr": 4.493595472147752e-05, "epoch": 0.898868036937742, "percentage": 8.99, "elapsed_time": "0:24:06", "remaining_time": "4:04:01", "throughput": 2404.98, "total_tokens": 3477664} {"current_steps": 6040, "total_steps": 67140, "loss": 0.7095, "lr": 4.497319034852547e-05, "epoch": 0.8996127494787012, "percentage": 9.0, "elapsed_time": "0:24:07", "remaining_time": "4:03:59", "throughput": 2405.04, "total_tokens": 3480416} {"current_steps": 6045, "total_steps": 67140, "loss": 0.7951, "lr": 4.501042597557343e-05, "epoch": 0.9003574620196604, "percentage": 9.0, "elapsed_time": "0:24:08", "remaining_time": "4:03:56", "throughput": 2405.08, "total_tokens": 3483136} {"current_steps": 6050, "total_steps": 67140, "loss": 0.7529, "lr": 4.5047661602621386e-05, "epoch": 0.9011021745606196, "percentage": 9.01, "elapsed_time": "0:24:09", "remaining_time": "4:03:54", "throughput": 2405.05, "total_tokens": 3485728} {"current_steps": 6055, "total_steps": 67140, "loss": 0.7826, "lr": 4.508489722966935e-05, "epoch": 0.9018468871015788, "percentage": 9.02, "elapsed_time": "0:24:10", "remaining_time": "4:03:52", "throughput": 2405.15, "total_tokens": 3488544} {"current_steps": 6060, "total_steps": 67140, "loss": 0.6237, "lr": 4.5122132856717306e-05, "epoch": 0.902591599642538, "percentage": 9.03, "elapsed_time": "0:24:11", "remaining_time": "4:03:51", "throughput": 2405.39, "total_tokens": 3491744} {"current_steps": 6065, "total_steps": 67140, "loss": 0.7433, "lr": 4.515936848376527e-05, "epoch": 0.9033363121834972, "percentage": 9.03, "elapsed_time": "0:24:12", "remaining_time": "4:03:49", "throughput": 2405.49, "total_tokens": 3494592} {"current_steps": 6070, "total_steps": 67140, "loss": 0.5769, "lr": 4.5196604110813225e-05, "epoch": 0.9040810247244564, "percentage": 9.04, "elapsed_time": "0:24:13", "remaining_time": "4:03:47", "throughput": 2405.53, "total_tokens": 3497344} {"current_steps": 6075, "total_steps": 67140, "loss": 0.7076, "lr": 4.523383973786119e-05, "epoch": 0.9048257372654156, "percentage": 9.05, "elapsed_time": "0:24:15", "remaining_time": "4:03:45", "throughput": 2405.61, "total_tokens": 3500224} {"current_steps": 6080, "total_steps": 67140, "loss": 0.6652, "lr": 4.527107536490915e-05, "epoch": 0.9055704498063747, "percentage": 9.06, "elapsed_time": "0:24:16", "remaining_time": "4:03:43", "throughput": 2405.67, "total_tokens": 3503040} {"current_steps": 6085, "total_steps": 67140, "loss": 0.6812, "lr": 4.530831099195711e-05, "epoch": 0.9063151623473339, "percentage": 9.06, "elapsed_time": "0:24:17", "remaining_time": "4:03:42", "throughput": 2405.83, "total_tokens": 3506016} {"current_steps": 6090, "total_steps": 67140, "loss": 0.7995, "lr": 4.5345546619005065e-05, "epoch": 0.9070598748882931, "percentage": 9.07, "elapsed_time": "0:24:18", "remaining_time": "4:03:40", "throughput": 2406.01, "total_tokens": 3509088} {"current_steps": 6095, "total_steps": 67140, "loss": 0.634, "lr": 4.538278224605302e-05, "epoch": 0.9078045874292523, "percentage": 9.08, "elapsed_time": "0:24:19", "remaining_time": "4:03:38", "throughput": 2406.08, "total_tokens": 3511904} {"current_steps": 6100, "total_steps": 67140, "loss": 0.6532, "lr": 4.5420017873100985e-05, "epoch": 0.9085492999702115, "percentage": 9.09, "elapsed_time": "0:24:20", "remaining_time": "4:03:36", "throughput": 2406.12, "total_tokens": 3514624} {"current_steps": 6105, "total_steps": 67140, "loss": 0.5081, "lr": 4.545725350014894e-05, "epoch": 0.9092940125111707, "percentage": 9.09, "elapsed_time": "0:24:21", "remaining_time": "4:03:34", "throughput": 2406.17, "total_tokens": 3517408} {"current_steps": 6110, "total_steps": 67140, "loss": 0.9195, "lr": 4.5494489127196904e-05, "epoch": 0.9100387250521299, "percentage": 9.1, "elapsed_time": "0:24:23", "remaining_time": "4:03:33", "throughput": 2406.4, "total_tokens": 3520576} {"current_steps": 6115, "total_steps": 67140, "loss": 0.944, "lr": 4.553172475424487e-05, "epoch": 0.9107834375930891, "percentage": 9.11, "elapsed_time": "0:24:24", "remaining_time": "4:03:31", "throughput": 2406.49, "total_tokens": 3523424} {"current_steps": 6120, "total_steps": 67140, "loss": 0.5694, "lr": 4.5568960381292824e-05, "epoch": 0.9115281501340483, "percentage": 9.12, "elapsed_time": "0:24:25", "remaining_time": "4:03:29", "throughput": 2406.62, "total_tokens": 3526400} {"current_steps": 6125, "total_steps": 67140, "loss": 0.7714, "lr": 4.560619600834079e-05, "epoch": 0.9122728626750074, "percentage": 9.12, "elapsed_time": "0:24:26", "remaining_time": "4:03:29", "throughput": 2407.0, "total_tokens": 3529952} {"current_steps": 6130, "total_steps": 67140, "loss": 0.7384, "lr": 4.5643431635388744e-05, "epoch": 0.9130175752159666, "percentage": 9.13, "elapsed_time": "0:24:27", "remaining_time": "4:03:27", "throughput": 2407.16, "total_tokens": 3532992} {"current_steps": 6135, "total_steps": 67140, "loss": 0.7224, "lr": 4.56806672624367e-05, "epoch": 0.9137622877569258, "percentage": 9.14, "elapsed_time": "0:24:28", "remaining_time": "4:03:25", "throughput": 2407.38, "total_tokens": 3536096} {"current_steps": 6140, "total_steps": 67140, "loss": 0.738, "lr": 4.5717902889484657e-05, "epoch": 0.914507000297885, "percentage": 9.15, "elapsed_time": "0:24:30", "remaining_time": "4:03:24", "throughput": 2407.7, "total_tokens": 3539456} {"current_steps": 6145, "total_steps": 67140, "loss": 0.8247, "lr": 4.575513851653262e-05, "epoch": 0.9152517128388442, "percentage": 9.15, "elapsed_time": "0:24:31", "remaining_time": "4:03:23", "throughput": 2407.87, "total_tokens": 3542464} {"current_steps": 6150, "total_steps": 67140, "loss": 0.7361, "lr": 4.579237414358058e-05, "epoch": 0.9159964253798034, "percentage": 9.16, "elapsed_time": "0:24:32", "remaining_time": "4:03:21", "throughput": 2408.11, "total_tokens": 3545632} {"current_steps": 6155, "total_steps": 67140, "loss": 0.7177, "lr": 4.582960977062854e-05, "epoch": 0.9167411379207626, "percentage": 9.17, "elapsed_time": "0:24:33", "remaining_time": "4:03:19", "throughput": 2408.27, "total_tokens": 3548640} {"current_steps": 6160, "total_steps": 67140, "loss": 0.7537, "lr": 4.58668453976765e-05, "epoch": 0.9174858504617218, "percentage": 9.17, "elapsed_time": "0:24:34", "remaining_time": "4:03:17", "throughput": 2408.34, "total_tokens": 3551424} {"current_steps": 6165, "total_steps": 67140, "loss": 0.802, "lr": 4.590408102472446e-05, "epoch": 0.9182305630026809, "percentage": 9.18, "elapsed_time": "0:24:35", "remaining_time": "4:03:15", "throughput": 2408.32, "total_tokens": 3554080} {"current_steps": 6170, "total_steps": 67140, "loss": 0.7169, "lr": 4.594131665177242e-05, "epoch": 0.9189752755436401, "percentage": 9.19, "elapsed_time": "0:24:36", "remaining_time": "4:03:14", "throughput": 2408.42, "total_tokens": 3556960} {"current_steps": 6175, "total_steps": 67140, "loss": 0.594, "lr": 4.597855227882037e-05, "epoch": 0.9197199880845993, "percentage": 9.2, "elapsed_time": "0:24:38", "remaining_time": "4:03:12", "throughput": 2408.62, "total_tokens": 3560064} {"current_steps": 6180, "total_steps": 67140, "loss": 0.5869, "lr": 4.6015787905868335e-05, "epoch": 0.9204647006255585, "percentage": 9.2, "elapsed_time": "0:24:39", "remaining_time": "4:03:10", "throughput": 2408.75, "total_tokens": 3563040} {"current_steps": 6185, "total_steps": 67140, "loss": 0.6253, "lr": 4.605302353291629e-05, "epoch": 0.9212094131665177, "percentage": 9.21, "elapsed_time": "0:24:40", "remaining_time": "4:03:09", "throughput": 2409.0, "total_tokens": 3566272} {"current_steps": 6190, "total_steps": 67140, "loss": 0.7159, "lr": 4.6090259159964255e-05, "epoch": 0.9219541257074769, "percentage": 9.22, "elapsed_time": "0:24:41", "remaining_time": "4:03:07", "throughput": 2409.07, "total_tokens": 3569120} {"current_steps": 6195, "total_steps": 67140, "loss": 0.6174, "lr": 4.612749478701222e-05, "epoch": 0.9226988382484361, "percentage": 9.23, "elapsed_time": "0:24:42", "remaining_time": "4:03:06", "throughput": 2409.18, "total_tokens": 3572064} {"current_steps": 6200, "total_steps": 67140, "loss": 0.8325, "lr": 4.6164730414060175e-05, "epoch": 0.9234435507893953, "percentage": 9.23, "elapsed_time": "0:24:43", "remaining_time": "4:03:04", "throughput": 2409.27, "total_tokens": 3574944} {"current_steps": 6205, "total_steps": 67140, "loss": 0.6088, "lr": 4.620196604110814e-05, "epoch": 0.9241882633303545, "percentage": 9.24, "elapsed_time": "0:24:45", "remaining_time": "4:03:03", "throughput": 2409.5, "total_tokens": 3578176} {"current_steps": 6210, "total_steps": 67140, "loss": 0.7398, "lr": 4.6239201668156095e-05, "epoch": 0.9249329758713136, "percentage": 9.25, "elapsed_time": "0:24:46", "remaining_time": "4:03:01", "throughput": 2409.7, "total_tokens": 3581280} {"current_steps": 6215, "total_steps": 67140, "loss": 0.6807, "lr": 4.627643729520406e-05, "epoch": 0.9256776884122728, "percentage": 9.26, "elapsed_time": "0:24:47", "remaining_time": "4:03:00", "throughput": 2409.74, "total_tokens": 3584064} {"current_steps": 6220, "total_steps": 67140, "loss": 0.6213, "lr": 4.631367292225201e-05, "epoch": 0.926422400953232, "percentage": 9.26, "elapsed_time": "0:24:48", "remaining_time": "4:02:58", "throughput": 2409.98, "total_tokens": 3587200} {"current_steps": 6225, "total_steps": 67140, "loss": 0.7124, "lr": 4.635090854929997e-05, "epoch": 0.9271671134941912, "percentage": 9.27, "elapsed_time": "0:24:49", "remaining_time": "4:02:56", "throughput": 2410.13, "total_tokens": 3590208} {"current_steps": 6230, "total_steps": 67140, "loss": 0.7639, "lr": 4.6388144176347934e-05, "epoch": 0.9279118260351504, "percentage": 9.28, "elapsed_time": "0:24:50", "remaining_time": "4:02:55", "throughput": 2410.26, "total_tokens": 3593152} {"current_steps": 6235, "total_steps": 67140, "loss": 0.695, "lr": 4.642537980339589e-05, "epoch": 0.9286565385761096, "percentage": 9.29, "elapsed_time": "0:24:51", "remaining_time": "4:02:53", "throughput": 2410.41, "total_tokens": 3596160} {"current_steps": 6240, "total_steps": 67140, "loss": 0.8558, "lr": 4.6462615430443854e-05, "epoch": 0.9294012511170688, "percentage": 9.29, "elapsed_time": "0:24:53", "remaining_time": "4:02:51", "throughput": 2410.52, "total_tokens": 3599104} {"current_steps": 6245, "total_steps": 67140, "loss": 0.8374, "lr": 4.649985105749181e-05, "epoch": 0.930145963658028, "percentage": 9.3, "elapsed_time": "0:24:54", "remaining_time": "4:02:50", "throughput": 2410.69, "total_tokens": 3602144} {"current_steps": 6250, "total_steps": 67140, "loss": 0.652, "lr": 4.653708668453977e-05, "epoch": 0.9308906761989872, "percentage": 9.31, "elapsed_time": "0:24:55", "remaining_time": "4:02:48", "throughput": 2410.89, "total_tokens": 3605280} {"current_steps": 6255, "total_steps": 67140, "loss": 0.796, "lr": 4.657432231158773e-05, "epoch": 0.9316353887399463, "percentage": 9.32, "elapsed_time": "0:24:56", "remaining_time": "4:02:47", "throughput": 2410.98, "total_tokens": 3608128} {"current_steps": 6260, "total_steps": 67140, "loss": 0.6225, "lr": 4.661155793863569e-05, "epoch": 0.9323801012809055, "percentage": 9.32, "elapsed_time": "0:24:57", "remaining_time": "4:02:44", "throughput": 2410.91, "total_tokens": 3610624} {"current_steps": 6265, "total_steps": 67140, "loss": 0.6926, "lr": 4.664879356568364e-05, "epoch": 0.9331248138218647, "percentage": 9.33, "elapsed_time": "0:24:58", "remaining_time": "4:02:42", "throughput": 2411.01, "total_tokens": 3613504} {"current_steps": 6270, "total_steps": 67140, "loss": 0.6537, "lr": 4.6686029192731606e-05, "epoch": 0.9338695263628239, "percentage": 9.34, "elapsed_time": "0:24:59", "remaining_time": "4:02:40", "throughput": 2411.09, "total_tokens": 3616320} {"current_steps": 6275, "total_steps": 67140, "loss": 0.6086, "lr": 4.672326481977957e-05, "epoch": 0.9346142389037831, "percentage": 9.35, "elapsed_time": "0:25:01", "remaining_time": "4:02:39", "throughput": 2411.13, "total_tokens": 3619104} {"current_steps": 6280, "total_steps": 67140, "loss": 0.6367, "lr": 4.6760500446827526e-05, "epoch": 0.9353589514447423, "percentage": 9.35, "elapsed_time": "0:25:02", "remaining_time": "4:02:37", "throughput": 2411.13, "total_tokens": 3621792} {"current_steps": 6285, "total_steps": 67140, "loss": 0.6187, "lr": 4.679773607387549e-05, "epoch": 0.9361036639857016, "percentage": 9.36, "elapsed_time": "0:25:03", "remaining_time": "4:02:35", "throughput": 2411.18, "total_tokens": 3624544} {"current_steps": 6290, "total_steps": 67140, "loss": 0.4308, "lr": 4.6834971700923445e-05, "epoch": 0.9368483765266608, "percentage": 9.37, "elapsed_time": "0:25:04", "remaining_time": "4:02:33", "throughput": 2411.28, "total_tokens": 3627424} {"current_steps": 6295, "total_steps": 67140, "loss": 0.826, "lr": 4.687220732797141e-05, "epoch": 0.9375930890676198, "percentage": 9.38, "elapsed_time": "0:25:05", "remaining_time": "4:02:31", "throughput": 2411.37, "total_tokens": 3630304} {"current_steps": 6300, "total_steps": 67140, "loss": 0.5927, "lr": 4.6909442955019365e-05, "epoch": 0.938337801608579, "percentage": 9.38, "elapsed_time": "0:25:06", "remaining_time": "4:02:29", "throughput": 2411.48, "total_tokens": 3633216} {"current_steps": 6305, "total_steps": 67140, "loss": 0.7599, "lr": 4.694667858206732e-05, "epoch": 0.9390825141495382, "percentage": 9.39, "elapsed_time": "0:25:07", "remaining_time": "4:02:27", "throughput": 2411.55, "total_tokens": 3636000} {"current_steps": 6310, "total_steps": 67140, "loss": 0.7165, "lr": 4.6983914209115285e-05, "epoch": 0.9398272266904975, "percentage": 9.4, "elapsed_time": "0:25:08", "remaining_time": "4:02:25", "throughput": 2411.64, "total_tokens": 3638848} {"current_steps": 6315, "total_steps": 67140, "loss": 0.7906, "lr": 4.702114983616324e-05, "epoch": 0.9405719392314567, "percentage": 9.41, "elapsed_time": "0:25:10", "remaining_time": "4:02:24", "throughput": 2411.89, "total_tokens": 3642144} {"current_steps": 6320, "total_steps": 67140, "loss": 0.8511, "lr": 4.7058385463211205e-05, "epoch": 0.9413166517724159, "percentage": 9.41, "elapsed_time": "0:25:11", "remaining_time": "4:02:22", "throughput": 2411.89, "total_tokens": 3644832} {"current_steps": 6325, "total_steps": 67140, "loss": 0.6849, "lr": 4.709562109025916e-05, "epoch": 0.9420613643133751, "percentage": 9.42, "elapsed_time": "0:25:12", "remaining_time": "4:02:21", "throughput": 2411.96, "total_tokens": 3647680} {"current_steps": 6330, "total_steps": 67140, "loss": 0.8673, "lr": 4.7132856717307124e-05, "epoch": 0.9428060768543343, "percentage": 9.43, "elapsed_time": "0:25:13", "remaining_time": "4:02:19", "throughput": 2412.01, "total_tokens": 3650528} {"current_steps": 6335, "total_steps": 67140, "loss": 0.6656, "lr": 4.717009234435508e-05, "epoch": 0.9435507893952935, "percentage": 9.44, "elapsed_time": "0:25:14", "remaining_time": "4:02:17", "throughput": 2412.09, "total_tokens": 3653344} {"current_steps": 6340, "total_steps": 67140, "loss": 0.6565, "lr": 4.7207327971403044e-05, "epoch": 0.9442955019362526, "percentage": 9.44, "elapsed_time": "0:25:15", "remaining_time": "4:02:15", "throughput": 2412.27, "total_tokens": 3656416} {"current_steps": 6345, "total_steps": 67140, "loss": 0.5511, "lr": 4.7244563598451e-05, "epoch": 0.9450402144772118, "percentage": 9.45, "elapsed_time": "0:25:16", "remaining_time": "4:02:14", "throughput": 2412.33, "total_tokens": 3659200} {"current_steps": 6350, "total_steps": 67140, "loss": 0.6816, "lr": 4.728179922549896e-05, "epoch": 0.945784927018171, "percentage": 9.46, "elapsed_time": "0:25:18", "remaining_time": "4:02:12", "throughput": 2412.43, "total_tokens": 3662144} {"current_steps": 6355, "total_steps": 67140, "loss": 0.7802, "lr": 4.731903485254692e-05, "epoch": 0.9465296395591302, "percentage": 9.47, "elapsed_time": "0:25:19", "remaining_time": "4:02:10", "throughput": 2412.42, "total_tokens": 3664768} {"current_steps": 6360, "total_steps": 67140, "loss": 0.6482, "lr": 4.7356270479594877e-05, "epoch": 0.9472743521000894, "percentage": 9.47, "elapsed_time": "0:25:20", "remaining_time": "4:02:08", "throughput": 2412.36, "total_tokens": 3667296} {"current_steps": 6365, "total_steps": 67140, "loss": 0.6367, "lr": 4.739350610664284e-05, "epoch": 0.9480190646410486, "percentage": 9.48, "elapsed_time": "0:25:21", "remaining_time": "4:02:06", "throughput": 2412.43, "total_tokens": 3670112} {"current_steps": 6370, "total_steps": 67140, "loss": 0.6076, "lr": 4.7430741733690796e-05, "epoch": 0.9487637771820078, "percentage": 9.49, "elapsed_time": "0:25:22", "remaining_time": "4:02:04", "throughput": 2412.42, "total_tokens": 3672800} {"current_steps": 6375, "total_steps": 67140, "loss": 0.8135, "lr": 4.746797736073876e-05, "epoch": 0.949508489722967, "percentage": 9.5, "elapsed_time": "0:25:23", "remaining_time": "4:02:02", "throughput": 2412.64, "total_tokens": 3675968} {"current_steps": 6380, "total_steps": 67140, "loss": 0.6186, "lr": 4.7505212987786716e-05, "epoch": 0.9502532022639262, "percentage": 9.5, "elapsed_time": "0:25:24", "remaining_time": "4:02:01", "throughput": 2412.74, "total_tokens": 3678880} {"current_steps": 6385, "total_steps": 67140, "loss": 0.6198, "lr": 4.754244861483468e-05, "epoch": 0.9509979148048853, "percentage": 9.51, "elapsed_time": "0:25:25", "remaining_time": "4:01:59", "throughput": 2412.9, "total_tokens": 3681952} {"current_steps": 6390, "total_steps": 67140, "loss": 0.8326, "lr": 4.7579684241882636e-05, "epoch": 0.9517426273458445, "percentage": 9.52, "elapsed_time": "0:25:27", "remaining_time": "4:01:57", "throughput": 2412.95, "total_tokens": 3684736} {"current_steps": 6395, "total_steps": 67140, "loss": 0.7751, "lr": 4.761691986893059e-05, "epoch": 0.9524873398868037, "percentage": 9.52, "elapsed_time": "0:25:28", "remaining_time": "4:01:56", "throughput": 2413.1, "total_tokens": 3687744} {"current_steps": 6400, "total_steps": 67140, "loss": 0.7113, "lr": 4.7654155495978555e-05, "epoch": 0.9532320524277629, "percentage": 9.53, "elapsed_time": "0:25:29", "remaining_time": "4:01:54", "throughput": 2413.28, "total_tokens": 3690848} {"current_steps": 6405, "total_steps": 67140, "loss": 0.6984, "lr": 4.769139112302651e-05, "epoch": 0.9539767649687221, "percentage": 9.54, "elapsed_time": "0:25:30", "remaining_time": "4:01:53", "throughput": 2413.43, "total_tokens": 3693856} {"current_steps": 6410, "total_steps": 67140, "loss": 0.7647, "lr": 4.7728626750074475e-05, "epoch": 0.9547214775096813, "percentage": 9.55, "elapsed_time": "0:25:31", "remaining_time": "4:01:51", "throughput": 2413.5, "total_tokens": 3696608} {"current_steps": 6415, "total_steps": 67140, "loss": 0.649, "lr": 4.776586237712243e-05, "epoch": 0.9554661900506405, "percentage": 9.55, "elapsed_time": "0:25:32", "remaining_time": "4:01:49", "throughput": 2413.61, "total_tokens": 3699552} {"current_steps": 6420, "total_steps": 67140, "loss": 0.7236, "lr": 4.7803098004170395e-05, "epoch": 0.9562109025915997, "percentage": 9.56, "elapsed_time": "0:25:33", "remaining_time": "4:01:47", "throughput": 2413.61, "total_tokens": 3702176} {"current_steps": 6425, "total_steps": 67140, "loss": 0.8815, "lr": 4.784033363121835e-05, "epoch": 0.9569556151325588, "percentage": 9.57, "elapsed_time": "0:25:34", "remaining_time": "4:01:45", "throughput": 2413.66, "total_tokens": 3704960} {"current_steps": 6430, "total_steps": 67140, "loss": 0.7041, "lr": 4.7877569258266315e-05, "epoch": 0.957700327673518, "percentage": 9.58, "elapsed_time": "0:25:36", "remaining_time": "4:01:43", "throughput": 2413.65, "total_tokens": 3707584} {"current_steps": 6435, "total_steps": 67140, "loss": 0.6745, "lr": 4.791480488531427e-05, "epoch": 0.9584450402144772, "percentage": 9.58, "elapsed_time": "0:25:37", "remaining_time": "4:01:41", "throughput": 2413.64, "total_tokens": 3710240} {"current_steps": 6440, "total_steps": 67140, "loss": 0.7879, "lr": 4.795204051236223e-05, "epoch": 0.9591897527554364, "percentage": 9.59, "elapsed_time": "0:25:38", "remaining_time": "4:01:39", "throughput": 2413.66, "total_tokens": 3712960} {"current_steps": 6445, "total_steps": 67140, "loss": 0.7153, "lr": 4.798927613941019e-05, "epoch": 0.9599344652963956, "percentage": 9.6, "elapsed_time": "0:25:39", "remaining_time": "4:01:37", "throughput": 2413.62, "total_tokens": 3715552} {"current_steps": 6450, "total_steps": 67140, "loss": 0.7101, "lr": 4.802651176645815e-05, "epoch": 0.9606791778373548, "percentage": 9.61, "elapsed_time": "0:25:40", "remaining_time": "4:01:35", "throughput": 2413.65, "total_tokens": 3718304} {"current_steps": 6455, "total_steps": 67140, "loss": 0.7705, "lr": 4.806374739350611e-05, "epoch": 0.961423890378314, "percentage": 9.61, "elapsed_time": "0:25:41", "remaining_time": "4:01:33", "throughput": 2413.77, "total_tokens": 3721280} {"current_steps": 6460, "total_steps": 67140, "loss": 0.5208, "lr": 4.810098302055407e-05, "epoch": 0.9621686029192732, "percentage": 9.62, "elapsed_time": "0:25:42", "remaining_time": "4:01:32", "throughput": 2413.99, "total_tokens": 3724480} {"current_steps": 6465, "total_steps": 67140, "loss": 0.7368, "lr": 4.813821864760203e-05, "epoch": 0.9629133154602324, "percentage": 9.63, "elapsed_time": "0:25:43", "remaining_time": "4:01:30", "throughput": 2414.03, "total_tokens": 3727232} {"current_steps": 6470, "total_steps": 67140, "loss": 0.7566, "lr": 4.8175454274649987e-05, "epoch": 0.9636580280011915, "percentage": 9.64, "elapsed_time": "0:25:45", "remaining_time": "4:01:28", "throughput": 2414.06, "total_tokens": 3729952} {"current_steps": 6475, "total_steps": 67140, "loss": 0.6934, "lr": 4.821268990169795e-05, "epoch": 0.9644027405421507, "percentage": 9.64, "elapsed_time": "0:25:46", "remaining_time": "4:01:26", "throughput": 2414.16, "total_tokens": 3732800} {"current_steps": 6480, "total_steps": 67140, "loss": 0.5474, "lr": 4.8249925528745906e-05, "epoch": 0.9651474530831099, "percentage": 9.65, "elapsed_time": "0:25:47", "remaining_time": "4:01:24", "throughput": 2414.17, "total_tokens": 3735488} {"current_steps": 6485, "total_steps": 67140, "loss": 0.8892, "lr": 4.828716115579386e-05, "epoch": 0.9658921656240691, "percentage": 9.66, "elapsed_time": "0:25:48", "remaining_time": "4:01:22", "throughput": 2414.26, "total_tokens": 3738304} {"current_steps": 6490, "total_steps": 67140, "loss": 0.8015, "lr": 4.8324396782841826e-05, "epoch": 0.9666368781650283, "percentage": 9.67, "elapsed_time": "0:25:49", "remaining_time": "4:01:20", "throughput": 2414.29, "total_tokens": 3741024} {"current_steps": 6495, "total_steps": 67140, "loss": 0.8155, "lr": 4.836163240988978e-05, "epoch": 0.9673815907059875, "percentage": 9.67, "elapsed_time": "0:25:50", "remaining_time": "4:01:21", "throughput": 2414.61, "total_tokens": 3744992} {"current_steps": 6500, "total_steps": 67140, "loss": 0.8119, "lr": 4.8398868036937746e-05, "epoch": 0.9681263032469467, "percentage": 9.68, "elapsed_time": "0:25:52", "remaining_time": "4:01:19", "throughput": 2414.69, "total_tokens": 3747840} {"current_steps": 6505, "total_steps": 67140, "loss": 0.7158, "lr": 4.84361036639857e-05, "epoch": 0.9688710157879059, "percentage": 9.69, "elapsed_time": "0:25:53", "remaining_time": "4:01:18", "throughput": 2414.79, "total_tokens": 3750752} {"current_steps": 6510, "total_steps": 67140, "loss": 0.7128, "lr": 4.8473339291033665e-05, "epoch": 0.9696157283288651, "percentage": 9.7, "elapsed_time": "0:25:54", "remaining_time": "4:01:16", "throughput": 2414.96, "total_tokens": 3753856} {"current_steps": 6515, "total_steps": 67140, "loss": 0.6702, "lr": 4.851057491808162e-05, "epoch": 0.9703604408698242, "percentage": 9.7, "elapsed_time": "0:25:55", "remaining_time": "4:01:15", "throughput": 2415.02, "total_tokens": 3756704} {"current_steps": 6520, "total_steps": 67140, "loss": 0.6817, "lr": 4.8547810545129585e-05, "epoch": 0.9711051534107834, "percentage": 9.71, "elapsed_time": "0:25:56", "remaining_time": "4:01:13", "throughput": 2415.06, "total_tokens": 3759488} {"current_steps": 6525, "total_steps": 67140, "loss": 0.669, "lr": 4.858504617217754e-05, "epoch": 0.9718498659517426, "percentage": 9.72, "elapsed_time": "0:25:57", "remaining_time": "4:01:11", "throughput": 2415.1, "total_tokens": 3762272} {"current_steps": 6530, "total_steps": 67140, "loss": 0.68, "lr": 4.86222817992255e-05, "epoch": 0.9725945784927018, "percentage": 9.73, "elapsed_time": "0:25:58", "remaining_time": "4:01:09", "throughput": 2415.12, "total_tokens": 3764928} {"current_steps": 6535, "total_steps": 67140, "loss": 0.6004, "lr": 4.865951742627346e-05, "epoch": 0.973339291033661, "percentage": 9.73, "elapsed_time": "0:26:00", "remaining_time": "4:01:08", "throughput": 2415.37, "total_tokens": 3768192} {"current_steps": 6540, "total_steps": 67140, "loss": 0.7504, "lr": 4.869675305332142e-05, "epoch": 0.9740840035746202, "percentage": 9.74, "elapsed_time": "0:26:01", "remaining_time": "4:01:06", "throughput": 2415.49, "total_tokens": 3771136} {"current_steps": 6545, "total_steps": 67140, "loss": 0.7014, "lr": 4.873398868036938e-05, "epoch": 0.9748287161155794, "percentage": 9.75, "elapsed_time": "0:26:02", "remaining_time": "4:01:04", "throughput": 2415.6, "total_tokens": 3774112} {"current_steps": 6550, "total_steps": 67140, "loss": 0.7329, "lr": 4.877122430741734e-05, "epoch": 0.9755734286565386, "percentage": 9.76, "elapsed_time": "0:26:03", "remaining_time": "4:01:03", "throughput": 2415.69, "total_tokens": 3777024} {"current_steps": 6555, "total_steps": 67140, "loss": 0.6694, "lr": 4.88084599344653e-05, "epoch": 0.9763181411974977, "percentage": 9.76, "elapsed_time": "0:26:04", "remaining_time": "4:01:01", "throughput": 2415.8, "total_tokens": 3779968} {"current_steps": 6560, "total_steps": 67140, "loss": 0.7573, "lr": 4.8845695561513264e-05, "epoch": 0.9770628537384569, "percentage": 9.77, "elapsed_time": "0:26:05", "remaining_time": "4:00:59", "throughput": 2415.84, "total_tokens": 3782752} {"current_steps": 6565, "total_steps": 67140, "loss": 0.8197, "lr": 4.8882931188561214e-05, "epoch": 0.9778075662794161, "percentage": 9.78, "elapsed_time": "0:26:06", "remaining_time": "4:00:58", "throughput": 2415.95, "total_tokens": 3785664} {"current_steps": 6570, "total_steps": 67140, "loss": 0.6671, "lr": 4.892016681560918e-05, "epoch": 0.9785522788203753, "percentage": 9.79, "elapsed_time": "0:26:08", "remaining_time": "4:00:55", "throughput": 2415.91, "total_tokens": 3788224} {"current_steps": 6575, "total_steps": 67140, "loss": 0.7132, "lr": 4.895740244265713e-05, "epoch": 0.9792969913613345, "percentage": 9.79, "elapsed_time": "0:26:09", "remaining_time": "4:00:54", "throughput": 2416.01, "total_tokens": 3791136} {"current_steps": 6580, "total_steps": 67140, "loss": 0.8186, "lr": 4.8994638069705097e-05, "epoch": 0.9800417039022937, "percentage": 9.8, "elapsed_time": "0:26:10", "remaining_time": "4:00:52", "throughput": 2416.18, "total_tokens": 3794240} {"current_steps": 6585, "total_steps": 67140, "loss": 0.6636, "lr": 4.903187369675305e-05, "epoch": 0.9807864164432529, "percentage": 9.81, "elapsed_time": "0:26:11", "remaining_time": "4:00:51", "throughput": 2416.24, "total_tokens": 3797088} {"current_steps": 6590, "total_steps": 67140, "loss": 0.7817, "lr": 4.9069109323801016e-05, "epoch": 0.9815311289842121, "percentage": 9.82, "elapsed_time": "0:26:12", "remaining_time": "4:00:49", "throughput": 2416.39, "total_tokens": 3800096} {"current_steps": 6595, "total_steps": 67140, "loss": 0.6886, "lr": 4.910634495084897e-05, "epoch": 0.9822758415251713, "percentage": 9.82, "elapsed_time": "0:26:13", "remaining_time": "4:00:48", "throughput": 2416.5, "total_tokens": 3803072} {"current_steps": 6600, "total_steps": 67140, "loss": 0.6457, "lr": 4.9143580577896936e-05, "epoch": 0.9830205540661304, "percentage": 9.83, "elapsed_time": "0:26:14", "remaining_time": "4:00:46", "throughput": 2416.61, "total_tokens": 3806048} {"current_steps": 6605, "total_steps": 67140, "loss": 0.7152, "lr": 4.91808162049449e-05, "epoch": 0.9837652666070896, "percentage": 9.84, "elapsed_time": "0:26:16", "remaining_time": "4:00:44", "throughput": 2416.63, "total_tokens": 3808768} {"current_steps": 6610, "total_steps": 67140, "loss": 0.8576, "lr": 4.921805183199285e-05, "epoch": 0.9845099791480488, "percentage": 9.85, "elapsed_time": "0:26:17", "remaining_time": "4:00:43", "throughput": 2416.82, "total_tokens": 3811872} {"current_steps": 6615, "total_steps": 67140, "loss": 0.7033, "lr": 4.925528745904081e-05, "epoch": 0.985254691689008, "percentage": 9.85, "elapsed_time": "0:26:18", "remaining_time": "4:00:41", "throughput": 2416.98, "total_tokens": 3814944} {"current_steps": 6620, "total_steps": 67140, "loss": 0.7749, "lr": 4.929252308608877e-05, "epoch": 0.9859994042299672, "percentage": 9.86, "elapsed_time": "0:26:19", "remaining_time": "4:00:39", "throughput": 2417.02, "total_tokens": 3817728} {"current_steps": 6625, "total_steps": 67140, "loss": 0.6327, "lr": 4.932975871313673e-05, "epoch": 0.9867441167709264, "percentage": 9.87, "elapsed_time": "0:26:20", "remaining_time": "4:00:38", "throughput": 2417.07, "total_tokens": 3820512} {"current_steps": 6630, "total_steps": 67140, "loss": 0.7178, "lr": 4.936699434018469e-05, "epoch": 0.9874888293118856, "percentage": 9.87, "elapsed_time": "0:26:21", "remaining_time": "4:00:36", "throughput": 2417.28, "total_tokens": 3823712} {"current_steps": 6635, "total_steps": 67140, "loss": 0.673, "lr": 4.940422996723265e-05, "epoch": 0.9882335418528448, "percentage": 9.88, "elapsed_time": "0:26:22", "remaining_time": "4:00:34", "throughput": 2417.28, "total_tokens": 3826336} {"current_steps": 6640, "total_steps": 67140, "loss": 0.5929, "lr": 4.9441465594280615e-05, "epoch": 0.988978254393804, "percentage": 9.89, "elapsed_time": "0:26:24", "remaining_time": "4:00:32", "throughput": 2417.29, "total_tokens": 3828992} {"current_steps": 6645, "total_steps": 67140, "loss": 0.6191, "lr": 4.947870122132857e-05, "epoch": 0.9897229669347631, "percentage": 9.9, "elapsed_time": "0:26:25", "remaining_time": "4:00:30", "throughput": 2417.31, "total_tokens": 3831712} {"current_steps": 6650, "total_steps": 67140, "loss": 0.6532, "lr": 4.9515936848376534e-05, "epoch": 0.9904676794757223, "percentage": 9.9, "elapsed_time": "0:26:26", "remaining_time": "4:00:28", "throughput": 2417.27, "total_tokens": 3834304} {"current_steps": 6655, "total_steps": 67140, "loss": 0.7552, "lr": 4.9553172475424484e-05, "epoch": 0.9912123920166815, "percentage": 9.91, "elapsed_time": "0:26:27", "remaining_time": "4:00:26", "throughput": 2417.3, "total_tokens": 3837056} {"current_steps": 6660, "total_steps": 67140, "loss": 0.6421, "lr": 4.959040810247245e-05, "epoch": 0.9919571045576407, "percentage": 9.92, "elapsed_time": "0:26:28", "remaining_time": "4:00:25", "throughput": 2417.4, "total_tokens": 3840000} {"current_steps": 6665, "total_steps": 67140, "loss": 0.6366, "lr": 4.9627643729520404e-05, "epoch": 0.9927018170986, "percentage": 9.93, "elapsed_time": "0:26:29", "remaining_time": "4:00:23", "throughput": 2417.46, "total_tokens": 3842848} {"current_steps": 6670, "total_steps": 67140, "loss": 0.6876, "lr": 4.966487935656837e-05, "epoch": 0.9934465296395592, "percentage": 9.93, "elapsed_time": "0:26:30", "remaining_time": "4:00:21", "throughput": 2417.49, "total_tokens": 3845600} {"current_steps": 6675, "total_steps": 67140, "loss": 0.7663, "lr": 4.9702114983616324e-05, "epoch": 0.9941912421805184, "percentage": 9.94, "elapsed_time": "0:26:31", "remaining_time": "4:00:20", "throughput": 2417.65, "total_tokens": 3848704} {"current_steps": 6680, "total_steps": 67140, "loss": 0.7558, "lr": 4.973935061066429e-05, "epoch": 0.9949359547214776, "percentage": 9.95, "elapsed_time": "0:26:33", "remaining_time": "4:00:18", "throughput": 2417.77, "total_tokens": 3851680} {"current_steps": 6685, "total_steps": 67140, "loss": 0.7926, "lr": 4.977658623771225e-05, "epoch": 0.9956806672624366, "percentage": 9.96, "elapsed_time": "0:26:34", "remaining_time": "4:00:16", "throughput": 2417.8, "total_tokens": 3854400} {"current_steps": 6690, "total_steps": 67140, "loss": 0.7559, "lr": 4.9813821864760207e-05, "epoch": 0.9964253798033958, "percentage": 9.96, "elapsed_time": "0:26:35", "remaining_time": "4:00:15", "throughput": 2418.01, "total_tokens": 3857632} {"current_steps": 6695, "total_steps": 67140, "loss": 0.6751, "lr": 4.985105749180816e-05, "epoch": 0.997170092344355, "percentage": 9.97, "elapsed_time": "0:26:36", "remaining_time": "4:00:13", "throughput": 2417.99, "total_tokens": 3860192} {"current_steps": 6700, "total_steps": 67140, "loss": 0.6704, "lr": 4.988829311885612e-05, "epoch": 0.9979148048853143, "percentage": 9.98, "elapsed_time": "0:26:37", "remaining_time": "4:00:11", "throughput": 2418.02, "total_tokens": 3862944} {"current_steps": 6705, "total_steps": 67140, "loss": 0.7123, "lr": 4.992552874590408e-05, "epoch": 0.9986595174262735, "percentage": 9.99, "elapsed_time": "0:26:38", "remaining_time": "4:00:09", "throughput": 2418.13, "total_tokens": 3865856} {"current_steps": 6710, "total_steps": 67140, "loss": 0.7028, "lr": 4.996276437295204e-05, "epoch": 0.9994042299672327, "percentage": 9.99, "elapsed_time": "0:26:39", "remaining_time": "4:00:08", "throughput": 2418.2, "total_tokens": 3868704} {"current_steps": 6714, "total_steps": 67140, "eval_loss": 0.6813997030258179, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:27:54", "remaining_time": "4:11:14", "throughput": 2310.95, "total_tokens": 3870688} {"current_steps": 6715, "total_steps": 67140, "loss": 0.5664, "lr": 5e-05, "epoch": 1.0001489425081918, "percentage": 10.0, "elapsed_time": "0:27:56", "remaining_time": "4:11:28", "throughput": 2308.79, "total_tokens": 3871200} {"current_steps": 6720, "total_steps": 67140, "loss": 0.7183, "lr": 4.999999915530083e-05, "epoch": 1.000893655049151, "percentage": 10.01, "elapsed_time": "0:27:57", "remaining_time": "4:11:25", "throughput": 2308.92, "total_tokens": 3873984} {"current_steps": 6725, "total_steps": 67140, "loss": 0.7906, "lr": 4.999999662120335e-05, "epoch": 1.0016383675901102, "percentage": 10.02, "elapsed_time": "0:27:58", "remaining_time": "4:11:23", "throughput": 2309.12, "total_tokens": 3876960} {"current_steps": 6730, "total_steps": 67140, "loss": 0.6571, "lr": 4.999999239770774e-05, "epoch": 1.0023830801310694, "percentage": 10.02, "elapsed_time": "0:28:00", "remaining_time": "4:11:21", "throughput": 2309.33, "total_tokens": 3879968} {"current_steps": 6735, "total_steps": 67140, "loss": 0.7259, "lr": 4.999998648481429e-05, "epoch": 1.0031277926720286, "percentage": 10.03, "elapsed_time": "0:28:01", "remaining_time": "4:11:18", "throughput": 2309.49, "total_tokens": 3882816} {"current_steps": 6740, "total_steps": 67140, "loss": 0.6322, "lr": 4.999997888252339e-05, "epoch": 1.0038725052129878, "percentage": 10.04, "elapsed_time": "0:28:02", "remaining_time": "4:11:16", "throughput": 2309.67, "total_tokens": 3885760} {"current_steps": 6745, "total_steps": 67140, "loss": 0.645, "lr": 4.999996959083556e-05, "epoch": 1.004617217753947, "percentage": 10.05, "elapsed_time": "0:28:03", "remaining_time": "4:11:14", "throughput": 2309.8, "total_tokens": 3888576} {"current_steps": 6750, "total_steps": 67140, "loss": 0.6339, "lr": 4.999995860975143e-05, "epoch": 1.0053619302949062, "percentage": 10.05, "elapsed_time": "0:28:04", "remaining_time": "4:11:11", "throughput": 2309.91, "total_tokens": 3891360} {"current_steps": 6755, "total_steps": 67140, "loss": 0.7399, "lr": 4.9999945939271744e-05, "epoch": 1.0061066428358654, "percentage": 10.06, "elapsed_time": "0:28:05", "remaining_time": "4:11:09", "throughput": 2310.05, "total_tokens": 3894208} {"current_steps": 6760, "total_steps": 67140, "loss": 0.5235, "lr": 4.999993157939735e-05, "epoch": 1.0068513553768246, "percentage": 10.07, "elapsed_time": "0:28:06", "remaining_time": "4:11:07", "throughput": 2310.15, "total_tokens": 3896928} {"current_steps": 6765, "total_steps": 67140, "loss": 0.6901, "lr": 4.999991553012923e-05, "epoch": 1.0075960679177838, "percentage": 10.08, "elapsed_time": "0:28:08", "remaining_time": "4:11:05", "throughput": 2310.36, "total_tokens": 3899968} {"current_steps": 6770, "total_steps": 67140, "loss": 0.6731, "lr": 4.999989779146845e-05, "epoch": 1.008340780458743, "percentage": 10.08, "elapsed_time": "0:28:09", "remaining_time": "4:11:02", "throughput": 2310.45, "total_tokens": 3902688} {"current_steps": 6775, "total_steps": 67140, "loss": 0.694, "lr": 4.999987836341622e-05, "epoch": 1.0090854929997022, "percentage": 10.09, "elapsed_time": "0:28:10", "remaining_time": "4:11:00", "throughput": 2310.58, "total_tokens": 3905504} {"current_steps": 6780, "total_steps": 67140, "loss": 0.7266, "lr": 4.999985724597386e-05, "epoch": 1.0098302055406614, "percentage": 10.1, "elapsed_time": "0:28:11", "remaining_time": "4:10:58", "throughput": 2310.77, "total_tokens": 3908480} {"current_steps": 6785, "total_steps": 67140, "loss": 0.8368, "lr": 4.9999834439142776e-05, "epoch": 1.0105749180816206, "percentage": 10.11, "elapsed_time": "0:28:12", "remaining_time": "4:10:55", "throughput": 2310.85, "total_tokens": 3911168} {"current_steps": 6790, "total_steps": 67140, "loss": 0.5436, "lr": 4.999980994292454e-05, "epoch": 1.0113196306225798, "percentage": 10.11, "elapsed_time": "0:28:13", "remaining_time": "4:10:53", "throughput": 2310.92, "total_tokens": 3913888} {"current_steps": 6795, "total_steps": 67140, "loss": 0.7364, "lr": 4.9999783757320776e-05, "epoch": 1.0120643431635388, "percentage": 10.12, "elapsed_time": "0:28:14", "remaining_time": "4:10:51", "throughput": 2311.06, "total_tokens": 3916768} {"current_steps": 6800, "total_steps": 67140, "loss": 0.645, "lr": 4.9999755882333275e-05, "epoch": 1.012809055704498, "percentage": 10.13, "elapsed_time": "0:28:15", "remaining_time": "4:10:48", "throughput": 2311.19, "total_tokens": 3919552} {"current_steps": 6805, "total_steps": 67140, "loss": 0.8634, "lr": 4.999972631796391e-05, "epoch": 1.0135537682454572, "percentage": 10.14, "elapsed_time": "0:28:17", "remaining_time": "4:10:46", "throughput": 2311.3, "total_tokens": 3922368} {"current_steps": 6810, "total_steps": 67140, "loss": 0.6727, "lr": 4.999969506421468e-05, "epoch": 1.0142984807864164, "percentage": 10.14, "elapsed_time": "0:28:18", "remaining_time": "4:10:44", "throughput": 2311.45, "total_tokens": 3925216} {"current_steps": 6815, "total_steps": 67140, "loss": 0.8229, "lr": 4.99996621210877e-05, "epoch": 1.0150431933273756, "percentage": 10.15, "elapsed_time": "0:28:19", "remaining_time": "4:10:42", "throughput": 2311.7, "total_tokens": 3928416} {"current_steps": 6820, "total_steps": 67140, "loss": 0.6535, "lr": 4.99996274885852e-05, "epoch": 1.0157879058683348, "percentage": 10.16, "elapsed_time": "0:28:20", "remaining_time": "4:10:40", "throughput": 2311.97, "total_tokens": 3931584} {"current_steps": 6825, "total_steps": 67140, "loss": 0.7883, "lr": 4.999959116670951e-05, "epoch": 1.016532618409294, "percentage": 10.17, "elapsed_time": "0:28:21", "remaining_time": "4:10:38", "throughput": 2312.12, "total_tokens": 3934464} {"current_steps": 6830, "total_steps": 67140, "loss": 0.8135, "lr": 4.999955315546309e-05, "epoch": 1.0172773309502532, "percentage": 10.17, "elapsed_time": "0:28:22", "remaining_time": "4:10:36", "throughput": 2312.32, "total_tokens": 3937440} {"current_steps": 6835, "total_steps": 67140, "loss": 0.7331, "lr": 4.999951345484851e-05, "epoch": 1.0180220434912124, "percentage": 10.18, "elapsed_time": "0:28:23", "remaining_time": "4:10:33", "throughput": 2312.42, "total_tokens": 3940224} {"current_steps": 6840, "total_steps": 67140, "loss": 0.6693, "lr": 4.999947206486846e-05, "epoch": 1.0187667560321716, "percentage": 10.19, "elapsed_time": "0:28:25", "remaining_time": "4:10:31", "throughput": 2312.55, "total_tokens": 3943040} {"current_steps": 6845, "total_steps": 67140, "loss": 0.7292, "lr": 4.999942898552571e-05, "epoch": 1.0195114685731308, "percentage": 10.2, "elapsed_time": "0:28:26", "remaining_time": "4:10:28", "throughput": 2312.67, "total_tokens": 3945792} {"current_steps": 6850, "total_steps": 67140, "loss": 0.726, "lr": 4.99993842168232e-05, "epoch": 1.02025618111409, "percentage": 10.2, "elapsed_time": "0:28:27", "remaining_time": "4:10:26", "throughput": 2312.69, "total_tokens": 3948320} {"current_steps": 6855, "total_steps": 67140, "loss": 0.7534, "lr": 4.999933775876395e-05, "epoch": 1.0210008936550492, "percentage": 10.21, "elapsed_time": "0:28:28", "remaining_time": "4:10:24", "throughput": 2312.85, "total_tokens": 3951232} {"current_steps": 6860, "total_steps": 67140, "loss": 0.6669, "lr": 4.999928961135109e-05, "epoch": 1.0217456061960084, "percentage": 10.22, "elapsed_time": "0:28:29", "remaining_time": "4:10:21", "throughput": 2312.99, "total_tokens": 3954080} {"current_steps": 6865, "total_steps": 67140, "loss": 0.588, "lr": 4.9999239774587867e-05, "epoch": 1.0224903187369676, "percentage": 10.22, "elapsed_time": "0:28:30", "remaining_time": "4:10:19", "throughput": 2313.05, "total_tokens": 3956768} {"current_steps": 6870, "total_steps": 67140, "loss": 0.6329, "lr": 4.999918824847767e-05, "epoch": 1.0232350312779268, "percentage": 10.23, "elapsed_time": "0:28:31", "remaining_time": "4:10:17", "throughput": 2313.22, "total_tokens": 3959712} {"current_steps": 6875, "total_steps": 67140, "loss": 0.6292, "lr": 4.999913503302397e-05, "epoch": 1.023979743818886, "percentage": 10.24, "elapsed_time": "0:28:32", "remaining_time": "4:10:14", "throughput": 2313.27, "total_tokens": 3962336} {"current_steps": 6880, "total_steps": 67140, "loss": 0.7023, "lr": 4.9999080128230365e-05, "epoch": 1.024724456359845, "percentage": 10.25, "elapsed_time": "0:28:34", "remaining_time": "4:10:12", "throughput": 2313.44, "total_tokens": 3965280} {"current_steps": 6885, "total_steps": 67140, "loss": 0.6253, "lr": 4.9999023534100565e-05, "epoch": 1.0254691689008042, "percentage": 10.25, "elapsed_time": "0:28:35", "remaining_time": "4:10:11", "throughput": 2313.7, "total_tokens": 3968512} {"current_steps": 6890, "total_steps": 67140, "loss": 0.702, "lr": 4.999896525063839e-05, "epoch": 1.0262138814417634, "percentage": 10.26, "elapsed_time": "0:28:36", "remaining_time": "4:10:08", "throughput": 2313.87, "total_tokens": 3971488} {"current_steps": 6895, "total_steps": 67140, "loss": 0.74, "lr": 4.999890527784777e-05, "epoch": 1.0269585939827226, "percentage": 10.27, "elapsed_time": "0:28:38", "remaining_time": "4:10:13", "throughput": 2313.17, "total_tokens": 3974560} {"current_steps": 6900, "total_steps": 67140, "loss": 0.6991, "lr": 4.999884361573279e-05, "epoch": 1.0277033065236818, "percentage": 10.28, "elapsed_time": "0:28:39", "remaining_time": "4:10:11", "throughput": 2313.37, "total_tokens": 3977600} {"current_steps": 6905, "total_steps": 67140, "loss": 0.7316, "lr": 4.999878026429758e-05, "epoch": 1.028448019064641, "percentage": 10.28, "elapsed_time": "0:28:40", "remaining_time": "4:10:09", "throughput": 2313.66, "total_tokens": 3980864} {"current_steps": 6910, "total_steps": 67140, "loss": 0.6599, "lr": 4.999871522354645e-05, "epoch": 1.0291927316056002, "percentage": 10.29, "elapsed_time": "0:28:41", "remaining_time": "4:10:07", "throughput": 2313.88, "total_tokens": 3983936} {"current_steps": 6915, "total_steps": 67140, "loss": 0.6345, "lr": 4.999864849348378e-05, "epoch": 1.0299374441465594, "percentage": 10.3, "elapsed_time": "0:28:42", "remaining_time": "4:10:05", "throughput": 2314.03, "total_tokens": 3986784} {"current_steps": 6920, "total_steps": 67140, "loss": 0.6934, "lr": 4.999858007411408e-05, "epoch": 1.0306821566875186, "percentage": 10.31, "elapsed_time": "0:28:43", "remaining_time": "4:10:02", "throughput": 2314.07, "total_tokens": 3989408} {"current_steps": 6925, "total_steps": 67140, "loss": 0.6049, "lr": 4.999850996544197e-05, "epoch": 1.0314268692284778, "percentage": 10.31, "elapsed_time": "0:28:45", "remaining_time": "4:10:00", "throughput": 2314.25, "total_tokens": 3992384} {"current_steps": 6930, "total_steps": 67140, "loss": 0.6975, "lr": 4.999843816747219e-05, "epoch": 1.032171581769437, "percentage": 10.32, "elapsed_time": "0:28:46", "remaining_time": "4:09:57", "throughput": 2314.24, "total_tokens": 3994816} {"current_steps": 6935, "total_steps": 67140, "loss": 0.7426, "lr": 4.9998364680209605e-05, "epoch": 1.0329162943103962, "percentage": 10.33, "elapsed_time": "0:28:47", "remaining_time": "4:09:55", "throughput": 2314.3, "total_tokens": 3997472} {"current_steps": 6940, "total_steps": 67140, "loss": 0.5974, "lr": 4.999828950365917e-05, "epoch": 1.0336610068513554, "percentage": 10.34, "elapsed_time": "0:28:48", "remaining_time": "4:09:52", "throughput": 2314.46, "total_tokens": 4000352} {"current_steps": 6945, "total_steps": 67140, "loss": 0.7766, "lr": 4.999821263782597e-05, "epoch": 1.0344057193923146, "percentage": 10.34, "elapsed_time": "0:28:49", "remaining_time": "4:09:50", "throughput": 2314.57, "total_tokens": 4003168} {"current_steps": 6950, "total_steps": 67140, "loss": 0.5156, "lr": 4.9998134082715184e-05, "epoch": 1.0351504319332738, "percentage": 10.35, "elapsed_time": "0:28:50", "remaining_time": "4:09:48", "throughput": 2314.71, "total_tokens": 4006016} {"current_steps": 6955, "total_steps": 67140, "loss": 0.5767, "lr": 4.999805383833214e-05, "epoch": 1.035895144474233, "percentage": 10.36, "elapsed_time": "0:28:51", "remaining_time": "4:09:46", "throughput": 2314.89, "total_tokens": 4008992} {"current_steps": 6960, "total_steps": 67140, "loss": 0.7234, "lr": 4.999797190468225e-05, "epoch": 1.0366398570151922, "percentage": 10.37, "elapsed_time": "0:28:52", "remaining_time": "4:09:43", "throughput": 2314.94, "total_tokens": 4011552} {"current_steps": 6965, "total_steps": 67140, "loss": 0.5727, "lr": 4.999788828177105e-05, "epoch": 1.0373845695561514, "percentage": 10.37, "elapsed_time": "0:28:54", "remaining_time": "4:09:41", "throughput": 2315.03, "total_tokens": 4014304} {"current_steps": 6970, "total_steps": 67140, "loss": 0.6356, "lr": 4.9997802969604195e-05, "epoch": 1.0381292820971104, "percentage": 10.38, "elapsed_time": "0:28:55", "remaining_time": "4:09:39", "throughput": 2315.25, "total_tokens": 4017376} {"current_steps": 6975, "total_steps": 67140, "loss": 0.7648, "lr": 4.9997715968187456e-05, "epoch": 1.0388739946380696, "percentage": 10.39, "elapsed_time": "0:28:56", "remaining_time": "4:09:36", "throughput": 2315.32, "total_tokens": 4020032} {"current_steps": 6980, "total_steps": 67140, "loss": 0.6479, "lr": 4.999762727752669e-05, "epoch": 1.0396187071790288, "percentage": 10.4, "elapsed_time": "0:28:57", "remaining_time": "4:09:34", "throughput": 2315.46, "total_tokens": 4022912} {"current_steps": 6985, "total_steps": 67140, "loss": 0.6954, "lr": 4.9997536897627915e-05, "epoch": 1.040363419719988, "percentage": 10.4, "elapsed_time": "0:28:58", "remaining_time": "4:09:32", "throughput": 2315.56, "total_tokens": 4025632} {"current_steps": 6990, "total_steps": 67140, "loss": 0.6209, "lr": 4.999744482849723e-05, "epoch": 1.0411081322609472, "percentage": 10.41, "elapsed_time": "0:28:59", "remaining_time": "4:09:29", "throughput": 2315.68, "total_tokens": 4028448} {"current_steps": 6995, "total_steps": 67140, "loss": 0.722, "lr": 4.9997351070140856e-05, "epoch": 1.0418528448019064, "percentage": 10.42, "elapsed_time": "0:29:00", "remaining_time": "4:09:27", "throughput": 2315.88, "total_tokens": 4031424} {"current_steps": 7000, "total_steps": 67140, "loss": 0.7127, "lr": 4.999725562256513e-05, "epoch": 1.0425975573428656, "percentage": 10.43, "elapsed_time": "0:29:01", "remaining_time": "4:09:25", "throughput": 2316.07, "total_tokens": 4034400} {"current_steps": 7005, "total_steps": 67140, "loss": 0.6643, "lr": 4.9997158485776493e-05, "epoch": 1.0433422698838248, "percentage": 10.43, "elapsed_time": "0:29:03", "remaining_time": "4:09:23", "throughput": 2316.26, "total_tokens": 4037440} {"current_steps": 7010, "total_steps": 67140, "loss": 0.6476, "lr": 4.9997059659781526e-05, "epoch": 1.044086982424784, "percentage": 10.44, "elapsed_time": "0:29:04", "remaining_time": "4:09:21", "throughput": 2316.32, "total_tokens": 4040096} {"current_steps": 7015, "total_steps": 67140, "loss": 0.7499, "lr": 4.9996959144586895e-05, "epoch": 1.0448316949657432, "percentage": 10.45, "elapsed_time": "0:29:05", "remaining_time": "4:09:18", "throughput": 2316.45, "total_tokens": 4042944} {"current_steps": 7020, "total_steps": 67140, "loss": 0.7339, "lr": 4.999685694019939e-05, "epoch": 1.0455764075067024, "percentage": 10.46, "elapsed_time": "0:29:06", "remaining_time": "4:09:16", "throughput": 2316.51, "total_tokens": 4045568} {"current_steps": 7025, "total_steps": 67140, "loss": 0.6403, "lr": 4.9996753046625925e-05, "epoch": 1.0463211200476616, "percentage": 10.46, "elapsed_time": "0:29:07", "remaining_time": "4:09:14", "throughput": 2316.59, "total_tokens": 4048288} {"current_steps": 7030, "total_steps": 67140, "loss": 0.5997, "lr": 4.9996647463873525e-05, "epoch": 1.0470658325886208, "percentage": 10.47, "elapsed_time": "0:29:08", "remaining_time": "4:09:11", "throughput": 2316.74, "total_tokens": 4051168} {"current_steps": 7035, "total_steps": 67140, "loss": 0.6126, "lr": 4.999654019194931e-05, "epoch": 1.04781054512958, "percentage": 10.48, "elapsed_time": "0:29:09", "remaining_time": "4:09:09", "throughput": 2316.77, "total_tokens": 4053728} {"current_steps": 7040, "total_steps": 67140, "loss": 0.7349, "lr": 4.9996431230860544e-05, "epoch": 1.0485552576705393, "percentage": 10.49, "elapsed_time": "0:29:10", "remaining_time": "4:09:07", "throughput": 2316.97, "total_tokens": 4056768} {"current_steps": 7045, "total_steps": 67140, "loss": 0.7035, "lr": 4.999632058061457e-05, "epoch": 1.0492999702114985, "percentage": 10.49, "elapsed_time": "0:29:12", "remaining_time": "4:09:05", "throughput": 2317.11, "total_tokens": 4059648} {"current_steps": 7050, "total_steps": 67140, "loss": 0.5791, "lr": 4.999620824121889e-05, "epoch": 1.0500446827524577, "percentage": 10.5, "elapsed_time": "0:29:13", "remaining_time": "4:09:02", "throughput": 2317.13, "total_tokens": 4062208} {"current_steps": 7055, "total_steps": 67140, "loss": 0.7654, "lr": 4.999609421268109e-05, "epoch": 1.0507893952934166, "percentage": 10.51, "elapsed_time": "0:29:14", "remaining_time": "4:09:00", "throughput": 2317.24, "total_tokens": 4064960} {"current_steps": 7060, "total_steps": 67140, "loss": 0.6789, "lr": 4.999597849500886e-05, "epoch": 1.0515341078343758, "percentage": 10.52, "elapsed_time": "0:29:15", "remaining_time": "4:08:57", "throughput": 2317.33, "total_tokens": 4067680} {"current_steps": 7065, "total_steps": 67140, "loss": 0.6513, "lr": 4.999586108821003e-05, "epoch": 1.052278820375335, "percentage": 10.52, "elapsed_time": "0:29:16", "remaining_time": "4:08:55", "throughput": 2317.44, "total_tokens": 4070464} {"current_steps": 7070, "total_steps": 67140, "loss": 0.6379, "lr": 4.999574199229254e-05, "epoch": 1.0530235329162942, "percentage": 10.53, "elapsed_time": "0:29:17", "remaining_time": "4:08:53", "throughput": 2317.61, "total_tokens": 4073408} {"current_steps": 7075, "total_steps": 67140, "loss": 0.5667, "lr": 4.9995621207264426e-05, "epoch": 1.0537682454572534, "percentage": 10.54, "elapsed_time": "0:29:18", "remaining_time": "4:08:51", "throughput": 2317.68, "total_tokens": 4076160} {"current_steps": 7080, "total_steps": 67140, "loss": 0.6824, "lr": 4.9995498733133864e-05, "epoch": 1.0545129579982127, "percentage": 10.55, "elapsed_time": "0:29:19", "remaining_time": "4:08:49", "throughput": 2317.86, "total_tokens": 4079168} {"current_steps": 7085, "total_steps": 67140, "loss": 0.9827, "lr": 4.9995374569909105e-05, "epoch": 1.0552576705391719, "percentage": 10.55, "elapsed_time": "0:29:21", "remaining_time": "4:08:47", "throughput": 2318.07, "total_tokens": 4082208} {"current_steps": 7090, "total_steps": 67140, "loss": 0.6517, "lr": 4.999524871759857e-05, "epoch": 1.056002383080131, "percentage": 10.56, "elapsed_time": "0:29:22", "remaining_time": "4:08:45", "throughput": 2318.17, "total_tokens": 4085024} {"current_steps": 7095, "total_steps": 67140, "loss": 0.6977, "lr": 4.999512117621075e-05, "epoch": 1.0567470956210903, "percentage": 10.57, "elapsed_time": "0:29:23", "remaining_time": "4:08:42", "throughput": 2318.34, "total_tokens": 4087968} {"current_steps": 7100, "total_steps": 67140, "loss": 0.7291, "lr": 4.999499194575426e-05, "epoch": 1.0574918081620495, "percentage": 10.57, "elapsed_time": "0:29:24", "remaining_time": "4:08:41", "throughput": 2318.52, "total_tokens": 4091008} {"current_steps": 7105, "total_steps": 67140, "loss": 0.6332, "lr": 4.9994861026237826e-05, "epoch": 1.0582365207030087, "percentage": 10.58, "elapsed_time": "0:29:25", "remaining_time": "4:08:39", "throughput": 2318.72, "total_tokens": 4094080} {"current_steps": 7110, "total_steps": 67140, "loss": 0.7255, "lr": 4.999472841767032e-05, "epoch": 1.0589812332439679, "percentage": 10.59, "elapsed_time": "0:29:26", "remaining_time": "4:08:36", "throughput": 2318.75, "total_tokens": 4096672} {"current_steps": 7115, "total_steps": 67140, "loss": 0.6537, "lr": 4.999459412006069e-05, "epoch": 1.059725945784927, "percentage": 10.6, "elapsed_time": "0:29:27", "remaining_time": "4:08:34", "throughput": 2318.84, "total_tokens": 4099424} {"current_steps": 7120, "total_steps": 67140, "loss": 0.7368, "lr": 4.9994458133418e-05, "epoch": 1.0604706583258863, "percentage": 10.6, "elapsed_time": "0:29:29", "remaining_time": "4:08:33", "throughput": 2319.13, "total_tokens": 4102752} {"current_steps": 7125, "total_steps": 67140, "loss": 0.6784, "lr": 4.9994320457751456e-05, "epoch": 1.0612153708668455, "percentage": 10.61, "elapsed_time": "0:29:30", "remaining_time": "4:08:31", "throughput": 2319.32, "total_tokens": 4105792} {"current_steps": 7130, "total_steps": 67140, "loss": 0.7269, "lr": 4.9994181093070345e-05, "epoch": 1.0619600834078047, "percentage": 10.62, "elapsed_time": "0:29:31", "remaining_time": "4:08:29", "throughput": 2319.63, "total_tokens": 4109152} {"current_steps": 7135, "total_steps": 67140, "loss": 0.7818, "lr": 4.9994040039384104e-05, "epoch": 1.0627047959487639, "percentage": 10.63, "elapsed_time": "0:29:32", "remaining_time": "4:08:27", "throughput": 2319.83, "total_tokens": 4112192} {"current_steps": 7140, "total_steps": 67140, "loss": 0.7749, "lr": 4.999389729670226e-05, "epoch": 1.063449508489723, "percentage": 10.63, "elapsed_time": "0:29:33", "remaining_time": "4:08:25", "throughput": 2319.96, "total_tokens": 4115072} {"current_steps": 7145, "total_steps": 67140, "loss": 0.6945, "lr": 4.999375286503445e-05, "epoch": 1.064194221030682, "percentage": 10.64, "elapsed_time": "0:29:34", "remaining_time": "4:08:23", "throughput": 2320.03, "total_tokens": 4117760} {"current_steps": 7150, "total_steps": 67140, "loss": 0.7165, "lr": 4.999360674439043e-05, "epoch": 1.0649389335716413, "percentage": 10.65, "elapsed_time": "0:29:36", "remaining_time": "4:08:21", "throughput": 2320.18, "total_tokens": 4120704} {"current_steps": 7155, "total_steps": 67140, "loss": 0.5669, "lr": 4.999345893478009e-05, "epoch": 1.0656836461126005, "percentage": 10.66, "elapsed_time": "0:29:37", "remaining_time": "4:08:19", "throughput": 2320.37, "total_tokens": 4123712} {"current_steps": 7160, "total_steps": 67140, "loss": 0.7727, "lr": 4.9993309436213415e-05, "epoch": 1.0664283586535597, "percentage": 10.66, "elapsed_time": "0:29:38", "remaining_time": "4:08:17", "throughput": 2320.49, "total_tokens": 4126528} {"current_steps": 7165, "total_steps": 67140, "loss": 0.5589, "lr": 4.99931582487005e-05, "epoch": 1.0671730711945189, "percentage": 10.67, "elapsed_time": "0:29:39", "remaining_time": "4:08:14", "throughput": 2320.57, "total_tokens": 4129312} {"current_steps": 7170, "total_steps": 67140, "loss": 0.6282, "lr": 4.999300537225157e-05, "epoch": 1.067917783735478, "percentage": 10.68, "elapsed_time": "0:29:40", "remaining_time": "4:08:12", "throughput": 2320.71, "total_tokens": 4132192} {"current_steps": 7175, "total_steps": 67140, "loss": 0.8233, "lr": 4.999285080687694e-05, "epoch": 1.0686624962764373, "percentage": 10.69, "elapsed_time": "0:29:41", "remaining_time": "4:08:10", "throughput": 2320.76, "total_tokens": 4134848} {"current_steps": 7180, "total_steps": 67140, "loss": 0.7485, "lr": 4.999269455258707e-05, "epoch": 1.0694072088173965, "percentage": 10.69, "elapsed_time": "0:29:42", "remaining_time": "4:08:08", "throughput": 2320.99, "total_tokens": 4137952} {"current_steps": 7185, "total_steps": 67140, "loss": 0.8786, "lr": 4.999253660939251e-05, "epoch": 1.0701519213583557, "percentage": 10.7, "elapsed_time": "0:29:43", "remaining_time": "4:08:06", "throughput": 2321.15, "total_tokens": 4140896} {"current_steps": 7190, "total_steps": 67140, "loss": 0.7519, "lr": 4.999237697730396e-05, "epoch": 1.0708966338993149, "percentage": 10.71, "elapsed_time": "0:29:45", "remaining_time": "4:08:04", "throughput": 2321.22, "total_tokens": 4143584} {"current_steps": 7195, "total_steps": 67140, "loss": 0.7128, "lr": 4.9992215656332166e-05, "epoch": 1.071641346440274, "percentage": 10.72, "elapsed_time": "0:29:46", "remaining_time": "4:08:01", "throughput": 2321.37, "total_tokens": 4146496} {"current_steps": 7200, "total_steps": 67140, "loss": 0.7291, "lr": 4.999205264648805e-05, "epoch": 1.0723860589812333, "percentage": 10.72, "elapsed_time": "0:29:47", "remaining_time": "4:08:00", "throughput": 2321.64, "total_tokens": 4149728} {"current_steps": 7205, "total_steps": 67140, "loss": 0.6187, "lr": 4.999188794778263e-05, "epoch": 1.0731307715221925, "percentage": 10.73, "elapsed_time": "0:29:48", "remaining_time": "4:07:57", "throughput": 2321.72, "total_tokens": 4152480} {"current_steps": 7210, "total_steps": 67140, "loss": 0.6553, "lr": 4.999172156022703e-05, "epoch": 1.0738754840631517, "percentage": 10.74, "elapsed_time": "0:29:49", "remaining_time": "4:07:56", "throughput": 2321.98, "total_tokens": 4155680} {"current_steps": 7215, "total_steps": 67140, "loss": 0.6488, "lr": 4.9991553483832506e-05, "epoch": 1.074620196604111, "percentage": 10.75, "elapsed_time": "0:29:50", "remaining_time": "4:07:53", "throughput": 2322.01, "total_tokens": 4158272} {"current_steps": 7220, "total_steps": 67140, "loss": 0.818, "lr": 4.9991383718610397e-05, "epoch": 1.07536490914507, "percentage": 10.75, "elapsed_time": "0:29:51", "remaining_time": "4:07:51", "throughput": 2322.09, "total_tokens": 4160960} {"current_steps": 7225, "total_steps": 67140, "loss": 0.5967, "lr": 4.999121226457219e-05, "epoch": 1.076109621686029, "percentage": 10.76, "elapsed_time": "0:29:53", "remaining_time": "4:07:49", "throughput": 2322.28, "total_tokens": 4164032} {"current_steps": 7230, "total_steps": 67140, "loss": 0.6856, "lr": 4.999103912172945e-05, "epoch": 1.0768543342269883, "percentage": 10.77, "elapsed_time": "0:29:54", "remaining_time": "4:07:47", "throughput": 2322.46, "total_tokens": 4167040} {"current_steps": 7235, "total_steps": 67140, "loss": 0.6438, "lr": 4.999086429009391e-05, "epoch": 1.0775990467679475, "percentage": 10.78, "elapsed_time": "0:29:55", "remaining_time": "4:07:45", "throughput": 2322.59, "total_tokens": 4169888} {"current_steps": 7240, "total_steps": 67140, "loss": 0.7801, "lr": 4.999068776967736e-05, "epoch": 1.0783437593089067, "percentage": 10.78, "elapsed_time": "0:29:56", "remaining_time": "4:07:43", "throughput": 2322.73, "total_tokens": 4172768} {"current_steps": 7245, "total_steps": 67140, "loss": 0.6393, "lr": 4.999050956049173e-05, "epoch": 1.079088471849866, "percentage": 10.79, "elapsed_time": "0:29:57", "remaining_time": "4:07:40", "throughput": 2322.84, "total_tokens": 4175552} {"current_steps": 7250, "total_steps": 67140, "loss": 0.7062, "lr": 4.999032966254907e-05, "epoch": 1.079833184390825, "percentage": 10.8, "elapsed_time": "0:29:58", "remaining_time": "4:07:38", "throughput": 2323.01, "total_tokens": 4178528} {"current_steps": 7255, "total_steps": 67140, "loss": 0.6904, "lr": 4.999014807586154e-05, "epoch": 1.0805778969317843, "percentage": 10.81, "elapsed_time": "0:29:59", "remaining_time": "4:07:36", "throughput": 2323.14, "total_tokens": 4181376} {"current_steps": 7260, "total_steps": 67140, "loss": 0.7419, "lr": 4.99899648004414e-05, "epoch": 1.0813226094727435, "percentage": 10.81, "elapsed_time": "0:30:01", "remaining_time": "4:07:34", "throughput": 2323.23, "total_tokens": 4184160} {"current_steps": 7265, "total_steps": 67140, "loss": 0.6562, "lr": 4.998977983630104e-05, "epoch": 1.0820673220137027, "percentage": 10.82, "elapsed_time": "0:30:02", "remaining_time": "4:07:32", "throughput": 2323.29, "total_tokens": 4186784} {"current_steps": 7270, "total_steps": 67140, "loss": 0.6393, "lr": 4.9989593183452965e-05, "epoch": 1.082812034554662, "percentage": 10.83, "elapsed_time": "0:30:03", "remaining_time": "4:07:29", "throughput": 2323.36, "total_tokens": 4189472} {"current_steps": 7275, "total_steps": 67140, "loss": 0.5326, "lr": 4.9989404841909784e-05, "epoch": 1.083556747095621, "percentage": 10.84, "elapsed_time": "0:30:04", "remaining_time": "4:07:28", "throughput": 2323.66, "total_tokens": 4192768} {"current_steps": 7280, "total_steps": 67140, "loss": 0.6924, "lr": 4.998921481168421e-05, "epoch": 1.0843014596365803, "percentage": 10.84, "elapsed_time": "0:30:05", "remaining_time": "4:07:25", "throughput": 2323.74, "total_tokens": 4195488} {"current_steps": 7285, "total_steps": 67140, "loss": 0.5958, "lr": 4.9989023092789113e-05, "epoch": 1.0850461721775395, "percentage": 10.85, "elapsed_time": "0:30:06", "remaining_time": "4:07:23", "throughput": 2323.93, "total_tokens": 4198528} {"current_steps": 7290, "total_steps": 67140, "loss": 0.789, "lr": 4.998882968523743e-05, "epoch": 1.0857908847184987, "percentage": 10.86, "elapsed_time": "0:30:07", "remaining_time": "4:07:21", "throughput": 2324.04, "total_tokens": 4201312} {"current_steps": 7295, "total_steps": 67140, "loss": 0.647, "lr": 4.9988634589042227e-05, "epoch": 1.086535597259458, "percentage": 10.87, "elapsed_time": "0:30:08", "remaining_time": "4:07:19", "throughput": 2324.12, "total_tokens": 4204032} {"current_steps": 7300, "total_steps": 67140, "loss": 0.6916, "lr": 4.9988437804216704e-05, "epoch": 1.0872803098004171, "percentage": 10.87, "elapsed_time": "0:30:10", "remaining_time": "4:07:17", "throughput": 2324.34, "total_tokens": 4207200} {"current_steps": 7305, "total_steps": 67140, "loss": 0.7015, "lr": 4.998823933077414e-05, "epoch": 1.0880250223413763, "percentage": 10.88, "elapsed_time": "0:30:11", "remaining_time": "4:07:16", "throughput": 2324.65, "total_tokens": 4210592} {"current_steps": 7310, "total_steps": 67140, "loss": 0.9674, "lr": 4.998803916872797e-05, "epoch": 1.0887697348823355, "percentage": 10.89, "elapsed_time": "0:30:12", "remaining_time": "4:07:14", "throughput": 2324.94, "total_tokens": 4213888} {"current_steps": 7315, "total_steps": 67140, "loss": 0.6457, "lr": 4.99878373180917e-05, "epoch": 1.0895144474232945, "percentage": 10.9, "elapsed_time": "0:30:13", "remaining_time": "4:07:12", "throughput": 2324.98, "total_tokens": 4216544} {"current_steps": 7320, "total_steps": 67140, "loss": 0.8053, "lr": 4.9987633778878975e-05, "epoch": 1.0902591599642537, "percentage": 10.9, "elapsed_time": "0:30:14", "remaining_time": "4:07:09", "throughput": 2325.09, "total_tokens": 4219328} {"current_steps": 7325, "total_steps": 67140, "loss": 0.7166, "lr": 4.9987428551103554e-05, "epoch": 1.091003872505213, "percentage": 10.91, "elapsed_time": "0:30:15", "remaining_time": "4:07:07", "throughput": 2325.2, "total_tokens": 4222144} {"current_steps": 7330, "total_steps": 67140, "loss": 0.6681, "lr": 4.9987221634779303e-05, "epoch": 1.0917485850461721, "percentage": 10.92, "elapsed_time": "0:30:16", "remaining_time": "4:07:05", "throughput": 2325.35, "total_tokens": 4225056} {"current_steps": 7335, "total_steps": 67140, "loss": 0.6376, "lr": 4.99870130299202e-05, "epoch": 1.0924932975871313, "percentage": 10.92, "elapsed_time": "0:30:18", "remaining_time": "4:07:03", "throughput": 2325.56, "total_tokens": 4228160} {"current_steps": 7340, "total_steps": 67140, "loss": 0.6247, "lr": 4.998680273654035e-05, "epoch": 1.0932380101280905, "percentage": 10.93, "elapsed_time": "0:30:19", "remaining_time": "4:07:01", "throughput": 2325.67, "total_tokens": 4230976} {"current_steps": 7345, "total_steps": 67140, "loss": 0.7456, "lr": 4.998659075465396e-05, "epoch": 1.0939827226690497, "percentage": 10.94, "elapsed_time": "0:30:20", "remaining_time": "4:06:59", "throughput": 2325.8, "total_tokens": 4233792} {"current_steps": 7350, "total_steps": 67140, "loss": 0.6958, "lr": 4.998637708427536e-05, "epoch": 1.094727435210009, "percentage": 10.95, "elapsed_time": "0:30:21", "remaining_time": "4:06:57", "throughput": 2326.03, "total_tokens": 4236992} {"current_steps": 7355, "total_steps": 67140, "loss": 0.6617, "lr": 4.998616172541898e-05, "epoch": 1.0954721477509681, "percentage": 10.95, "elapsed_time": "0:30:22", "remaining_time": "4:06:55", "throughput": 2326.09, "total_tokens": 4239712} {"current_steps": 7360, "total_steps": 67140, "loss": 0.828, "lr": 4.9985944678099374e-05, "epoch": 1.0962168602919273, "percentage": 10.96, "elapsed_time": "0:30:23", "remaining_time": "4:06:53", "throughput": 2326.17, "total_tokens": 4242464} {"current_steps": 7365, "total_steps": 67140, "loss": 0.659, "lr": 4.998572594233121e-05, "epoch": 1.0969615728328865, "percentage": 10.97, "elapsed_time": "0:30:24", "remaining_time": "4:06:51", "throughput": 2326.33, "total_tokens": 4245408} {"current_steps": 7370, "total_steps": 67140, "loss": 0.6657, "lr": 4.998550551812927e-05, "epoch": 1.0977062853738457, "percentage": 10.98, "elapsed_time": "0:30:26", "remaining_time": "4:06:49", "throughput": 2326.52, "total_tokens": 4248416} {"current_steps": 7375, "total_steps": 67140, "loss": 0.7718, "lr": 4.998528340550846e-05, "epoch": 1.098450997914805, "percentage": 10.98, "elapsed_time": "0:30:27", "remaining_time": "4:06:47", "throughput": 2326.75, "total_tokens": 4251584} {"current_steps": 7380, "total_steps": 67140, "loss": 0.5802, "lr": 4.998505960448377e-05, "epoch": 1.0991957104557641, "percentage": 10.99, "elapsed_time": "0:30:28", "remaining_time": "4:06:45", "throughput": 2326.9, "total_tokens": 4254528} {"current_steps": 7385, "total_steps": 67140, "loss": 0.5921, "lr": 4.998483411507034e-05, "epoch": 1.0999404229967233, "percentage": 11.0, "elapsed_time": "0:30:29", "remaining_time": "4:06:43", "throughput": 2327.03, "total_tokens": 4257376} {"current_steps": 7390, "total_steps": 67140, "loss": 0.5513, "lr": 4.9984606937283405e-05, "epoch": 1.1006851355376825, "percentage": 11.01, "elapsed_time": "0:30:30", "remaining_time": "4:06:41", "throughput": 2327.15, "total_tokens": 4260288} {"current_steps": 7395, "total_steps": 67140, "loss": 0.65, "lr": 4.9984378071138315e-05, "epoch": 1.1014298480786415, "percentage": 11.01, "elapsed_time": "0:30:31", "remaining_time": "4:06:39", "throughput": 2327.29, "total_tokens": 4263200} {"current_steps": 7400, "total_steps": 67140, "loss": 0.6079, "lr": 4.998414751665053e-05, "epoch": 1.1021745606196007, "percentage": 11.02, "elapsed_time": "0:30:32", "remaining_time": "4:06:37", "throughput": 2327.41, "total_tokens": 4266048} {"current_steps": 7405, "total_steps": 67140, "loss": 0.7482, "lr": 4.998391527383563e-05, "epoch": 1.10291927316056, "percentage": 11.03, "elapsed_time": "0:30:34", "remaining_time": "4:06:35", "throughput": 2327.6, "total_tokens": 4269088} {"current_steps": 7410, "total_steps": 67140, "loss": 0.6269, "lr": 4.9983681342709316e-05, "epoch": 1.1036639857015191, "percentage": 11.04, "elapsed_time": "0:30:35", "remaining_time": "4:06:33", "throughput": 2327.81, "total_tokens": 4272192} {"current_steps": 7415, "total_steps": 67140, "loss": 0.6271, "lr": 4.998344572328739e-05, "epoch": 1.1044086982424783, "percentage": 11.04, "elapsed_time": "0:30:36", "remaining_time": "4:06:31", "throughput": 2327.97, "total_tokens": 4275200} {"current_steps": 7420, "total_steps": 67140, "loss": 0.682, "lr": 4.998320841558578e-05, "epoch": 1.1051534107834375, "percentage": 11.05, "elapsed_time": "0:30:37", "remaining_time": "4:06:30", "throughput": 2328.2, "total_tokens": 4278368} {"current_steps": 7425, "total_steps": 67140, "loss": 0.6737, "lr": 4.9982969419620516e-05, "epoch": 1.1058981233243967, "percentage": 11.06, "elapsed_time": "0:30:38", "remaining_time": "4:06:27", "throughput": 2328.3, "total_tokens": 4281152} {"current_steps": 7430, "total_steps": 67140, "loss": 0.7484, "lr": 4.9982728735407756e-05, "epoch": 1.106642835865356, "percentage": 11.07, "elapsed_time": "0:30:39", "remaining_time": "4:06:25", "throughput": 2328.35, "total_tokens": 4283840} {"current_steps": 7435, "total_steps": 67140, "loss": 0.6423, "lr": 4.998248636296377e-05, "epoch": 1.1073875484063151, "percentage": 11.07, "elapsed_time": "0:30:40", "remaining_time": "4:06:23", "throughput": 2328.36, "total_tokens": 4286432} {"current_steps": 7440, "total_steps": 67140, "loss": 0.6897, "lr": 4.998224230230491e-05, "epoch": 1.1081322609472744, "percentage": 11.08, "elapsed_time": "0:30:42", "remaining_time": "4:06:21", "throughput": 2328.4, "total_tokens": 4289088} {"current_steps": 7445, "total_steps": 67140, "loss": 0.8966, "lr": 4.9981996553447695e-05, "epoch": 1.1088769734882336, "percentage": 11.09, "elapsed_time": "0:30:43", "remaining_time": "4:06:18", "throughput": 2328.44, "total_tokens": 4291712} {"current_steps": 7450, "total_steps": 67140, "loss": 0.7089, "lr": 4.998174911640872e-05, "epoch": 1.1096216860291928, "percentage": 11.1, "elapsed_time": "0:30:44", "remaining_time": "4:06:16", "throughput": 2328.52, "total_tokens": 4294432} {"current_steps": 7455, "total_steps": 67140, "loss": 0.6191, "lr": 4.9981499991204704e-05, "epoch": 1.110366398570152, "percentage": 11.1, "elapsed_time": "0:30:45", "remaining_time": "4:06:14", "throughput": 2328.61, "total_tokens": 4297184} {"current_steps": 7460, "total_steps": 67140, "loss": 0.7084, "lr": 4.998124917785249e-05, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:30:46", "remaining_time": "4:06:11", "throughput": 2328.69, "total_tokens": 4299904} {"current_steps": 7465, "total_steps": 67140, "loss": 0.5055, "lr": 4.9980996676369026e-05, "epoch": 1.1118558236520704, "percentage": 11.12, "elapsed_time": "0:30:47", "remaining_time": "4:06:10", "throughput": 2328.88, "total_tokens": 4303008} {"current_steps": 7470, "total_steps": 67140, "loss": 0.6281, "lr": 4.998074248677137e-05, "epoch": 1.1126005361930296, "percentage": 11.13, "elapsed_time": "0:30:48", "remaining_time": "4:06:08", "throughput": 2329.01, "total_tokens": 4305888} {"current_steps": 7475, "total_steps": 67140, "loss": 0.8312, "lr": 4.9980486609076695e-05, "epoch": 1.1133452487339888, "percentage": 11.13, "elapsed_time": "0:30:49", "remaining_time": "4:06:06", "throughput": 2329.23, "total_tokens": 4309024} {"current_steps": 7480, "total_steps": 67140, "loss": 0.7738, "lr": 4.998022904330231e-05, "epoch": 1.114089961274948, "percentage": 11.14, "elapsed_time": "0:30:51", "remaining_time": "4:06:04", "throughput": 2329.39, "total_tokens": 4311936} {"current_steps": 7485, "total_steps": 67140, "loss": 0.7303, "lr": 4.9979969789465594e-05, "epoch": 1.1148346738159072, "percentage": 11.15, "elapsed_time": "0:30:52", "remaining_time": "4:06:02", "throughput": 2329.51, "total_tokens": 4314784} {"current_steps": 7490, "total_steps": 67140, "loss": 0.6653, "lr": 4.9979708847584095e-05, "epoch": 1.1155793863568662, "percentage": 11.16, "elapsed_time": "0:30:53", "remaining_time": "4:06:00", "throughput": 2329.68, "total_tokens": 4317792} {"current_steps": 7495, "total_steps": 67140, "loss": 0.7906, "lr": 4.9979446217675416e-05, "epoch": 1.1163240988978254, "percentage": 11.16, "elapsed_time": "0:30:54", "remaining_time": "4:05:58", "throughput": 2329.84, "total_tokens": 4320768} {"current_steps": 7500, "total_steps": 67140, "loss": 0.6502, "lr": 4.997918189975733e-05, "epoch": 1.1170688114387846, "percentage": 11.17, "elapsed_time": "0:30:55", "remaining_time": "4:05:55", "throughput": 2329.92, "total_tokens": 4323456} {"current_steps": 7505, "total_steps": 67140, "loss": 0.7933, "lr": 4.99789158938477e-05, "epoch": 1.1178135239797438, "percentage": 11.18, "elapsed_time": "0:30:56", "remaining_time": "4:05:53", "throughput": 2330.09, "total_tokens": 4326432} {"current_steps": 7510, "total_steps": 67140, "loss": 0.6241, "lr": 4.9978648199964476e-05, "epoch": 1.118558236520703, "percentage": 11.19, "elapsed_time": "0:30:57", "remaining_time": "4:05:52", "throughput": 2330.27, "total_tokens": 4329504} {"current_steps": 7515, "total_steps": 67140, "loss": 0.6677, "lr": 4.997837881812577e-05, "epoch": 1.1193029490616622, "percentage": 11.19, "elapsed_time": "0:30:59", "remaining_time": "4:05:50", "throughput": 2330.46, "total_tokens": 4332576} {"current_steps": 7520, "total_steps": 67140, "loss": 0.7303, "lr": 4.997810774834977e-05, "epoch": 1.1200476616026214, "percentage": 11.2, "elapsed_time": "0:31:00", "remaining_time": "4:05:48", "throughput": 2330.62, "total_tokens": 4335520} {"current_steps": 7525, "total_steps": 67140, "loss": 0.5664, "lr": 4.9977834990654804e-05, "epoch": 1.1207923741435806, "percentage": 11.21, "elapsed_time": "0:31:01", "remaining_time": "4:05:46", "throughput": 2330.76, "total_tokens": 4338400} {"current_steps": 7530, "total_steps": 67140, "loss": 0.7836, "lr": 4.997756054505931e-05, "epoch": 1.1215370866845398, "percentage": 11.22, "elapsed_time": "0:31:02", "remaining_time": "4:05:44", "throughput": 2330.89, "total_tokens": 4341280} {"current_steps": 7535, "total_steps": 67140, "loss": 0.7353, "lr": 4.9977284411581816e-05, "epoch": 1.122281799225499, "percentage": 11.22, "elapsed_time": "0:31:03", "remaining_time": "4:05:42", "throughput": 2331.06, "total_tokens": 4344320} {"current_steps": 7540, "total_steps": 67140, "loss": 0.6085, "lr": 4.997700659024099e-05, "epoch": 1.1230265117664582, "percentage": 11.23, "elapsed_time": "0:31:04", "remaining_time": "4:05:40", "throughput": 2331.13, "total_tokens": 4347040} {"current_steps": 7545, "total_steps": 67140, "loss": 0.7186, "lr": 4.997672708105562e-05, "epoch": 1.1237712243074174, "percentage": 11.24, "elapsed_time": "0:31:05", "remaining_time": "4:05:38", "throughput": 2331.29, "total_tokens": 4350016} {"current_steps": 7550, "total_steps": 67140, "loss": 0.6283, "lr": 4.9976445884044575e-05, "epoch": 1.1245159368483766, "percentage": 11.25, "elapsed_time": "0:31:07", "remaining_time": "4:05:36", "throughput": 2331.38, "total_tokens": 4352768} {"current_steps": 7555, "total_steps": 67140, "loss": 0.6841, "lr": 4.9976162999226865e-05, "epoch": 1.1252606493893358, "percentage": 11.25, "elapsed_time": "0:31:08", "remaining_time": "4:05:33", "throughput": 2331.45, "total_tokens": 4355520} {"current_steps": 7560, "total_steps": 67140, "loss": 0.8478, "lr": 4.9975878426621605e-05, "epoch": 1.126005361930295, "percentage": 11.26, "elapsed_time": "0:31:09", "remaining_time": "4:05:31", "throughput": 2331.54, "total_tokens": 4358272} {"current_steps": 7565, "total_steps": 67140, "loss": 0.5541, "lr": 4.9975592166248025e-05, "epoch": 1.1267500744712542, "percentage": 11.27, "elapsed_time": "0:31:10", "remaining_time": "4:05:29", "throughput": 2331.7, "total_tokens": 4361280} {"current_steps": 7570, "total_steps": 67140, "loss": 0.8079, "lr": 4.997530421812547e-05, "epoch": 1.1274947870122132, "percentage": 11.27, "elapsed_time": "0:31:11", "remaining_time": "4:05:27", "throughput": 2331.93, "total_tokens": 4364416} {"current_steps": 7575, "total_steps": 67140, "loss": 0.6712, "lr": 4.997501458227339e-05, "epoch": 1.1282394995531724, "percentage": 11.28, "elapsed_time": "0:31:12", "remaining_time": "4:05:25", "throughput": 2332.09, "total_tokens": 4367360} {"current_steps": 7580, "total_steps": 67140, "loss": 0.713, "lr": 4.997472325871138e-05, "epoch": 1.1289842120941316, "percentage": 11.29, "elapsed_time": "0:31:13", "remaining_time": "4:05:24", "throughput": 2332.22, "total_tokens": 4370304} {"current_steps": 7585, "total_steps": 67140, "loss": 0.7347, "lr": 4.9974430247459106e-05, "epoch": 1.1297289246350908, "percentage": 11.3, "elapsed_time": "0:31:15", "remaining_time": "4:05:21", "throughput": 2332.34, "total_tokens": 4373152} {"current_steps": 7590, "total_steps": 67140, "loss": 0.661, "lr": 4.997413554853637e-05, "epoch": 1.13047363717605, "percentage": 11.3, "elapsed_time": "0:31:16", "remaining_time": "4:05:20", "throughput": 2332.48, "total_tokens": 4376096} {"current_steps": 7595, "total_steps": 67140, "loss": 0.8127, "lr": 4.99738391619631e-05, "epoch": 1.1312183497170092, "percentage": 11.31, "elapsed_time": "0:31:17", "remaining_time": "4:05:17", "throughput": 2332.65, "total_tokens": 4379040} {"current_steps": 7600, "total_steps": 67140, "loss": 0.7021, "lr": 4.997354108775931e-05, "epoch": 1.1319630622579684, "percentage": 11.32, "elapsed_time": "0:31:18", "remaining_time": "4:05:15", "throughput": 2332.67, "total_tokens": 4381664} {"current_steps": 7605, "total_steps": 67140, "loss": 0.6444, "lr": 4.997324132594515e-05, "epoch": 1.1327077747989276, "percentage": 11.33, "elapsed_time": "0:31:19", "remaining_time": "4:05:13", "throughput": 2332.71, "total_tokens": 4384288} {"current_steps": 7610, "total_steps": 67140, "loss": 0.5598, "lr": 4.997293987654087e-05, "epoch": 1.1334524873398868, "percentage": 11.33, "elapsed_time": "0:31:20", "remaining_time": "4:05:11", "throughput": 2332.86, "total_tokens": 4387264} {"current_steps": 7615, "total_steps": 67140, "loss": 0.7161, "lr": 4.997263673956685e-05, "epoch": 1.134197199880846, "percentage": 11.34, "elapsed_time": "0:31:21", "remaining_time": "4:05:09", "throughput": 2332.94, "total_tokens": 4389952} {"current_steps": 7620, "total_steps": 67140, "loss": 0.7313, "lr": 4.9972331915043575e-05, "epoch": 1.1349419124218052, "percentage": 11.35, "elapsed_time": "0:31:22", "remaining_time": "4:05:07", "throughput": 2333.14, "total_tokens": 4393088} {"current_steps": 7625, "total_steps": 67140, "loss": 0.7032, "lr": 4.997202540299163e-05, "epoch": 1.1356866249627644, "percentage": 11.36, "elapsed_time": "0:31:24", "remaining_time": "4:05:05", "throughput": 2333.26, "total_tokens": 4395968} {"current_steps": 7630, "total_steps": 67140, "loss": 0.6122, "lr": 4.997171720343175e-05, "epoch": 1.1364313375037236, "percentage": 11.36, "elapsed_time": "0:31:25", "remaining_time": "4:05:03", "throughput": 2333.4, "total_tokens": 4398912} {"current_steps": 7635, "total_steps": 67140, "loss": 0.6998, "lr": 4.9971407316384736e-05, "epoch": 1.1371760500446828, "percentage": 11.37, "elapsed_time": "0:31:26", "remaining_time": "4:05:01", "throughput": 2333.54, "total_tokens": 4401824} {"current_steps": 7640, "total_steps": 67140, "loss": 0.7254, "lr": 4.997109574187154e-05, "epoch": 1.137920762585642, "percentage": 11.38, "elapsed_time": "0:31:27", "remaining_time": "4:04:59", "throughput": 2333.66, "total_tokens": 4404704} {"current_steps": 7645, "total_steps": 67140, "loss": 0.5737, "lr": 4.997078247991323e-05, "epoch": 1.1386654751266012, "percentage": 11.39, "elapsed_time": "0:31:28", "remaining_time": "4:04:57", "throughput": 2333.9, "total_tokens": 4407936} {"current_steps": 7650, "total_steps": 67140, "loss": 0.6746, "lr": 4.9970467530530964e-05, "epoch": 1.1394101876675604, "percentage": 11.39, "elapsed_time": "0:31:29", "remaining_time": "4:04:55", "throughput": 2334.01, "total_tokens": 4410784} {"current_steps": 7655, "total_steps": 67140, "loss": 0.7812, "lr": 4.9970150893746016e-05, "epoch": 1.1401549002085196, "percentage": 11.4, "elapsed_time": "0:31:30", "remaining_time": "4:04:53", "throughput": 2334.05, "total_tokens": 4413440} {"current_steps": 7660, "total_steps": 67140, "loss": 0.5848, "lr": 4.99698325695798e-05, "epoch": 1.1408996127494788, "percentage": 11.41, "elapsed_time": "0:31:31", "remaining_time": "4:04:51", "throughput": 2334.07, "total_tokens": 4416000} {"current_steps": 7665, "total_steps": 67140, "loss": 0.5429, "lr": 4.996951255805381e-05, "epoch": 1.1416443252904378, "percentage": 11.42, "elapsed_time": "0:31:33", "remaining_time": "4:04:49", "throughput": 2334.17, "total_tokens": 4418816} {"current_steps": 7670, "total_steps": 67140, "loss": 0.72, "lr": 4.996919085918969e-05, "epoch": 1.142389037831397, "percentage": 11.42, "elapsed_time": "0:31:34", "remaining_time": "4:04:47", "throughput": 2334.34, "total_tokens": 4421792} {"current_steps": 7675, "total_steps": 67140, "loss": 0.5768, "lr": 4.996886747300916e-05, "epoch": 1.1431337503723562, "percentage": 11.43, "elapsed_time": "0:31:35", "remaining_time": "4:04:45", "throughput": 2334.45, "total_tokens": 4424640} {"current_steps": 7680, "total_steps": 67140, "loss": 0.7032, "lr": 4.996854239953409e-05, "epoch": 1.1438784629133154, "percentage": 11.44, "elapsed_time": "0:31:36", "remaining_time": "4:04:42", "throughput": 2334.53, "total_tokens": 4427392} {"current_steps": 7685, "total_steps": 67140, "loss": 0.7669, "lr": 4.996821563878643e-05, "epoch": 1.1446231754542746, "percentage": 11.45, "elapsed_time": "0:31:37", "remaining_time": "4:04:40", "throughput": 2334.71, "total_tokens": 4430400} {"current_steps": 7690, "total_steps": 67140, "loss": 0.5206, "lr": 4.9967887190788274e-05, "epoch": 1.1453678879952338, "percentage": 11.45, "elapsed_time": "0:31:38", "remaining_time": "4:04:38", "throughput": 2334.72, "total_tokens": 4432992} {"current_steps": 7695, "total_steps": 67140, "loss": 0.5633, "lr": 4.996755705556182e-05, "epoch": 1.146112600536193, "percentage": 11.46, "elapsed_time": "0:31:39", "remaining_time": "4:04:36", "throughput": 2334.9, "total_tokens": 4436032} {"current_steps": 7700, "total_steps": 67140, "loss": 0.7104, "lr": 4.9967225233129366e-05, "epoch": 1.1468573130771522, "percentage": 11.47, "elapsed_time": "0:31:41", "remaining_time": "4:04:34", "throughput": 2335.03, "total_tokens": 4438944} {"current_steps": 7705, "total_steps": 67140, "loss": 0.9416, "lr": 4.9966891723513344e-05, "epoch": 1.1476020256181114, "percentage": 11.48, "elapsed_time": "0:31:42", "remaining_time": "4:04:32", "throughput": 2335.07, "total_tokens": 4441632} {"current_steps": 7710, "total_steps": 67140, "loss": 0.7606, "lr": 4.996655652673628e-05, "epoch": 1.1483467381590706, "percentage": 11.48, "elapsed_time": "0:31:43", "remaining_time": "4:04:31", "throughput": 2335.3, "total_tokens": 4444832} {"current_steps": 7715, "total_steps": 67140, "loss": 0.7466, "lr": 4.9966219642820834e-05, "epoch": 1.1490914507000298, "percentage": 11.49, "elapsed_time": "0:31:44", "remaining_time": "4:04:28", "throughput": 2335.4, "total_tokens": 4447616} {"current_steps": 7720, "total_steps": 67140, "loss": 0.5822, "lr": 4.996588107178977e-05, "epoch": 1.149836163240989, "percentage": 11.5, "elapsed_time": "0:31:45", "remaining_time": "4:04:26", "throughput": 2335.52, "total_tokens": 4450496} {"current_steps": 7725, "total_steps": 67140, "loss": 0.6089, "lr": 4.996554081366597e-05, "epoch": 1.1505808757819482, "percentage": 11.51, "elapsed_time": "0:31:46", "remaining_time": "4:04:24", "throughput": 2335.6, "total_tokens": 4453312} {"current_steps": 7730, "total_steps": 67140, "loss": 0.6662, "lr": 4.996519886847243e-05, "epoch": 1.1513255883229074, "percentage": 11.51, "elapsed_time": "0:31:47", "remaining_time": "4:04:23", "throughput": 2335.85, "total_tokens": 4456608} {"current_steps": 7735, "total_steps": 67140, "loss": 0.7929, "lr": 4.996485523623224e-05, "epoch": 1.1520703008638666, "percentage": 11.52, "elapsed_time": "0:31:49", "remaining_time": "4:04:21", "throughput": 2336.07, "total_tokens": 4459744} {"current_steps": 7740, "total_steps": 67140, "loss": 0.6735, "lr": 4.996450991696864e-05, "epoch": 1.1528150134048256, "percentage": 11.53, "elapsed_time": "0:31:50", "remaining_time": "4:04:19", "throughput": 2336.2, "total_tokens": 4462624} {"current_steps": 7745, "total_steps": 67140, "loss": 0.6969, "lr": 4.996416291070495e-05, "epoch": 1.1535597259457848, "percentage": 11.54, "elapsed_time": "0:31:51", "remaining_time": "4:04:18", "throughput": 2336.44, "total_tokens": 4465856} {"current_steps": 7750, "total_steps": 67140, "loss": 0.7272, "lr": 4.996381421746464e-05, "epoch": 1.154304438486744, "percentage": 11.54, "elapsed_time": "0:31:52", "remaining_time": "4:04:16", "throughput": 2336.54, "total_tokens": 4468704} {"current_steps": 7755, "total_steps": 67140, "loss": 0.6737, "lr": 4.9963463837271254e-05, "epoch": 1.1550491510277032, "percentage": 11.55, "elapsed_time": "0:31:53", "remaining_time": "4:04:14", "throughput": 2336.71, "total_tokens": 4471776} {"current_steps": 7760, "total_steps": 67140, "loss": 0.7775, "lr": 4.996311177014847e-05, "epoch": 1.1557938635686624, "percentage": 11.56, "elapsed_time": "0:31:54", "remaining_time": "4:04:12", "throughput": 2336.89, "total_tokens": 4474848} {"current_steps": 7765, "total_steps": 67140, "loss": 0.7184, "lr": 4.9962758016120095e-05, "epoch": 1.1565385761096216, "percentage": 11.57, "elapsed_time": "0:31:56", "remaining_time": "4:04:10", "throughput": 2337.03, "total_tokens": 4477760} {"current_steps": 7770, "total_steps": 67140, "loss": 0.6397, "lr": 4.996240257521002e-05, "epoch": 1.1572832886505808, "percentage": 11.57, "elapsed_time": "0:31:57", "remaining_time": "4:04:08", "throughput": 2337.2, "total_tokens": 4480800} {"current_steps": 7775, "total_steps": 67140, "loss": 0.5986, "lr": 4.996204544744227e-05, "epoch": 1.15802800119154, "percentage": 11.58, "elapsed_time": "0:31:58", "remaining_time": "4:04:07", "throughput": 2337.39, "total_tokens": 4483936} {"current_steps": 7780, "total_steps": 67140, "loss": 0.5943, "lr": 4.9961686632840976e-05, "epoch": 1.1587727137324992, "percentage": 11.59, "elapsed_time": "0:31:59", "remaining_time": "4:04:05", "throughput": 2337.48, "total_tokens": 4486752} {"current_steps": 7785, "total_steps": 67140, "loss": 0.67, "lr": 4.9961326131430386e-05, "epoch": 1.1595174262734584, "percentage": 11.6, "elapsed_time": "0:32:00", "remaining_time": "4:04:03", "throughput": 2337.53, "total_tokens": 4489472} {"current_steps": 7790, "total_steps": 67140, "loss": 0.6746, "lr": 4.996096394323486e-05, "epoch": 1.1602621388144176, "percentage": 11.6, "elapsed_time": "0:32:01", "remaining_time": "4:04:01", "throughput": 2337.6, "total_tokens": 4492256} {"current_steps": 7795, "total_steps": 67140, "loss": 0.6156, "lr": 4.9960600068278876e-05, "epoch": 1.1610068513553768, "percentage": 11.61, "elapsed_time": "0:32:02", "remaining_time": "4:03:59", "throughput": 2337.7, "total_tokens": 4495072} {"current_steps": 7800, "total_steps": 67140, "loss": 0.6053, "lr": 4.9960234506587024e-05, "epoch": 1.161751563896336, "percentage": 11.62, "elapsed_time": "0:32:04", "remaining_time": "4:03:58", "throughput": 2338.04, "total_tokens": 4498656} {"current_steps": 7805, "total_steps": 67140, "loss": 0.6681, "lr": 4.9959867258184e-05, "epoch": 1.1624962764372953, "percentage": 11.62, "elapsed_time": "0:32:05", "remaining_time": "4:03:55", "throughput": 2338.06, "total_tokens": 4501280} {"current_steps": 7810, "total_steps": 67140, "loss": 0.8067, "lr": 4.9959498323094636e-05, "epoch": 1.1632409889782545, "percentage": 11.63, "elapsed_time": "0:32:06", "remaining_time": "4:03:53", "throughput": 2338.14, "total_tokens": 4504064} {"current_steps": 7815, "total_steps": 67140, "loss": 0.6176, "lr": 4.9959127701343844e-05, "epoch": 1.1639857015192137, "percentage": 11.64, "elapsed_time": "0:32:07", "remaining_time": "4:03:51", "throughput": 2338.19, "total_tokens": 4506816} {"current_steps": 7820, "total_steps": 67140, "loss": 0.7613, "lr": 4.995875539295668e-05, "epoch": 1.1647304140601729, "percentage": 11.65, "elapsed_time": "0:32:08", "remaining_time": "4:03:49", "throughput": 2338.18, "total_tokens": 4509280} {"current_steps": 7825, "total_steps": 67140, "loss": 0.8877, "lr": 4.9958381397958305e-05, "epoch": 1.165475126601132, "percentage": 11.65, "elapsed_time": "0:32:09", "remaining_time": "4:03:47", "throughput": 2338.31, "total_tokens": 4512192} {"current_steps": 7830, "total_steps": 67140, "loss": 0.5771, "lr": 4.995800571637399e-05, "epoch": 1.1662198391420913, "percentage": 11.66, "elapsed_time": "0:32:10", "remaining_time": "4:03:45", "throughput": 2338.41, "total_tokens": 4515008} {"current_steps": 7835, "total_steps": 67140, "loss": 0.6195, "lr": 4.995762834822911e-05, "epoch": 1.1669645516830505, "percentage": 11.67, "elapsed_time": "0:32:11", "remaining_time": "4:03:43", "throughput": 2338.51, "total_tokens": 4517856} {"current_steps": 7840, "total_steps": 67140, "loss": 0.6874, "lr": 4.995724929354918e-05, "epoch": 1.1677092642240094, "percentage": 11.68, "elapsed_time": "0:32:13", "remaining_time": "4:03:41", "throughput": 2338.72, "total_tokens": 4521024} {"current_steps": 7845, "total_steps": 67140, "loss": 0.641, "lr": 4.9956868552359816e-05, "epoch": 1.1684539767649686, "percentage": 11.68, "elapsed_time": "0:32:14", "remaining_time": "4:03:39", "throughput": 2338.8, "total_tokens": 4523840} {"current_steps": 7850, "total_steps": 67140, "loss": 0.7251, "lr": 4.995648612468674e-05, "epoch": 1.1691986893059279, "percentage": 11.69, "elapsed_time": "0:32:15", "remaining_time": "4:03:37", "throughput": 2338.85, "total_tokens": 4526528} {"current_steps": 7855, "total_steps": 67140, "loss": 0.6547, "lr": 4.9956102010555806e-05, "epoch": 1.169943401846887, "percentage": 11.7, "elapsed_time": "0:32:16", "remaining_time": "4:03:35", "throughput": 2338.93, "total_tokens": 4529312} {"current_steps": 7860, "total_steps": 67140, "loss": 0.631, "lr": 4.9955716209992956e-05, "epoch": 1.1706881143878463, "percentage": 11.71, "elapsed_time": "0:32:17", "remaining_time": "4:03:33", "throughput": 2338.92, "total_tokens": 4531840} {"current_steps": 7865, "total_steps": 67140, "loss": 0.6552, "lr": 4.9955328723024263e-05, "epoch": 1.1714328269288055, "percentage": 11.71, "elapsed_time": "0:32:18", "remaining_time": "4:03:31", "throughput": 2339.05, "total_tokens": 4534752} {"current_steps": 7870, "total_steps": 67140, "loss": 0.62, "lr": 4.995493954967592e-05, "epoch": 1.1721775394697647, "percentage": 11.72, "elapsed_time": "0:32:19", "remaining_time": "4:03:28", "throughput": 2339.1, "total_tokens": 4537408} {"current_steps": 7875, "total_steps": 67140, "loss": 0.715, "lr": 4.995454868997421e-05, "epoch": 1.1729222520107239, "percentage": 11.73, "elapsed_time": "0:32:21", "remaining_time": "4:03:27", "throughput": 2339.34, "total_tokens": 4540736} {"current_steps": 7880, "total_steps": 67140, "loss": 0.5697, "lr": 4.9954156143945575e-05, "epoch": 1.173666964551683, "percentage": 11.74, "elapsed_time": "0:32:22", "remaining_time": "4:03:25", "throughput": 2339.46, "total_tokens": 4543584} {"current_steps": 7885, "total_steps": 67140, "loss": 0.6582, "lr": 4.9953761911616515e-05, "epoch": 1.1744116770926423, "percentage": 11.74, "elapsed_time": "0:32:23", "remaining_time": "4:03:23", "throughput": 2339.65, "total_tokens": 4546656} {"current_steps": 7890, "total_steps": 67140, "loss": 0.7498, "lr": 4.995336599301368e-05, "epoch": 1.1751563896336015, "percentage": 11.75, "elapsed_time": "0:32:24", "remaining_time": "4:03:21", "throughput": 2339.72, "total_tokens": 4549376} {"current_steps": 7895, "total_steps": 67140, "loss": 0.7204, "lr": 4.9952968388163826e-05, "epoch": 1.1759011021745607, "percentage": 11.76, "elapsed_time": "0:32:25", "remaining_time": "4:03:19", "throughput": 2339.8, "total_tokens": 4552128} {"current_steps": 7900, "total_steps": 67140, "loss": 0.8326, "lr": 4.995256909709382e-05, "epoch": 1.1766458147155199, "percentage": 11.77, "elapsed_time": "0:32:26", "remaining_time": "4:03:17", "throughput": 2339.82, "total_tokens": 4554720} {"current_steps": 7905, "total_steps": 67140, "loss": 0.5168, "lr": 4.9952168119830644e-05, "epoch": 1.177390527256479, "percentage": 11.77, "elapsed_time": "0:32:27", "remaining_time": "4:03:14", "throughput": 2339.9, "total_tokens": 4557472} {"current_steps": 7910, "total_steps": 67140, "loss": 0.6928, "lr": 4.995176545640139e-05, "epoch": 1.1781352397974383, "percentage": 11.78, "elapsed_time": "0:32:28", "remaining_time": "4:03:13", "throughput": 2340.1, "total_tokens": 4560576} {"current_steps": 7915, "total_steps": 67140, "loss": 0.6617, "lr": 4.995136110683328e-05, "epoch": 1.1788799523383973, "percentage": 11.79, "elapsed_time": "0:32:30", "remaining_time": "4:03:11", "throughput": 2340.25, "total_tokens": 4563552} {"current_steps": 7920, "total_steps": 67140, "loss": 0.6873, "lr": 4.995095507115363e-05, "epoch": 1.1796246648793565, "percentage": 11.8, "elapsed_time": "0:32:31", "remaining_time": "4:03:09", "throughput": 2340.29, "total_tokens": 4566208} {"current_steps": 7925, "total_steps": 67140, "loss": 0.5974, "lr": 4.9950547349389873e-05, "epoch": 1.1803693774203157, "percentage": 11.8, "elapsed_time": "0:32:32", "remaining_time": "4:03:07", "throughput": 2340.47, "total_tokens": 4569248} {"current_steps": 7930, "total_steps": 67140, "loss": 0.5979, "lr": 4.995013794156957e-05, "epoch": 1.1811140899612749, "percentage": 11.81, "elapsed_time": "0:32:33", "remaining_time": "4:03:05", "throughput": 2340.51, "total_tokens": 4571904} {"current_steps": 7935, "total_steps": 67140, "loss": 0.7313, "lr": 4.994972684772039e-05, "epoch": 1.181858802502234, "percentage": 11.82, "elapsed_time": "0:32:34", "remaining_time": "4:03:03", "throughput": 2340.58, "total_tokens": 4574688} {"current_steps": 7940, "total_steps": 67140, "loss": 0.8024, "lr": 4.9949314067870105e-05, "epoch": 1.1826035150431933, "percentage": 11.83, "elapsed_time": "0:32:35", "remaining_time": "4:03:00", "throughput": 2340.69, "total_tokens": 4577504} {"current_steps": 7945, "total_steps": 67140, "loss": 0.6902, "lr": 4.9948899602046614e-05, "epoch": 1.1833482275841525, "percentage": 11.83, "elapsed_time": "0:32:36", "remaining_time": "4:02:59", "throughput": 2340.8, "total_tokens": 4580384} {"current_steps": 7950, "total_steps": 67140, "loss": 0.7244, "lr": 4.9948483450277915e-05, "epoch": 1.1840929401251117, "percentage": 11.84, "elapsed_time": "0:32:37", "remaining_time": "4:02:57", "throughput": 2340.99, "total_tokens": 4583456} {"current_steps": 7955, "total_steps": 67140, "loss": 0.6745, "lr": 4.9948065612592145e-05, "epoch": 1.1848376526660709, "percentage": 11.85, "elapsed_time": "0:32:39", "remaining_time": "4:02:55", "throughput": 2341.09, "total_tokens": 4586336} {"current_steps": 7960, "total_steps": 67140, "loss": 0.936, "lr": 4.9947646089017534e-05, "epoch": 1.18558236520703, "percentage": 11.86, "elapsed_time": "0:32:40", "remaining_time": "4:02:53", "throughput": 2341.07, "total_tokens": 4588832} {"current_steps": 7965, "total_steps": 67140, "loss": 0.5611, "lr": 4.994722487958242e-05, "epoch": 1.1863270777479893, "percentage": 11.86, "elapsed_time": "0:32:41", "remaining_time": "4:02:50", "throughput": 2341.13, "total_tokens": 4591552} {"current_steps": 7970, "total_steps": 67140, "loss": 0.7316, "lr": 4.994680198431528e-05, "epoch": 1.1870717902889485, "percentage": 11.87, "elapsed_time": "0:32:42", "remaining_time": "4:02:49", "throughput": 2341.34, "total_tokens": 4594752} {"current_steps": 7975, "total_steps": 67140, "loss": 0.7346, "lr": 4.9946377403244695e-05, "epoch": 1.1878165028299077, "percentage": 11.88, "elapsed_time": "0:32:43", "remaining_time": "4:02:47", "throughput": 2341.51, "total_tokens": 4597792} {"current_steps": 7980, "total_steps": 67140, "loss": 0.7438, "lr": 4.994595113639935e-05, "epoch": 1.188561215370867, "percentage": 11.89, "elapsed_time": "0:32:44", "remaining_time": "4:02:45", "throughput": 2341.58, "total_tokens": 4600544} {"current_steps": 7985, "total_steps": 67140, "loss": 0.5136, "lr": 4.994552318380804e-05, "epoch": 1.189305927911826, "percentage": 11.89, "elapsed_time": "0:32:45", "remaining_time": "4:02:43", "throughput": 2341.67, "total_tokens": 4603392} {"current_steps": 7990, "total_steps": 67140, "loss": 0.8104, "lr": 4.9945093545499706e-05, "epoch": 1.1900506404527853, "percentage": 11.9, "elapsed_time": "0:32:46", "remaining_time": "4:02:41", "throughput": 2341.73, "total_tokens": 4606112} {"current_steps": 7995, "total_steps": 67140, "loss": 0.6473, "lr": 4.9944662221503364e-05, "epoch": 1.1907953529937445, "percentage": 11.91, "elapsed_time": "0:32:48", "remaining_time": "4:02:39", "throughput": 2341.88, "total_tokens": 4609120} {"current_steps": 8000, "total_steps": 67140, "loss": 0.6599, "lr": 4.9944229211848166e-05, "epoch": 1.1915400655347037, "percentage": 11.92, "elapsed_time": "0:32:49", "remaining_time": "4:02:37", "throughput": 2341.96, "total_tokens": 4611904} {"current_steps": 8005, "total_steps": 67140, "loss": 0.6746, "lr": 4.9943794516563366e-05, "epoch": 1.192284778075663, "percentage": 11.92, "elapsed_time": "0:32:50", "remaining_time": "4:02:35", "throughput": 2341.99, "total_tokens": 4614528} {"current_steps": 8010, "total_steps": 67140, "loss": 0.7814, "lr": 4.9943358135678366e-05, "epoch": 1.193029490616622, "percentage": 11.93, "elapsed_time": "0:32:51", "remaining_time": "4:02:33", "throughput": 2342.11, "total_tokens": 4617408} {"current_steps": 8015, "total_steps": 67140, "loss": 0.7049, "lr": 4.994292006922262e-05, "epoch": 1.193774203157581, "percentage": 11.94, "elapsed_time": "0:32:52", "remaining_time": "4:02:31", "throughput": 2342.21, "total_tokens": 4620256} {"current_steps": 8020, "total_steps": 67140, "loss": 0.6793, "lr": 4.994248031722575e-05, "epoch": 1.1945189156985403, "percentage": 11.95, "elapsed_time": "0:32:53", "remaining_time": "4:02:29", "throughput": 2342.32, "total_tokens": 4623136} {"current_steps": 8025, "total_steps": 67140, "loss": 0.6318, "lr": 4.994203887971747e-05, "epoch": 1.1952636282394995, "percentage": 11.95, "elapsed_time": "0:32:54", "remaining_time": "4:02:27", "throughput": 2342.36, "total_tokens": 4625792} {"current_steps": 8030, "total_steps": 67140, "loss": 0.6568, "lr": 4.994159575672761e-05, "epoch": 1.1960083407804587, "percentage": 11.96, "elapsed_time": "0:32:55", "remaining_time": "4:02:25", "throughput": 2342.44, "total_tokens": 4628544} {"current_steps": 8035, "total_steps": 67140, "loss": 0.8163, "lr": 4.9941150948286106e-05, "epoch": 1.196753053321418, "percentage": 11.97, "elapsed_time": "0:32:57", "remaining_time": "4:02:23", "throughput": 2342.5, "total_tokens": 4631232} {"current_steps": 8040, "total_steps": 67140, "loss": 0.6225, "lr": 4.994070445442304e-05, "epoch": 1.197497765862377, "percentage": 11.97, "elapsed_time": "0:32:58", "remaining_time": "4:02:21", "throughput": 2342.61, "total_tokens": 4634144} {"current_steps": 8045, "total_steps": 67140, "loss": 0.6658, "lr": 4.994025627516856e-05, "epoch": 1.1982424784033363, "percentage": 11.98, "elapsed_time": "0:32:59", "remaining_time": "4:02:19", "throughput": 2342.75, "total_tokens": 4637088} {"current_steps": 8050, "total_steps": 67140, "loss": 0.7998, "lr": 4.9939806410552955e-05, "epoch": 1.1989871909442955, "percentage": 11.99, "elapsed_time": "0:33:00", "remaining_time": "4:02:17", "throughput": 2342.8, "total_tokens": 4639840} {"current_steps": 8055, "total_steps": 67140, "loss": 0.7152, "lr": 4.9939354860606636e-05, "epoch": 1.1997319034852547, "percentage": 12.0, "elapsed_time": "0:33:01", "remaining_time": "4:02:15", "throughput": 2342.81, "total_tokens": 4642400} {"current_steps": 8060, "total_steps": 67140, "loss": 0.7196, "lr": 4.9938901625360115e-05, "epoch": 1.200476616026214, "percentage": 12.0, "elapsed_time": "0:33:02", "remaining_time": "4:02:12", "throughput": 2342.8, "total_tokens": 4644960} {"current_steps": 8065, "total_steps": 67140, "loss": 0.6883, "lr": 4.993844670484401e-05, "epoch": 1.2012213285671731, "percentage": 12.01, "elapsed_time": "0:33:03", "remaining_time": "4:02:10", "throughput": 2342.88, "total_tokens": 4647680} {"current_steps": 8070, "total_steps": 67140, "loss": 0.7572, "lr": 4.993799009908907e-05, "epoch": 1.2019660411081323, "percentage": 12.02, "elapsed_time": "0:33:04", "remaining_time": "4:02:08", "throughput": 2342.97, "total_tokens": 4650496} {"current_steps": 8075, "total_steps": 67140, "loss": 0.6345, "lr": 4.9937531808126155e-05, "epoch": 1.2027107536490915, "percentage": 12.03, "elapsed_time": "0:33:06", "remaining_time": "4:02:06", "throughput": 2343.05, "total_tokens": 4653312} {"current_steps": 8080, "total_steps": 67140, "loss": 0.7949, "lr": 4.993707183198623e-05, "epoch": 1.2034554661900507, "percentage": 12.03, "elapsed_time": "0:33:07", "remaining_time": "4:02:04", "throughput": 2343.13, "total_tokens": 4656064} {"current_steps": 8085, "total_steps": 67140, "loss": 0.6608, "lr": 4.993661017070037e-05, "epoch": 1.2042001787310097, "percentage": 12.04, "elapsed_time": "0:33:08", "remaining_time": "4:02:02", "throughput": 2343.17, "total_tokens": 4658720} {"current_steps": 8090, "total_steps": 67140, "loss": 0.6137, "lr": 4.993614682429978e-05, "epoch": 1.204944891271969, "percentage": 12.05, "elapsed_time": "0:33:09", "remaining_time": "4:02:01", "throughput": 2343.44, "total_tokens": 4662176} {"current_steps": 8095, "total_steps": 67140, "loss": 0.7453, "lr": 4.993568179281577e-05, "epoch": 1.2056896038129281, "percentage": 12.06, "elapsed_time": "0:33:10", "remaining_time": "4:01:59", "throughput": 2343.6, "total_tokens": 4665152} {"current_steps": 8100, "total_steps": 67140, "loss": 0.8035, "lr": 4.9935215076279766e-05, "epoch": 1.2064343163538873, "percentage": 12.06, "elapsed_time": "0:33:11", "remaining_time": "4:01:57", "throughput": 2343.73, "total_tokens": 4668096} {"current_steps": 8105, "total_steps": 67140, "loss": 0.7766, "lr": 4.993474667472331e-05, "epoch": 1.2071790288948465, "percentage": 12.07, "elapsed_time": "0:33:12", "remaining_time": "4:01:55", "throughput": 2343.85, "total_tokens": 4671040} {"current_steps": 8110, "total_steps": 67140, "loss": 0.8234, "lr": 4.9934276588178054e-05, "epoch": 1.2079237414358057, "percentage": 12.08, "elapsed_time": "0:33:14", "remaining_time": "4:01:53", "throughput": 2343.97, "total_tokens": 4673952} {"current_steps": 8115, "total_steps": 67140, "loss": 0.7272, "lr": 4.993380481667576e-05, "epoch": 1.208668453976765, "percentage": 12.09, "elapsed_time": "0:33:15", "remaining_time": "4:01:52", "throughput": 2344.12, "total_tokens": 4676928} {"current_steps": 8120, "total_steps": 67140, "loss": 0.6567, "lr": 4.9933331360248306e-05, "epoch": 1.2094131665177241, "percentage": 12.09, "elapsed_time": "0:33:16", "remaining_time": "4:01:50", "throughput": 2344.23, "total_tokens": 4679776} {"current_steps": 8125, "total_steps": 67140, "loss": 0.7257, "lr": 4.993285621892769e-05, "epoch": 1.2101578790586833, "percentage": 12.1, "elapsed_time": "0:33:17", "remaining_time": "4:01:48", "throughput": 2344.32, "total_tokens": 4682624} {"current_steps": 8130, "total_steps": 67140, "loss": 0.7148, "lr": 4.993237939274602e-05, "epoch": 1.2109025915996425, "percentage": 12.11, "elapsed_time": "0:33:18", "remaining_time": "4:01:45", "throughput": 2344.36, "total_tokens": 4685280} {"current_steps": 8135, "total_steps": 67140, "loss": 0.705, "lr": 4.9931900881735517e-05, "epoch": 1.2116473041406017, "percentage": 12.12, "elapsed_time": "0:33:19", "remaining_time": "4:01:43", "throughput": 2344.49, "total_tokens": 4688192} {"current_steps": 8140, "total_steps": 67140, "loss": 0.7289, "lr": 4.993142068592852e-05, "epoch": 1.212392016681561, "percentage": 12.12, "elapsed_time": "0:33:20", "remaining_time": "4:01:41", "throughput": 2344.6, "total_tokens": 4691008} {"current_steps": 8145, "total_steps": 67140, "loss": 0.6772, "lr": 4.993093880535748e-05, "epoch": 1.2131367292225201, "percentage": 12.13, "elapsed_time": "0:33:21", "remaining_time": "4:01:40", "throughput": 2344.76, "total_tokens": 4694080} {"current_steps": 8150, "total_steps": 67140, "loss": 0.6436, "lr": 4.993045524005496e-05, "epoch": 1.2138814417634793, "percentage": 12.14, "elapsed_time": "0:33:23", "remaining_time": "4:01:38", "throughput": 2344.86, "total_tokens": 4696896} {"current_steps": 8155, "total_steps": 67140, "loss": 0.6643, "lr": 4.992996999005363e-05, "epoch": 1.2146261543044385, "percentage": 12.15, "elapsed_time": "0:33:24", "remaining_time": "4:01:36", "throughput": 2344.95, "total_tokens": 4699712} {"current_steps": 8160, "total_steps": 67140, "loss": 0.6304, "lr": 4.992948305538628e-05, "epoch": 1.2153708668453977, "percentage": 12.15, "elapsed_time": "0:33:25", "remaining_time": "4:01:34", "throughput": 2345.05, "total_tokens": 4702528} {"current_steps": 8165, "total_steps": 67140, "loss": 0.6933, "lr": 4.992899443608583e-05, "epoch": 1.216115579386357, "percentage": 12.16, "elapsed_time": "0:33:26", "remaining_time": "4:01:31", "throughput": 2345.03, "total_tokens": 4705024} {"current_steps": 8170, "total_steps": 67140, "loss": 0.5345, "lr": 4.9928504132185284e-05, "epoch": 1.2168602919273162, "percentage": 12.17, "elapsed_time": "0:33:27", "remaining_time": "4:01:29", "throughput": 2345.11, "total_tokens": 4707776} {"current_steps": 8175, "total_steps": 67140, "loss": 0.6827, "lr": 4.992801214371778e-05, "epoch": 1.2176050044682754, "percentage": 12.18, "elapsed_time": "0:33:28", "remaining_time": "4:01:27", "throughput": 2345.16, "total_tokens": 4710496} {"current_steps": 8180, "total_steps": 67140, "loss": 0.7029, "lr": 4.992751847071657e-05, "epoch": 1.2183497170092346, "percentage": 12.18, "elapsed_time": "0:33:29", "remaining_time": "4:01:26", "throughput": 2345.35, "total_tokens": 4713632} {"current_steps": 8185, "total_steps": 67140, "loss": 0.6977, "lr": 4.992702311321501e-05, "epoch": 1.2190944295501935, "percentage": 12.19, "elapsed_time": "0:33:30", "remaining_time": "4:01:24", "throughput": 2345.48, "total_tokens": 4716512} {"current_steps": 8190, "total_steps": 67140, "loss": 0.6311, "lr": 4.992652607124658e-05, "epoch": 1.2198391420911527, "percentage": 12.2, "elapsed_time": "0:33:32", "remaining_time": "4:01:22", "throughput": 2345.58, "total_tokens": 4719392} {"current_steps": 8195, "total_steps": 67140, "loss": 0.5925, "lr": 4.992602734484485e-05, "epoch": 1.220583854632112, "percentage": 12.21, "elapsed_time": "0:33:33", "remaining_time": "4:01:20", "throughput": 2345.69, "total_tokens": 4722304} {"current_steps": 8200, "total_steps": 67140, "loss": 0.8112, "lr": 4.992552693404354e-05, "epoch": 1.2213285671730711, "percentage": 12.21, "elapsed_time": "0:33:34", "remaining_time": "4:01:18", "throughput": 2345.74, "total_tokens": 4724960} {"current_steps": 8205, "total_steps": 67140, "loss": 0.5891, "lr": 4.992502483887645e-05, "epoch": 1.2220732797140303, "percentage": 12.22, "elapsed_time": "0:33:35", "remaining_time": "4:01:16", "throughput": 2345.83, "total_tokens": 4727808} {"current_steps": 8210, "total_steps": 67140, "loss": 0.7517, "lr": 4.9924521059377535e-05, "epoch": 1.2228179922549895, "percentage": 12.23, "elapsed_time": "0:33:36", "remaining_time": "4:01:14", "throughput": 2346.02, "total_tokens": 4730944} {"current_steps": 8215, "total_steps": 67140, "loss": 0.7452, "lr": 4.992401559558081e-05, "epoch": 1.2235627047959488, "percentage": 12.24, "elapsed_time": "0:33:37", "remaining_time": "4:01:12", "throughput": 2346.08, "total_tokens": 4733664} {"current_steps": 8220, "total_steps": 67140, "loss": 0.6302, "lr": 4.992350844752045e-05, "epoch": 1.224307417336908, "percentage": 12.24, "elapsed_time": "0:33:38", "remaining_time": "4:01:10", "throughput": 2346.21, "total_tokens": 4736608} {"current_steps": 8225, "total_steps": 67140, "loss": 0.6868, "lr": 4.9922999615230726e-05, "epoch": 1.2250521298778672, "percentage": 12.25, "elapsed_time": "0:33:40", "remaining_time": "4:01:09", "throughput": 2346.43, "total_tokens": 4739904} {"current_steps": 8230, "total_steps": 67140, "loss": 0.5808, "lr": 4.992248909874601e-05, "epoch": 1.2257968424188264, "percentage": 12.26, "elapsed_time": "0:33:41", "remaining_time": "4:01:07", "throughput": 2346.54, "total_tokens": 4742784} {"current_steps": 8235, "total_steps": 67140, "loss": 0.7104, "lr": 4.992197689810081e-05, "epoch": 1.2265415549597856, "percentage": 12.27, "elapsed_time": "0:33:42", "remaining_time": "4:01:05", "throughput": 2346.67, "total_tokens": 4745696} {"current_steps": 8240, "total_steps": 67140, "loss": 0.5105, "lr": 4.9921463013329736e-05, "epoch": 1.2272862675007448, "percentage": 12.27, "elapsed_time": "0:33:43", "remaining_time": "4:01:04", "throughput": 2346.84, "total_tokens": 4748800} {"current_steps": 8245, "total_steps": 67140, "loss": 0.6515, "lr": 4.9920947444467515e-05, "epoch": 1.228030980041704, "percentage": 12.28, "elapsed_time": "0:33:44", "remaining_time": "4:01:02", "throughput": 2346.95, "total_tokens": 4751712} {"current_steps": 8250, "total_steps": 67140, "loss": 0.7422, "lr": 4.9920430191548986e-05, "epoch": 1.2287756925826632, "percentage": 12.29, "elapsed_time": "0:33:45", "remaining_time": "4:01:00", "throughput": 2347.01, "total_tokens": 4754464} {"current_steps": 8255, "total_steps": 67140, "loss": 0.5327, "lr": 4.9919911254609105e-05, "epoch": 1.2295204051236224, "percentage": 12.3, "elapsed_time": "0:33:46", "remaining_time": "4:00:58", "throughput": 2347.1, "total_tokens": 4757280} {"current_steps": 8260, "total_steps": 67140, "loss": 0.7482, "lr": 4.991939063368294e-05, "epoch": 1.2302651176645814, "percentage": 12.3, "elapsed_time": "0:33:48", "remaining_time": "4:00:56", "throughput": 2347.19, "total_tokens": 4760128} {"current_steps": 8265, "total_steps": 67140, "loss": 0.6635, "lr": 4.991886832880567e-05, "epoch": 1.2310098302055406, "percentage": 12.31, "elapsed_time": "0:33:49", "remaining_time": "4:00:54", "throughput": 2347.29, "total_tokens": 4762976} {"current_steps": 8270, "total_steps": 67140, "loss": 0.8059, "lr": 4.9918344340012584e-05, "epoch": 1.2317545427464998, "percentage": 12.32, "elapsed_time": "0:33:50", "remaining_time": "4:00:52", "throughput": 2347.43, "total_tokens": 4765920} {"current_steps": 8275, "total_steps": 67140, "loss": 0.7374, "lr": 4.99178186673391e-05, "epoch": 1.232499255287459, "percentage": 12.32, "elapsed_time": "0:33:51", "remaining_time": "4:00:50", "throughput": 2347.52, "total_tokens": 4768736} {"current_steps": 8280, "total_steps": 67140, "loss": 0.745, "lr": 4.9917291310820745e-05, "epoch": 1.2332439678284182, "percentage": 12.33, "elapsed_time": "0:33:52", "remaining_time": "4:00:48", "throughput": 2347.58, "total_tokens": 4771488} {"current_steps": 8285, "total_steps": 67140, "loss": 0.6341, "lr": 4.9916762270493154e-05, "epoch": 1.2339886803693774, "percentage": 12.34, "elapsed_time": "0:33:53", "remaining_time": "4:00:46", "throughput": 2347.69, "total_tokens": 4774368} {"current_steps": 8290, "total_steps": 67140, "loss": 0.7154, "lr": 4.991623154639207e-05, "epoch": 1.2347333929103366, "percentage": 12.35, "elapsed_time": "0:33:54", "remaining_time": "4:00:44", "throughput": 2347.77, "total_tokens": 4777216} {"current_steps": 8295, "total_steps": 67140, "loss": 0.545, "lr": 4.991569913855335e-05, "epoch": 1.2354781054512958, "percentage": 12.35, "elapsed_time": "0:33:55", "remaining_time": "4:00:43", "throughput": 2347.9, "total_tokens": 4780192} {"current_steps": 8300, "total_steps": 67140, "loss": 0.8353, "lr": 4.991516504701299e-05, "epoch": 1.236222817992255, "percentage": 12.36, "elapsed_time": "0:33:57", "remaining_time": "4:00:41", "throughput": 2348.05, "total_tokens": 4783232} {"current_steps": 8305, "total_steps": 67140, "loss": 0.7263, "lr": 4.991462927180707e-05, "epoch": 1.2369675305332142, "percentage": 12.37, "elapsed_time": "0:33:58", "remaining_time": "4:00:39", "throughput": 2348.2, "total_tokens": 4786208} {"current_steps": 8310, "total_steps": 67140, "loss": 0.7736, "lr": 4.991409181297181e-05, "epoch": 1.2377122430741734, "percentage": 12.38, "elapsed_time": "0:33:59", "remaining_time": "4:00:37", "throughput": 2348.28, "total_tokens": 4789024} {"current_steps": 8315, "total_steps": 67140, "loss": 0.7485, "lr": 4.991355267054351e-05, "epoch": 1.2384569556151326, "percentage": 12.38, "elapsed_time": "0:34:00", "remaining_time": "4:00:35", "throughput": 2348.37, "total_tokens": 4791808} {"current_steps": 8320, "total_steps": 67140, "loss": 0.6938, "lr": 4.991301184455861e-05, "epoch": 1.2392016681560918, "percentage": 12.39, "elapsed_time": "0:34:01", "remaining_time": "4:00:33", "throughput": 2348.45, "total_tokens": 4794592} {"current_steps": 8325, "total_steps": 67140, "loss": 0.5908, "lr": 4.9912469335053656e-05, "epoch": 1.239946380697051, "percentage": 12.4, "elapsed_time": "0:34:02", "remaining_time": "4:00:31", "throughput": 2348.62, "total_tokens": 4797664} {"current_steps": 8330, "total_steps": 67140, "loss": 0.584, "lr": 4.991192514206532e-05, "epoch": 1.2406910932380102, "percentage": 12.41, "elapsed_time": "0:34:03", "remaining_time": "4:00:29", "throughput": 2348.66, "total_tokens": 4800352} {"current_steps": 8335, "total_steps": 67140, "loss": 0.7618, "lr": 4.991137926563036e-05, "epoch": 1.2414358057789694, "percentage": 12.41, "elapsed_time": "0:34:04", "remaining_time": "4:00:27", "throughput": 2348.72, "total_tokens": 4803040} {"current_steps": 8340, "total_steps": 67140, "loss": 0.5937, "lr": 4.991083170578568e-05, "epoch": 1.2421805183199286, "percentage": 12.42, "elapsed_time": "0:34:06", "remaining_time": "4:00:25", "throughput": 2348.86, "total_tokens": 4806048} {"current_steps": 8345, "total_steps": 67140, "loss": 0.8666, "lr": 4.991028246256826e-05, "epoch": 1.2429252308608878, "percentage": 12.43, "elapsed_time": "0:34:07", "remaining_time": "4:00:23", "throughput": 2348.95, "total_tokens": 4808864} {"current_steps": 8350, "total_steps": 67140, "loss": 0.8009, "lr": 4.9909731536015235e-05, "epoch": 1.243669943401847, "percentage": 12.44, "elapsed_time": "0:34:08", "remaining_time": "4:00:21", "throughput": 2349.04, "total_tokens": 4811680} {"current_steps": 8355, "total_steps": 67140, "loss": 0.7615, "lr": 4.9909178926163835e-05, "epoch": 1.244414655942806, "percentage": 12.44, "elapsed_time": "0:34:09", "remaining_time": "4:00:20", "throughput": 2349.24, "total_tokens": 4814880} {"current_steps": 8360, "total_steps": 67140, "loss": 0.7006, "lr": 4.9908624633051395e-05, "epoch": 1.2451593684837652, "percentage": 12.45, "elapsed_time": "0:34:10", "remaining_time": "4:00:18", "throughput": 2349.43, "total_tokens": 4818048} {"current_steps": 8365, "total_steps": 67140, "loss": 0.8166, "lr": 4.990806865671537e-05, "epoch": 1.2459040810247244, "percentage": 12.46, "elapsed_time": "0:34:11", "remaining_time": "4:00:17", "throughput": 2349.63, "total_tokens": 4821248} {"current_steps": 8370, "total_steps": 67140, "loss": 0.7201, "lr": 4.990751099719333e-05, "epoch": 1.2466487935656836, "percentage": 12.47, "elapsed_time": "0:34:13", "remaining_time": "4:00:15", "throughput": 2349.75, "total_tokens": 4824160} {"current_steps": 8375, "total_steps": 67140, "loss": 0.7263, "lr": 4.990695165452297e-05, "epoch": 1.2473935061066428, "percentage": 12.47, "elapsed_time": "0:34:14", "remaining_time": "4:00:13", "throughput": 2349.8, "total_tokens": 4826848} {"current_steps": 8380, "total_steps": 67140, "loss": 0.7286, "lr": 4.990639062874208e-05, "epoch": 1.248138218647602, "percentage": 12.48, "elapsed_time": "0:34:15", "remaining_time": "4:00:11", "throughput": 2349.88, "total_tokens": 4829696} {"current_steps": 8385, "total_steps": 67140, "loss": 0.6597, "lr": 4.990582791988857e-05, "epoch": 1.2488829311885612, "percentage": 12.49, "elapsed_time": "0:34:16", "remaining_time": "4:00:09", "throughput": 2349.95, "total_tokens": 4832512} {"current_steps": 8390, "total_steps": 67140, "loss": 0.6411, "lr": 4.990526352800047e-05, "epoch": 1.2496276437295204, "percentage": 12.5, "elapsed_time": "0:34:17", "remaining_time": "4:00:07", "throughput": 2350.09, "total_tokens": 4835488} {"current_steps": 8395, "total_steps": 67140, "loss": 0.6128, "lr": 4.990469745311592e-05, "epoch": 1.2503723562704796, "percentage": 12.5, "elapsed_time": "0:34:18", "remaining_time": "4:00:05", "throughput": 2350.18, "total_tokens": 4838304} {"current_steps": 8400, "total_steps": 67140, "loss": 0.7143, "lr": 4.990412969527317e-05, "epoch": 1.2511170688114388, "percentage": 12.51, "elapsed_time": "0:34:19", "remaining_time": "4:00:03", "throughput": 2350.18, "total_tokens": 4840832} {"current_steps": 8405, "total_steps": 67140, "loss": 0.654, "lr": 4.99035602545106e-05, "epoch": 1.251861781352398, "percentage": 12.52, "elapsed_time": "0:34:20", "remaining_time": "4:00:01", "throughput": 2350.28, "total_tokens": 4843680} {"current_steps": 8410, "total_steps": 67140, "loss": 0.6503, "lr": 4.990298913086666e-05, "epoch": 1.2526064938933572, "percentage": 12.53, "elapsed_time": "0:34:22", "remaining_time": "3:59:59", "throughput": 2350.44, "total_tokens": 4846720} {"current_steps": 8415, "total_steps": 67140, "loss": 0.7957, "lr": 4.990241632437997e-05, "epoch": 1.2533512064343164, "percentage": 12.53, "elapsed_time": "0:34:23", "remaining_time": "3:59:58", "throughput": 2350.58, "total_tokens": 4849728} {"current_steps": 8420, "total_steps": 67140, "loss": 0.6374, "lr": 4.990184183508923e-05, "epoch": 1.2540959189752756, "percentage": 12.54, "elapsed_time": "0:34:24", "remaining_time": "3:59:56", "throughput": 2350.76, "total_tokens": 4852800} {"current_steps": 8425, "total_steps": 67140, "loss": 0.7463, "lr": 4.990126566303326e-05, "epoch": 1.2548406315162346, "percentage": 12.55, "elapsed_time": "0:34:25", "remaining_time": "3:59:54", "throughput": 2350.91, "total_tokens": 4855776} {"current_steps": 8430, "total_steps": 67140, "loss": 0.8353, "lr": 4.9900687808251e-05, "epoch": 1.2555853440571938, "percentage": 12.56, "elapsed_time": "0:34:26", "remaining_time": "3:59:52", "throughput": 2350.99, "total_tokens": 4858592} {"current_steps": 8435, "total_steps": 67140, "loss": 0.6182, "lr": 4.99001082707815e-05, "epoch": 1.256330056598153, "percentage": 12.56, "elapsed_time": "0:34:27", "remaining_time": "3:59:50", "throughput": 2351.08, "total_tokens": 4861408} {"current_steps": 8440, "total_steps": 67140, "loss": 0.6538, "lr": 4.989952705066392e-05, "epoch": 1.2570747691391122, "percentage": 12.57, "elapsed_time": "0:34:28", "remaining_time": "3:59:48", "throughput": 2351.15, "total_tokens": 4864224} {"current_steps": 8445, "total_steps": 67140, "loss": 0.731, "lr": 4.9898944147937534e-05, "epoch": 1.2578194816800714, "percentage": 12.58, "elapsed_time": "0:34:29", "remaining_time": "3:59:46", "throughput": 2351.21, "total_tokens": 4866944} {"current_steps": 8450, "total_steps": 67140, "loss": 0.7131, "lr": 4.989835956264173e-05, "epoch": 1.2585641942210306, "percentage": 12.59, "elapsed_time": "0:34:31", "remaining_time": "3:59:45", "throughput": 2351.36, "total_tokens": 4870016} {"current_steps": 8455, "total_steps": 67140, "loss": 0.6564, "lr": 4.989777329481602e-05, "epoch": 1.2593089067619898, "percentage": 12.59, "elapsed_time": "0:34:32", "remaining_time": "3:59:43", "throughput": 2351.46, "total_tokens": 4872864} {"current_steps": 8460, "total_steps": 67140, "loss": 0.727, "lr": 4.989718534450002e-05, "epoch": 1.260053619302949, "percentage": 12.6, "elapsed_time": "0:34:33", "remaining_time": "3:59:41", "throughput": 2351.52, "total_tokens": 4875584} {"current_steps": 8465, "total_steps": 67140, "loss": 0.6023, "lr": 4.989659571173345e-05, "epoch": 1.2607983318439082, "percentage": 12.61, "elapsed_time": "0:34:34", "remaining_time": "3:59:39", "throughput": 2351.61, "total_tokens": 4878400} {"current_steps": 8470, "total_steps": 67140, "loss": 0.7928, "lr": 4.9896004396556176e-05, "epoch": 1.2615430443848674, "percentage": 12.62, "elapsed_time": "0:34:35", "remaining_time": "3:59:37", "throughput": 2351.77, "total_tokens": 4881440} {"current_steps": 8475, "total_steps": 67140, "loss": 0.7058, "lr": 4.989541139900814e-05, "epoch": 1.2622877569258266, "percentage": 12.62, "elapsed_time": "0:34:36", "remaining_time": "3:59:35", "throughput": 2351.97, "total_tokens": 4884608} {"current_steps": 8480, "total_steps": 67140, "loss": 0.7891, "lr": 4.989481671912941e-05, "epoch": 1.2630324694667858, "percentage": 12.63, "elapsed_time": "0:34:37", "remaining_time": "3:59:34", "throughput": 2352.09, "total_tokens": 4887520} {"current_steps": 8485, "total_steps": 67140, "loss": 0.8271, "lr": 4.989422035696019e-05, "epoch": 1.263777182007745, "percentage": 12.64, "elapsed_time": "0:34:39", "remaining_time": "3:59:32", "throughput": 2352.2, "total_tokens": 4890432} {"current_steps": 8490, "total_steps": 67140, "loss": 0.7741, "lr": 4.9893622312540764e-05, "epoch": 1.2645218945487042, "percentage": 12.65, "elapsed_time": "0:34:40", "remaining_time": "3:59:30", "throughput": 2352.23, "total_tokens": 4893056} {"current_steps": 8495, "total_steps": 67140, "loss": 0.6642, "lr": 4.989302258591157e-05, "epoch": 1.2652666070896634, "percentage": 12.65, "elapsed_time": "0:34:41", "remaining_time": "3:59:28", "throughput": 2352.39, "total_tokens": 4896096} {"current_steps": 8500, "total_steps": 67140, "loss": 0.7058, "lr": 4.98924211771131e-05, "epoch": 1.2660113196306226, "percentage": 12.66, "elapsed_time": "0:34:42", "remaining_time": "3:59:26", "throughput": 2352.57, "total_tokens": 4899232} {"current_steps": 8505, "total_steps": 67140, "loss": 0.6607, "lr": 4.9891818086186014e-05, "epoch": 1.2667560321715818, "percentage": 12.67, "elapsed_time": "0:34:43", "remaining_time": "3:59:24", "throughput": 2352.61, "total_tokens": 4901920} {"current_steps": 8510, "total_steps": 67140, "loss": 0.6705, "lr": 4.989121331317107e-05, "epoch": 1.267500744712541, "percentage": 12.68, "elapsed_time": "0:34:44", "remaining_time": "3:59:22", "throughput": 2352.72, "total_tokens": 4904800} {"current_steps": 8515, "total_steps": 67140, "loss": 0.7029, "lr": 4.9890606858109126e-05, "epoch": 1.2682454572535002, "percentage": 12.68, "elapsed_time": "0:34:45", "remaining_time": "3:59:20", "throughput": 2352.75, "total_tokens": 4907456} {"current_steps": 8520, "total_steps": 67140, "loss": 0.7356, "lr": 4.9889998721041173e-05, "epoch": 1.2689901697944594, "percentage": 12.69, "elapsed_time": "0:34:46", "remaining_time": "3:59:19", "throughput": 2352.89, "total_tokens": 4910464} {"current_steps": 8525, "total_steps": 67140, "loss": 0.8206, "lr": 4.98893889020083e-05, "epoch": 1.2697348823354186, "percentage": 12.7, "elapsed_time": "0:34:48", "remaining_time": "3:59:17", "throughput": 2353.07, "total_tokens": 4913600} {"current_steps": 8530, "total_steps": 67140, "loss": 0.6256, "lr": 4.988877740105171e-05, "epoch": 1.2704795948763778, "percentage": 12.7, "elapsed_time": "0:34:49", "remaining_time": "3:59:15", "throughput": 2353.18, "total_tokens": 4916544} {"current_steps": 8535, "total_steps": 67140, "loss": 0.775, "lr": 4.9888164218212746e-05, "epoch": 1.2712243074173368, "percentage": 12.71, "elapsed_time": "0:34:50", "remaining_time": "3:59:13", "throughput": 2353.22, "total_tokens": 4919232} {"current_steps": 8540, "total_steps": 67140, "loss": 0.8356, "lr": 4.988754935353282e-05, "epoch": 1.271969019958296, "percentage": 12.72, "elapsed_time": "0:34:51", "remaining_time": "3:59:11", "throughput": 2353.28, "total_tokens": 4921984} {"current_steps": 8545, "total_steps": 67140, "loss": 0.7431, "lr": 4.988693280705351e-05, "epoch": 1.2727137324992552, "percentage": 12.73, "elapsed_time": "0:34:52", "remaining_time": "3:59:10", "throughput": 2353.38, "total_tokens": 4924896} {"current_steps": 8550, "total_steps": 67140, "loss": 0.7586, "lr": 4.988631457881645e-05, "epoch": 1.2734584450402144, "percentage": 12.73, "elapsed_time": "0:34:53", "remaining_time": "3:59:07", "throughput": 2353.44, "total_tokens": 4927616} {"current_steps": 8555, "total_steps": 67140, "loss": 0.7242, "lr": 4.9885694668863435e-05, "epoch": 1.2742031575811736, "percentage": 12.74, "elapsed_time": "0:34:54", "remaining_time": "3:59:06", "throughput": 2353.58, "total_tokens": 4930624} {"current_steps": 8560, "total_steps": 67140, "loss": 0.6751, "lr": 4.9885073077236354e-05, "epoch": 1.2749478701221328, "percentage": 12.75, "elapsed_time": "0:34:56", "remaining_time": "3:59:04", "throughput": 2353.64, "total_tokens": 4933376} {"current_steps": 8565, "total_steps": 67140, "loss": 0.6268, "lr": 4.988444980397721e-05, "epoch": 1.275692582663092, "percentage": 12.76, "elapsed_time": "0:34:57", "remaining_time": "3:59:02", "throughput": 2353.74, "total_tokens": 4936256} {"current_steps": 8570, "total_steps": 67140, "loss": 0.7802, "lr": 4.9883824849128125e-05, "epoch": 1.2764372952040512, "percentage": 12.76, "elapsed_time": "0:34:58", "remaining_time": "3:59:00", "throughput": 2353.78, "total_tokens": 4938944} {"current_steps": 8575, "total_steps": 67140, "loss": 0.7752, "lr": 4.988319821273132e-05, "epoch": 1.2771820077450105, "percentage": 12.77, "elapsed_time": "0:34:59", "remaining_time": "3:58:59", "throughput": 2354.09, "total_tokens": 4942528} {"current_steps": 8580, "total_steps": 67140, "loss": 0.6974, "lr": 4.9882569894829144e-05, "epoch": 1.2779267202859697, "percentage": 12.78, "elapsed_time": "0:35:00", "remaining_time": "3:58:57", "throughput": 2354.14, "total_tokens": 4945280} {"current_steps": 8585, "total_steps": 67140, "loss": 0.619, "lr": 4.988193989546407e-05, "epoch": 1.2786714328269289, "percentage": 12.79, "elapsed_time": "0:35:01", "remaining_time": "3:58:55", "throughput": 2354.31, "total_tokens": 4948352} {"current_steps": 8590, "total_steps": 67140, "loss": 0.6169, "lr": 4.988130821467866e-05, "epoch": 1.279416145367888, "percentage": 12.79, "elapsed_time": "0:35:02", "remaining_time": "3:58:54", "throughput": 2354.43, "total_tokens": 4951296} {"current_steps": 8595, "total_steps": 67140, "loss": 0.6534, "lr": 4.988067485251559e-05, "epoch": 1.2801608579088473, "percentage": 12.8, "elapsed_time": "0:35:04", "remaining_time": "3:58:51", "throughput": 2354.46, "total_tokens": 4953984} {"current_steps": 8600, "total_steps": 67140, "loss": 0.6562, "lr": 4.988003980901768e-05, "epoch": 1.2809055704498062, "percentage": 12.81, "elapsed_time": "0:35:05", "remaining_time": "3:58:50", "throughput": 2354.51, "total_tokens": 4956736} {"current_steps": 8605, "total_steps": 67140, "loss": 0.7591, "lr": 4.987940308422783e-05, "epoch": 1.2816502829907654, "percentage": 12.82, "elapsed_time": "0:35:06", "remaining_time": "3:58:48", "throughput": 2354.65, "total_tokens": 4959712} {"current_steps": 8610, "total_steps": 67140, "loss": 0.6416, "lr": 4.9878764678189075e-05, "epoch": 1.2823949955317246, "percentage": 12.82, "elapsed_time": "0:35:07", "remaining_time": "3:58:46", "throughput": 2354.83, "total_tokens": 4962816} {"current_steps": 8615, "total_steps": 67140, "loss": 0.7089, "lr": 4.9878124590944555e-05, "epoch": 1.2831397080726838, "percentage": 12.83, "elapsed_time": "0:35:08", "remaining_time": "3:58:45", "throughput": 2355.01, "total_tokens": 4965952} {"current_steps": 8620, "total_steps": 67140, "loss": 0.7044, "lr": 4.9877482822537516e-05, "epoch": 1.283884420613643, "percentage": 12.84, "elapsed_time": "0:35:09", "remaining_time": "3:58:43", "throughput": 2355.09, "total_tokens": 4968832} {"current_steps": 8625, "total_steps": 67140, "loss": 0.6913, "lr": 4.987683937301133e-05, "epoch": 1.2846291331546023, "percentage": 12.85, "elapsed_time": "0:35:10", "remaining_time": "3:58:41", "throughput": 2355.22, "total_tokens": 4971744} {"current_steps": 8630, "total_steps": 67140, "loss": 0.6356, "lr": 4.987619424240949e-05, "epoch": 1.2853738456955615, "percentage": 12.85, "elapsed_time": "0:35:12", "remaining_time": "3:58:39", "throughput": 2355.24, "total_tokens": 4974368} {"current_steps": 8635, "total_steps": 67140, "loss": 0.7154, "lr": 4.9875547430775575e-05, "epoch": 1.2861185582365207, "percentage": 12.86, "elapsed_time": "0:35:13", "remaining_time": "3:58:37", "throughput": 2355.4, "total_tokens": 4977440} {"current_steps": 8640, "total_steps": 67140, "loss": 0.6835, "lr": 4.98748989381533e-05, "epoch": 1.2868632707774799, "percentage": 12.87, "elapsed_time": "0:35:14", "remaining_time": "3:58:35", "throughput": 2355.47, "total_tokens": 4980256} {"current_steps": 8645, "total_steps": 67140, "loss": 0.6912, "lr": 4.98742487645865e-05, "epoch": 1.287607983318439, "percentage": 12.88, "elapsed_time": "0:35:15", "remaining_time": "3:58:34", "throughput": 2355.54, "total_tokens": 4983072} {"current_steps": 8650, "total_steps": 67140, "loss": 0.79, "lr": 4.987359691011909e-05, "epoch": 1.2883526958593983, "percentage": 12.88, "elapsed_time": "0:35:16", "remaining_time": "3:58:32", "throughput": 2355.61, "total_tokens": 4985856} {"current_steps": 8655, "total_steps": 67140, "loss": 0.7182, "lr": 4.987294337479513e-05, "epoch": 1.2890974084003575, "percentage": 12.89, "elapsed_time": "0:35:17", "remaining_time": "3:58:30", "throughput": 2355.77, "total_tokens": 4988896} {"current_steps": 8660, "total_steps": 67140, "loss": 0.8771, "lr": 4.987228815865879e-05, "epoch": 1.2898421209413167, "percentage": 12.9, "elapsed_time": "0:35:18", "remaining_time": "3:58:28", "throughput": 2355.85, "total_tokens": 4991744} {"current_steps": 8665, "total_steps": 67140, "loss": 0.5924, "lr": 4.987163126175434e-05, "epoch": 1.2905868334822759, "percentage": 12.91, "elapsed_time": "0:35:19", "remaining_time": "3:58:26", "throughput": 2355.96, "total_tokens": 4994624} {"current_steps": 8670, "total_steps": 67140, "loss": 0.5901, "lr": 4.987097268412616e-05, "epoch": 1.291331546023235, "percentage": 12.91, "elapsed_time": "0:35:21", "remaining_time": "3:58:24", "throughput": 2356.07, "total_tokens": 4997600} {"current_steps": 8675, "total_steps": 67140, "loss": 0.6172, "lr": 4.987031242581877e-05, "epoch": 1.2920762585641943, "percentage": 12.92, "elapsed_time": "0:35:22", "remaining_time": "3:58:23", "throughput": 2356.18, "total_tokens": 5000544} {"current_steps": 8680, "total_steps": 67140, "loss": 0.7066, "lr": 4.9869650486876786e-05, "epoch": 1.2928209711051535, "percentage": 12.93, "elapsed_time": "0:35:23", "remaining_time": "3:58:21", "throughput": 2356.34, "total_tokens": 5003616} {"current_steps": 8685, "total_steps": 67140, "loss": 0.7014, "lr": 4.986898686734493e-05, "epoch": 1.2935656836461127, "percentage": 12.94, "elapsed_time": "0:35:24", "remaining_time": "3:58:19", "throughput": 2356.41, "total_tokens": 5006400} {"current_steps": 8690, "total_steps": 67140, "loss": 0.7692, "lr": 4.9868321567268043e-05, "epoch": 1.2943103961870719, "percentage": 12.94, "elapsed_time": "0:35:25", "remaining_time": "3:58:17", "throughput": 2356.37, "total_tokens": 5008832} {"current_steps": 8695, "total_steps": 67140, "loss": 0.5875, "lr": 4.98676545866911e-05, "epoch": 1.295055108728031, "percentage": 12.95, "elapsed_time": "0:35:26", "remaining_time": "3:58:15", "throughput": 2356.49, "total_tokens": 5011776} {"current_steps": 8700, "total_steps": 67140, "loss": 0.7002, "lr": 4.986698592565917e-05, "epoch": 1.2957998212689903, "percentage": 12.96, "elapsed_time": "0:35:27", "remaining_time": "3:58:13", "throughput": 2356.55, "total_tokens": 5014560} {"current_steps": 8705, "total_steps": 67140, "loss": 0.6595, "lr": 4.986631558421742e-05, "epoch": 1.2965445338099495, "percentage": 12.97, "elapsed_time": "0:35:28", "remaining_time": "3:58:11", "throughput": 2356.52, "total_tokens": 5016992} {"current_steps": 8710, "total_steps": 67140, "loss": 0.5709, "lr": 4.986564356241117e-05, "epoch": 1.2972892463509085, "percentage": 12.97, "elapsed_time": "0:35:30", "remaining_time": "3:58:09", "throughput": 2356.6, "total_tokens": 5019904} {"current_steps": 8715, "total_steps": 67140, "loss": 0.6577, "lr": 4.986496986028583e-05, "epoch": 1.2980339588918677, "percentage": 12.98, "elapsed_time": "0:35:31", "remaining_time": "3:58:07", "throughput": 2356.69, "total_tokens": 5022752} {"current_steps": 8720, "total_steps": 67140, "loss": 0.6701, "lr": 4.986429447788691e-05, "epoch": 1.2987786714328269, "percentage": 12.99, "elapsed_time": "0:35:32", "remaining_time": "3:58:05", "throughput": 2356.73, "total_tokens": 5025408} {"current_steps": 8725, "total_steps": 67140, "loss": 0.8648, "lr": 4.986361741526006e-05, "epoch": 1.299523383973786, "percentage": 13.0, "elapsed_time": "0:35:33", "remaining_time": "3:58:04", "throughput": 2356.91, "total_tokens": 5028576} {"current_steps": 8730, "total_steps": 67140, "loss": 0.4937, "lr": 4.9862938672451045e-05, "epoch": 1.3002680965147453, "percentage": 13.0, "elapsed_time": "0:35:34", "remaining_time": "3:58:02", "throughput": 2356.97, "total_tokens": 5031328} {"current_steps": 8735, "total_steps": 67140, "loss": 0.6386, "lr": 4.986225824950571e-05, "epoch": 1.3010128090557045, "percentage": 13.01, "elapsed_time": "0:35:35", "remaining_time": "3:58:00", "throughput": 2357.13, "total_tokens": 5034400} {"current_steps": 8740, "total_steps": 67140, "loss": 0.7332, "lr": 4.986157614647005e-05, "epoch": 1.3017575215966637, "percentage": 13.02, "elapsed_time": "0:35:36", "remaining_time": "3:57:59", "throughput": 2357.24, "total_tokens": 5037344} {"current_steps": 8745, "total_steps": 67140, "loss": 0.7231, "lr": 4.9860892363390145e-05, "epoch": 1.302502234137623, "percentage": 13.03, "elapsed_time": "0:35:38", "remaining_time": "3:57:57", "throughput": 2357.3, "total_tokens": 5040128} {"current_steps": 8750, "total_steps": 67140, "loss": 0.6675, "lr": 4.986020690031221e-05, "epoch": 1.303246946678582, "percentage": 13.03, "elapsed_time": "0:35:39", "remaining_time": "3:57:55", "throughput": 2357.39, "total_tokens": 5042944} {"current_steps": 8755, "total_steps": 67140, "loss": 0.6615, "lr": 4.985951975728258e-05, "epoch": 1.3039916592195413, "percentage": 13.04, "elapsed_time": "0:35:40", "remaining_time": "3:57:53", "throughput": 2357.43, "total_tokens": 5045664} {"current_steps": 8760, "total_steps": 67140, "loss": 0.6177, "lr": 4.9858830934347665e-05, "epoch": 1.3047363717605005, "percentage": 13.05, "elapsed_time": "0:35:41", "remaining_time": "3:57:51", "throughput": 2357.49, "total_tokens": 5048416} {"current_steps": 8765, "total_steps": 67140, "loss": 0.7493, "lr": 4.9858140431554036e-05, "epoch": 1.3054810843014597, "percentage": 13.05, "elapsed_time": "0:35:42", "remaining_time": "3:57:49", "throughput": 2357.58, "total_tokens": 5051264} {"current_steps": 8770, "total_steps": 67140, "loss": 0.7067, "lr": 4.9857448248948336e-05, "epoch": 1.306225796842419, "percentage": 13.06, "elapsed_time": "0:35:43", "remaining_time": "3:57:47", "throughput": 2357.65, "total_tokens": 5054048} {"current_steps": 8775, "total_steps": 67140, "loss": 0.5688, "lr": 4.985675438657734e-05, "epoch": 1.3069705093833779, "percentage": 13.07, "elapsed_time": "0:35:44", "remaining_time": "3:57:45", "throughput": 2357.62, "total_tokens": 5056544} {"current_steps": 8780, "total_steps": 67140, "loss": 0.8608, "lr": 4.985605884448795e-05, "epoch": 1.307715221924337, "percentage": 13.08, "elapsed_time": "0:35:45", "remaining_time": "3:57:43", "throughput": 2357.68, "total_tokens": 5059296} {"current_steps": 8785, "total_steps": 67140, "loss": 0.7852, "lr": 4.985536162272716e-05, "epoch": 1.3084599344652963, "percentage": 13.08, "elapsed_time": "0:35:46", "remaining_time": "3:57:41", "throughput": 2357.7, "total_tokens": 5061952} {"current_steps": 8790, "total_steps": 67140, "loss": 0.798, "lr": 4.9854662721342086e-05, "epoch": 1.3092046470062555, "percentage": 13.09, "elapsed_time": "0:35:48", "remaining_time": "3:57:39", "throughput": 2357.79, "total_tokens": 5064800} {"current_steps": 8795, "total_steps": 67140, "loss": 0.7268, "lr": 4.985396214037995e-05, "epoch": 1.3099493595472147, "percentage": 13.1, "elapsed_time": "0:35:49", "remaining_time": "3:57:37", "throughput": 2357.85, "total_tokens": 5067584} {"current_steps": 8800, "total_steps": 67140, "loss": 0.826, "lr": 4.9853259879888116e-05, "epoch": 1.310694072088174, "percentage": 13.11, "elapsed_time": "0:35:50", "remaining_time": "3:57:36", "throughput": 2357.98, "total_tokens": 5070592} {"current_steps": 8805, "total_steps": 67140, "loss": 0.607, "lr": 4.9852555939914014e-05, "epoch": 1.311438784629133, "percentage": 13.11, "elapsed_time": "0:35:51", "remaining_time": "3:57:34", "throughput": 2358.09, "total_tokens": 5073504} {"current_steps": 8810, "total_steps": 67140, "loss": 0.6302, "lr": 4.9851850320505225e-05, "epoch": 1.3121834971700923, "percentage": 13.12, "elapsed_time": "0:35:52", "remaining_time": "3:57:32", "throughput": 2358.2, "total_tokens": 5076384} {"current_steps": 8815, "total_steps": 67140, "loss": 0.6518, "lr": 4.985114302170943e-05, "epoch": 1.3129282097110515, "percentage": 13.13, "elapsed_time": "0:35:53", "remaining_time": "3:57:30", "throughput": 2358.31, "total_tokens": 5079360} {"current_steps": 8820, "total_steps": 67140, "loss": 0.6874, "lr": 4.985043404357444e-05, "epoch": 1.3136729222520107, "percentage": 13.14, "elapsed_time": "0:35:54", "remaining_time": "3:57:28", "throughput": 2358.32, "total_tokens": 5081952} {"current_steps": 8825, "total_steps": 67140, "loss": 0.7217, "lr": 4.984972338614814e-05, "epoch": 1.31441763479297, "percentage": 13.14, "elapsed_time": "0:35:56", "remaining_time": "3:57:27", "throughput": 2358.47, "total_tokens": 5085024} {"current_steps": 8830, "total_steps": 67140, "loss": 0.5524, "lr": 4.984901104947857e-05, "epoch": 1.3151623473339291, "percentage": 13.15, "elapsed_time": "0:35:57", "remaining_time": "3:57:25", "throughput": 2358.47, "total_tokens": 5087584} {"current_steps": 8835, "total_steps": 67140, "loss": 0.8177, "lr": 4.984829703361386e-05, "epoch": 1.3159070598748883, "percentage": 13.16, "elapsed_time": "0:35:58", "remaining_time": "3:57:23", "throughput": 2358.56, "total_tokens": 5090464} {"current_steps": 8840, "total_steps": 67140, "loss": 0.6612, "lr": 4.984758133860227e-05, "epoch": 1.3166517724158475, "percentage": 13.17, "elapsed_time": "0:35:59", "remaining_time": "3:57:21", "throughput": 2358.67, "total_tokens": 5093376} {"current_steps": 8845, "total_steps": 67140, "loss": 0.7426, "lr": 4.984686396449214e-05, "epoch": 1.3173964849568067, "percentage": 13.17, "elapsed_time": "0:36:00", "remaining_time": "3:57:19", "throughput": 2358.8, "total_tokens": 5096416} {"current_steps": 8850, "total_steps": 67140, "loss": 0.6632, "lr": 4.984614491133197e-05, "epoch": 1.318141197497766, "percentage": 13.18, "elapsed_time": "0:36:01", "remaining_time": "3:57:18", "throughput": 2358.9, "total_tokens": 5099328} {"current_steps": 8855, "total_steps": 67140, "loss": 0.8381, "lr": 4.984542417917035e-05, "epoch": 1.3188859100387251, "percentage": 13.19, "elapsed_time": "0:36:02", "remaining_time": "3:57:16", "throughput": 2358.97, "total_tokens": 5102112} {"current_steps": 8860, "total_steps": 67140, "loss": 0.6782, "lr": 4.984470176805598e-05, "epoch": 1.3196306225796843, "percentage": 13.2, "elapsed_time": "0:36:03", "remaining_time": "3:57:14", "throughput": 2359.03, "total_tokens": 5104896} {"current_steps": 8865, "total_steps": 67140, "loss": 0.6383, "lr": 4.9843977678037666e-05, "epoch": 1.3203753351206435, "percentage": 13.2, "elapsed_time": "0:36:05", "remaining_time": "3:57:12", "throughput": 2359.08, "total_tokens": 5107648} {"current_steps": 8870, "total_steps": 67140, "loss": 0.7785, "lr": 4.984325190916435e-05, "epoch": 1.3211200476616027, "percentage": 13.21, "elapsed_time": "0:36:06", "remaining_time": "3:57:10", "throughput": 2359.16, "total_tokens": 5110432} {"current_steps": 8875, "total_steps": 67140, "loss": 0.7187, "lr": 4.984252446148508e-05, "epoch": 1.321864760202562, "percentage": 13.22, "elapsed_time": "0:36:07", "remaining_time": "3:57:08", "throughput": 2359.29, "total_tokens": 5113472} {"current_steps": 8880, "total_steps": 67140, "loss": 0.7459, "lr": 4.9841795335049006e-05, "epoch": 1.322609472743521, "percentage": 13.23, "elapsed_time": "0:36:08", "remaining_time": "3:57:07", "throughput": 2359.41, "total_tokens": 5116416} {"current_steps": 8885, "total_steps": 67140, "loss": 0.7614, "lr": 4.98410645299054e-05, "epoch": 1.3233541852844801, "percentage": 13.23, "elapsed_time": "0:36:09", "remaining_time": "3:57:05", "throughput": 2359.47, "total_tokens": 5119168} {"current_steps": 8890, "total_steps": 67140, "loss": 0.7092, "lr": 4.9840332046103656e-05, "epoch": 1.3240988978254393, "percentage": 13.24, "elapsed_time": "0:36:10", "remaining_time": "3:57:03", "throughput": 2359.46, "total_tokens": 5121696} {"current_steps": 8895, "total_steps": 67140, "loss": 0.7965, "lr": 4.9839597883693267e-05, "epoch": 1.3248436103663985, "percentage": 13.25, "elapsed_time": "0:36:11", "remaining_time": "3:57:01", "throughput": 2359.6, "total_tokens": 5124704} {"current_steps": 8900, "total_steps": 67140, "loss": 0.6582, "lr": 4.983886204272383e-05, "epoch": 1.3255883229073577, "percentage": 13.26, "elapsed_time": "0:36:12", "remaining_time": "3:56:59", "throughput": 2359.68, "total_tokens": 5127520} {"current_steps": 8905, "total_steps": 67140, "loss": 0.6785, "lr": 4.98381245232451e-05, "epoch": 1.326333035448317, "percentage": 13.26, "elapsed_time": "0:36:14", "remaining_time": "3:56:57", "throughput": 2359.7, "total_tokens": 5130176} {"current_steps": 8910, "total_steps": 67140, "loss": 0.6274, "lr": 4.98373853253069e-05, "epoch": 1.3270777479892761, "percentage": 13.27, "elapsed_time": "0:36:15", "remaining_time": "3:56:55", "throughput": 2359.81, "total_tokens": 5133152} {"current_steps": 8915, "total_steps": 67140, "loss": 0.7799, "lr": 4.983664444895917e-05, "epoch": 1.3278224605302353, "percentage": 13.28, "elapsed_time": "0:36:16", "remaining_time": "3:56:54", "throughput": 2359.91, "total_tokens": 5136064} {"current_steps": 8920, "total_steps": 67140, "loss": 0.8272, "lr": 4.983590189425198e-05, "epoch": 1.3285671730711945, "percentage": 13.29, "elapsed_time": "0:36:17", "remaining_time": "3:56:52", "throughput": 2359.97, "total_tokens": 5138848} {"current_steps": 8925, "total_steps": 67140, "loss": 0.7957, "lr": 4.9835157661235534e-05, "epoch": 1.3293118856121537, "percentage": 13.29, "elapsed_time": "0:36:18", "remaining_time": "3:56:51", "throughput": 2360.16, "total_tokens": 5142080} {"current_steps": 8930, "total_steps": 67140, "loss": 0.5847, "lr": 4.98344117499601e-05, "epoch": 1.330056598153113, "percentage": 13.3, "elapsed_time": "0:36:19", "remaining_time": "3:56:49", "throughput": 2360.31, "total_tokens": 5145152} {"current_steps": 8935, "total_steps": 67140, "loss": 0.6403, "lr": 4.983366416047608e-05, "epoch": 1.3308013106940721, "percentage": 13.31, "elapsed_time": "0:36:20", "remaining_time": "3:56:47", "throughput": 2360.36, "total_tokens": 5147936} {"current_steps": 8940, "total_steps": 67140, "loss": 0.7914, "lr": 4.983291489283401e-05, "epoch": 1.3315460232350314, "percentage": 13.32, "elapsed_time": "0:36:22", "remaining_time": "3:56:45", "throughput": 2360.49, "total_tokens": 5150944} {"current_steps": 8945, "total_steps": 67140, "loss": 0.8337, "lr": 4.983216394708451e-05, "epoch": 1.3322907357759903, "percentage": 13.32, "elapsed_time": "0:36:23", "remaining_time": "3:56:44", "throughput": 2360.61, "total_tokens": 5153920} {"current_steps": 8950, "total_steps": 67140, "loss": 0.642, "lr": 4.983141132327833e-05, "epoch": 1.3330354483169495, "percentage": 13.33, "elapsed_time": "0:36:24", "remaining_time": "3:56:42", "throughput": 2360.72, "total_tokens": 5156864} {"current_steps": 8955, "total_steps": 67140, "loss": 0.5876, "lr": 4.983065702146634e-05, "epoch": 1.3337801608579087, "percentage": 13.34, "elapsed_time": "0:36:25", "remaining_time": "3:56:40", "throughput": 2360.71, "total_tokens": 5159360} {"current_steps": 8960, "total_steps": 67140, "loss": 0.7457, "lr": 4.98299010416995e-05, "epoch": 1.334524873398868, "percentage": 13.35, "elapsed_time": "0:36:26", "remaining_time": "3:56:38", "throughput": 2360.7, "total_tokens": 5161952} {"current_steps": 8965, "total_steps": 67140, "loss": 0.5862, "lr": 4.982914338402889e-05, "epoch": 1.3352695859398271, "percentage": 13.35, "elapsed_time": "0:36:27", "remaining_time": "3:56:36", "throughput": 2360.8, "total_tokens": 5164896} {"current_steps": 8970, "total_steps": 67140, "loss": 0.5828, "lr": 4.982838404850573e-05, "epoch": 1.3360142984807863, "percentage": 13.36, "elapsed_time": "0:36:28", "remaining_time": "3:56:34", "throughput": 2360.86, "total_tokens": 5167680} {"current_steps": 8975, "total_steps": 67140, "loss": 0.7037, "lr": 4.982762303518131e-05, "epoch": 1.3367590110217455, "percentage": 13.37, "elapsed_time": "0:36:30", "remaining_time": "3:56:33", "throughput": 2361.06, "total_tokens": 5170944} {"current_steps": 8980, "total_steps": 67140, "loss": 0.5852, "lr": 4.982686034410707e-05, "epoch": 1.3375037235627047, "percentage": 13.38, "elapsed_time": "0:36:31", "remaining_time": "3:56:31", "throughput": 2361.15, "total_tokens": 5173824} {"current_steps": 8985, "total_steps": 67140, "loss": 0.5374, "lr": 4.982609597533455e-05, "epoch": 1.338248436103664, "percentage": 13.38, "elapsed_time": "0:36:32", "remaining_time": "3:56:29", "throughput": 2361.21, "total_tokens": 5176640} {"current_steps": 8990, "total_steps": 67140, "loss": 0.6367, "lr": 4.98253299289154e-05, "epoch": 1.3389931486446232, "percentage": 13.39, "elapsed_time": "0:36:33", "remaining_time": "3:56:28", "throughput": 2361.28, "total_tokens": 5179424} {"current_steps": 8995, "total_steps": 67140, "loss": 0.7761, "lr": 4.982456220490138e-05, "epoch": 1.3397378611855824, "percentage": 13.4, "elapsed_time": "0:36:34", "remaining_time": "3:56:26", "throughput": 2361.46, "total_tokens": 5182592} {"current_steps": 9000, "total_steps": 67140, "loss": 0.5559, "lr": 4.982379280334438e-05, "epoch": 1.3404825737265416, "percentage": 13.4, "elapsed_time": "0:36:35", "remaining_time": "3:56:24", "throughput": 2361.53, "total_tokens": 5185376} {"current_steps": 9005, "total_steps": 67140, "loss": 0.8362, "lr": 4.982302172429638e-05, "epoch": 1.3412272862675008, "percentage": 13.41, "elapsed_time": "0:36:36", "remaining_time": "3:56:22", "throughput": 2361.63, "total_tokens": 5188288} {"current_steps": 9010, "total_steps": 67140, "loss": 0.7225, "lr": 4.98222489678095e-05, "epoch": 1.34197199880846, "percentage": 13.42, "elapsed_time": "0:36:38", "remaining_time": "3:56:21", "throughput": 2361.75, "total_tokens": 5191264} {"current_steps": 9015, "total_steps": 67140, "loss": 0.6768, "lr": 4.9821474533935966e-05, "epoch": 1.3427167113494192, "percentage": 13.43, "elapsed_time": "0:36:39", "remaining_time": "3:56:21", "throughput": 2362.18, "total_tokens": 5195488} {"current_steps": 9020, "total_steps": 67140, "loss": 0.6289, "lr": 4.982069842272809e-05, "epoch": 1.3434614238903784, "percentage": 13.43, "elapsed_time": "0:36:40", "remaining_time": "3:56:19", "throughput": 2362.19, "total_tokens": 5198112} {"current_steps": 9025, "total_steps": 67140, "loss": 0.6998, "lr": 4.9819920634238323e-05, "epoch": 1.3442061364313376, "percentage": 13.44, "elapsed_time": "0:36:41", "remaining_time": "3:56:17", "throughput": 2362.28, "total_tokens": 5201024} {"current_steps": 9030, "total_steps": 67140, "loss": 0.7839, "lr": 4.981914116851924e-05, "epoch": 1.3449508489722968, "percentage": 13.45, "elapsed_time": "0:36:42", "remaining_time": "3:56:15", "throughput": 2362.39, "total_tokens": 5203968} {"current_steps": 9035, "total_steps": 67140, "loss": 0.6389, "lr": 4.98183600256235e-05, "epoch": 1.345695561513256, "percentage": 13.46, "elapsed_time": "0:36:43", "remaining_time": "3:56:14", "throughput": 2362.52, "total_tokens": 5206976} {"current_steps": 9040, "total_steps": 67140, "loss": 0.7372, "lr": 4.981757720560389e-05, "epoch": 1.3464402740542152, "percentage": 13.46, "elapsed_time": "0:36:45", "remaining_time": "3:56:12", "throughput": 2362.7, "total_tokens": 5210176} {"current_steps": 9045, "total_steps": 67140, "loss": 0.5689, "lr": 4.981679270851332e-05, "epoch": 1.3471849865951744, "percentage": 13.47, "elapsed_time": "0:36:46", "remaining_time": "3:56:10", "throughput": 2362.77, "total_tokens": 5213024} {"current_steps": 9050, "total_steps": 67140, "loss": 0.665, "lr": 4.981600653440479e-05, "epoch": 1.3479296991361336, "percentage": 13.48, "elapsed_time": "0:36:47", "remaining_time": "3:56:09", "throughput": 2362.91, "total_tokens": 5216064} {"current_steps": 9055, "total_steps": 67140, "loss": 0.5412, "lr": 4.981521868333144e-05, "epoch": 1.3486744116770926, "percentage": 13.49, "elapsed_time": "0:36:48", "remaining_time": "3:56:07", "throughput": 2363.07, "total_tokens": 5219200} {"current_steps": 9060, "total_steps": 67140, "loss": 0.6615, "lr": 4.98144291553465e-05, "epoch": 1.3494191242180518, "percentage": 13.49, "elapsed_time": "0:36:49", "remaining_time": "3:56:06", "throughput": 2363.24, "total_tokens": 5222336} {"current_steps": 9065, "total_steps": 67140, "loss": 0.6751, "lr": 4.981363795050332e-05, "epoch": 1.350163836759011, "percentage": 13.5, "elapsed_time": "0:36:50", "remaining_time": "3:56:04", "throughput": 2363.35, "total_tokens": 5225248} {"current_steps": 9070, "total_steps": 67140, "loss": 0.7443, "lr": 4.9812845068855384e-05, "epoch": 1.3509085492999702, "percentage": 13.51, "elapsed_time": "0:36:52", "remaining_time": "3:56:02", "throughput": 2363.5, "total_tokens": 5228320} {"current_steps": 9075, "total_steps": 67140, "loss": 0.642, "lr": 4.9812050510456254e-05, "epoch": 1.3516532618409294, "percentage": 13.52, "elapsed_time": "0:36:53", "remaining_time": "3:56:00", "throughput": 2363.53, "total_tokens": 5231008} {"current_steps": 9080, "total_steps": 67140, "loss": 0.6619, "lr": 4.9811254275359626e-05, "epoch": 1.3523979743818886, "percentage": 13.52, "elapsed_time": "0:36:54", "remaining_time": "3:55:59", "throughput": 2363.59, "total_tokens": 5233792} {"current_steps": 9085, "total_steps": 67140, "loss": 0.4988, "lr": 4.9810456363619304e-05, "epoch": 1.3531426869228478, "percentage": 13.53, "elapsed_time": "0:36:55", "remaining_time": "3:55:57", "throughput": 2363.69, "total_tokens": 5236768} {"current_steps": 9090, "total_steps": 67140, "loss": 0.6792, "lr": 4.980965677528923e-05, "epoch": 1.353887399463807, "percentage": 13.54, "elapsed_time": "0:36:56", "remaining_time": "3:55:56", "throughput": 2363.85, "total_tokens": 5239936} {"current_steps": 9095, "total_steps": 67140, "loss": 0.6897, "lr": 4.98088555104234e-05, "epoch": 1.3546321120047662, "percentage": 13.55, "elapsed_time": "0:36:57", "remaining_time": "3:55:54", "throughput": 2363.9, "total_tokens": 5242624} {"current_steps": 9100, "total_steps": 67140, "loss": 0.4956, "lr": 4.9808052569076e-05, "epoch": 1.3553768245457254, "percentage": 13.55, "elapsed_time": "0:36:58", "remaining_time": "3:55:52", "throughput": 2363.95, "total_tokens": 5245344} {"current_steps": 9105, "total_steps": 67140, "loss": 0.6061, "lr": 4.9807247951301255e-05, "epoch": 1.3561215370866846, "percentage": 13.56, "elapsed_time": "0:37:00", "remaining_time": "3:55:50", "throughput": 2364.06, "total_tokens": 5248352} {"current_steps": 9110, "total_steps": 67140, "loss": 0.7867, "lr": 4.9806441657153555e-05, "epoch": 1.3568662496276438, "percentage": 13.57, "elapsed_time": "0:37:01", "remaining_time": "3:55:49", "throughput": 2364.16, "total_tokens": 5251328} {"current_steps": 9115, "total_steps": 67140, "loss": 0.8196, "lr": 4.9805633686687394e-05, "epoch": 1.357610962168603, "percentage": 13.58, "elapsed_time": "0:37:02", "remaining_time": "3:55:47", "throughput": 2364.17, "total_tokens": 5253952} {"current_steps": 9120, "total_steps": 67140, "loss": 0.6438, "lr": 4.980482403995734e-05, "epoch": 1.358355674709562, "percentage": 13.58, "elapsed_time": "0:37:03", "remaining_time": "3:55:45", "throughput": 2364.25, "total_tokens": 5256736} {"current_steps": 9125, "total_steps": 67140, "loss": 0.677, "lr": 4.9804012717018146e-05, "epoch": 1.3591003872505212, "percentage": 13.59, "elapsed_time": "0:37:04", "remaining_time": "3:55:43", "throughput": 2364.39, "total_tokens": 5259808} {"current_steps": 9130, "total_steps": 67140, "loss": 0.6404, "lr": 4.980319971792461e-05, "epoch": 1.3598450997914804, "percentage": 13.6, "elapsed_time": "0:37:05", "remaining_time": "3:55:42", "throughput": 2364.59, "total_tokens": 5263104} {"current_steps": 9135, "total_steps": 67140, "loss": 0.6927, "lr": 4.980238504273168e-05, "epoch": 1.3605898123324396, "percentage": 13.61, "elapsed_time": "0:37:06", "remaining_time": "3:55:40", "throughput": 2364.6, "total_tokens": 5265696} {"current_steps": 9140, "total_steps": 67140, "loss": 0.5273, "lr": 4.98015686914944e-05, "epoch": 1.3613345248733988, "percentage": 13.61, "elapsed_time": "0:37:07", "remaining_time": "3:55:38", "throughput": 2364.64, "total_tokens": 5268416} {"current_steps": 9145, "total_steps": 67140, "loss": 0.6316, "lr": 4.980075066426796e-05, "epoch": 1.362079237414358, "percentage": 13.62, "elapsed_time": "0:37:09", "remaining_time": "3:55:36", "throughput": 2364.86, "total_tokens": 5271744} {"current_steps": 9150, "total_steps": 67140, "loss": 0.5981, "lr": 4.979993096110762e-05, "epoch": 1.3628239499553172, "percentage": 13.63, "elapsed_time": "0:37:10", "remaining_time": "3:55:35", "throughput": 2364.99, "total_tokens": 5274784} {"current_steps": 9155, "total_steps": 67140, "loss": 0.8802, "lr": 4.979910958206876e-05, "epoch": 1.3635686624962764, "percentage": 13.64, "elapsed_time": "0:37:11", "remaining_time": "3:55:33", "throughput": 2365.02, "total_tokens": 5277472} {"current_steps": 9160, "total_steps": 67140, "loss": 0.685, "lr": 4.9798286527206915e-05, "epoch": 1.3643133750372356, "percentage": 13.64, "elapsed_time": "0:37:12", "remaining_time": "3:55:31", "throughput": 2365.06, "total_tokens": 5280160} {"current_steps": 9165, "total_steps": 67140, "loss": 0.6391, "lr": 4.979746179657768e-05, "epoch": 1.3650580875781948, "percentage": 13.65, "elapsed_time": "0:37:13", "remaining_time": "3:55:29", "throughput": 2365.18, "total_tokens": 5283200} {"current_steps": 9170, "total_steps": 67140, "loss": 0.7704, "lr": 4.97966353902368e-05, "epoch": 1.365802800119154, "percentage": 13.66, "elapsed_time": "0:37:14", "remaining_time": "3:55:28", "throughput": 2365.37, "total_tokens": 5286432} {"current_steps": 9175, "total_steps": 67140, "loss": 0.54, "lr": 4.9795807308240115e-05, "epoch": 1.3665475126601132, "percentage": 13.67, "elapsed_time": "0:37:16", "remaining_time": "3:55:26", "throughput": 2365.44, "total_tokens": 5289248} {"current_steps": 9180, "total_steps": 67140, "loss": 0.6939, "lr": 4.979497755064359e-05, "epoch": 1.3672922252010724, "percentage": 13.67, "elapsed_time": "0:37:17", "remaining_time": "3:55:24", "throughput": 2365.5, "total_tokens": 5292064} {"current_steps": 9185, "total_steps": 67140, "loss": 0.7518, "lr": 4.979414611750329e-05, "epoch": 1.3680369377420316, "percentage": 13.68, "elapsed_time": "0:37:18", "remaining_time": "3:55:23", "throughput": 2365.56, "total_tokens": 5294848} {"current_steps": 9190, "total_steps": 67140, "loss": 0.6088, "lr": 4.97933130088754e-05, "epoch": 1.3687816502829908, "percentage": 13.69, "elapsed_time": "0:37:19", "remaining_time": "3:55:21", "throughput": 2365.57, "total_tokens": 5297472} {"current_steps": 9195, "total_steps": 67140, "loss": 0.5954, "lr": 4.9792478224816206e-05, "epoch": 1.36952636282395, "percentage": 13.7, "elapsed_time": "0:37:20", "remaining_time": "3:55:19", "throughput": 2365.66, "total_tokens": 5300320} {"current_steps": 9200, "total_steps": 67140, "loss": 0.5515, "lr": 4.979164176538215e-05, "epoch": 1.3702710753649092, "percentage": 13.7, "elapsed_time": "0:37:21", "remaining_time": "3:55:17", "throughput": 2365.72, "total_tokens": 5303104} {"current_steps": 9205, "total_steps": 67140, "loss": 0.6281, "lr": 4.979080363062974e-05, "epoch": 1.3710157879058684, "percentage": 13.71, "elapsed_time": "0:37:22", "remaining_time": "3:55:15", "throughput": 2365.83, "total_tokens": 5306048} {"current_steps": 9210, "total_steps": 67140, "loss": 0.732, "lr": 4.978996382061559e-05, "epoch": 1.3717605004468276, "percentage": 13.72, "elapsed_time": "0:37:23", "remaining_time": "3:55:14", "throughput": 2365.94, "total_tokens": 5308992} {"current_steps": 9215, "total_steps": 67140, "loss": 0.5414, "lr": 4.978912233539649e-05, "epoch": 1.3725052129877868, "percentage": 13.73, "elapsed_time": "0:37:25", "remaining_time": "3:55:12", "throughput": 2366.03, "total_tokens": 5311872} {"current_steps": 9220, "total_steps": 67140, "loss": 0.8511, "lr": 4.978827917502929e-05, "epoch": 1.373249925528746, "percentage": 13.73, "elapsed_time": "0:37:26", "remaining_time": "3:55:10", "throughput": 2366.06, "total_tokens": 5314592} {"current_steps": 9225, "total_steps": 67140, "loss": 0.5915, "lr": 4.978743433957096e-05, "epoch": 1.3739946380697052, "percentage": 13.74, "elapsed_time": "0:37:27", "remaining_time": "3:55:08", "throughput": 2366.17, "total_tokens": 5317536} {"current_steps": 9230, "total_steps": 67140, "loss": 0.7073, "lr": 4.97865878290786e-05, "epoch": 1.3747393506106642, "percentage": 13.75, "elapsed_time": "0:37:28", "remaining_time": "3:55:07", "throughput": 2366.33, "total_tokens": 5320640} {"current_steps": 9235, "total_steps": 67140, "loss": 0.6559, "lr": 4.9785739643609406e-05, "epoch": 1.3754840631516234, "percentage": 13.75, "elapsed_time": "0:37:29", "remaining_time": "3:55:05", "throughput": 2366.42, "total_tokens": 5323552} {"current_steps": 9240, "total_steps": 67140, "loss": 0.7855, "lr": 4.97848897832207e-05, "epoch": 1.3762287756925826, "percentage": 13.76, "elapsed_time": "0:37:30", "remaining_time": "3:55:03", "throughput": 2366.48, "total_tokens": 5326400} {"current_steps": 9245, "total_steps": 67140, "loss": 0.6012, "lr": 4.978403824796991e-05, "epoch": 1.3769734882335418, "percentage": 13.77, "elapsed_time": "0:37:31", "remaining_time": "3:55:02", "throughput": 2366.61, "total_tokens": 5329376} {"current_steps": 9250, "total_steps": 67140, "loss": 0.6072, "lr": 4.978318503791458e-05, "epoch": 1.377718200774501, "percentage": 13.78, "elapsed_time": "0:37:33", "remaining_time": "3:55:00", "throughput": 2366.76, "total_tokens": 5332448} {"current_steps": 9255, "total_steps": 67140, "loss": 0.6097, "lr": 4.978233015311236e-05, "epoch": 1.3784629133154602, "percentage": 13.78, "elapsed_time": "0:37:34", "remaining_time": "3:54:58", "throughput": 2366.78, "total_tokens": 5335136} {"current_steps": 9260, "total_steps": 67140, "loss": 0.8387, "lr": 4.978147359362103e-05, "epoch": 1.3792076258564194, "percentage": 13.79, "elapsed_time": "0:37:35", "remaining_time": "3:54:57", "throughput": 2366.89, "total_tokens": 5338112} {"current_steps": 9265, "total_steps": 67140, "loss": 0.7128, "lr": 4.978061535949847e-05, "epoch": 1.3799523383973786, "percentage": 13.8, "elapsed_time": "0:37:36", "remaining_time": "3:54:55", "throughput": 2367.0, "total_tokens": 5341056} {"current_steps": 9270, "total_steps": 67140, "loss": 0.6279, "lr": 4.9779755450802675e-05, "epoch": 1.3806970509383378, "percentage": 13.81, "elapsed_time": "0:37:37", "remaining_time": "3:54:53", "throughput": 2367.15, "total_tokens": 5344128} {"current_steps": 9275, "total_steps": 67140, "loss": 0.6708, "lr": 4.977889386759176e-05, "epoch": 1.381441763479297, "percentage": 13.81, "elapsed_time": "0:37:38", "remaining_time": "3:54:51", "throughput": 2367.18, "total_tokens": 5346848} {"current_steps": 9280, "total_steps": 67140, "loss": 0.7328, "lr": 4.977803060992393e-05, "epoch": 1.3821864760202562, "percentage": 13.82, "elapsed_time": "0:37:39", "remaining_time": "3:54:50", "throughput": 2367.31, "total_tokens": 5349856} {"current_steps": 9285, "total_steps": 67140, "loss": 0.7497, "lr": 4.977716567785754e-05, "epoch": 1.3829311885612154, "percentage": 13.83, "elapsed_time": "0:37:40", "remaining_time": "3:54:48", "throughput": 2367.34, "total_tokens": 5352544} {"current_steps": 9290, "total_steps": 67140, "loss": 0.5897, "lr": 4.977629907145102e-05, "epoch": 1.3836759011021746, "percentage": 13.84, "elapsed_time": "0:37:42", "remaining_time": "3:54:46", "throughput": 2367.42, "total_tokens": 5355392} {"current_steps": 9295, "total_steps": 67140, "loss": 0.681, "lr": 4.977543079076295e-05, "epoch": 1.3844206136431336, "percentage": 13.84, "elapsed_time": "0:37:43", "remaining_time": "3:54:44", "throughput": 2367.45, "total_tokens": 5358112} {"current_steps": 9300, "total_steps": 67140, "loss": 0.6802, "lr": 4.977456083585199e-05, "epoch": 1.3851653261840928, "percentage": 13.85, "elapsed_time": "0:37:44", "remaining_time": "3:54:42", "throughput": 2367.53, "total_tokens": 5360960} {"current_steps": 9305, "total_steps": 67140, "loss": 0.7854, "lr": 4.977368920677694e-05, "epoch": 1.385910038725052, "percentage": 13.86, "elapsed_time": "0:37:45", "remaining_time": "3:54:41", "throughput": 2367.54, "total_tokens": 5363616} {"current_steps": 9310, "total_steps": 67140, "loss": 0.7354, "lr": 4.97728159035967e-05, "epoch": 1.3866547512660112, "percentage": 13.87, "elapsed_time": "0:37:46", "remaining_time": "3:54:39", "throughput": 2367.56, "total_tokens": 5366240} {"current_steps": 9315, "total_steps": 67140, "loss": 0.7132, "lr": 4.9771940926370274e-05, "epoch": 1.3873994638069704, "percentage": 13.87, "elapsed_time": "0:37:47", "remaining_time": "3:54:36", "throughput": 2367.55, "total_tokens": 5368768} {"current_steps": 9320, "total_steps": 67140, "loss": 0.5941, "lr": 4.97710642751568e-05, "epoch": 1.3881441763479296, "percentage": 13.88, "elapsed_time": "0:37:48", "remaining_time": "3:54:35", "throughput": 2367.62, "total_tokens": 5371584} {"current_steps": 9325, "total_steps": 67140, "loss": 0.6108, "lr": 4.977018595001551e-05, "epoch": 1.3888888888888888, "percentage": 13.89, "elapsed_time": "0:37:49", "remaining_time": "3:54:33", "throughput": 2367.69, "total_tokens": 5374400} {"current_steps": 9330, "total_steps": 67140, "loss": 0.762, "lr": 4.9769305951005766e-05, "epoch": 1.389633601429848, "percentage": 13.9, "elapsed_time": "0:37:51", "remaining_time": "3:54:31", "throughput": 2367.77, "total_tokens": 5377280} {"current_steps": 9335, "total_steps": 67140, "loss": 0.572, "lr": 4.976842427818702e-05, "epoch": 1.3903783139708072, "percentage": 13.9, "elapsed_time": "0:37:52", "remaining_time": "3:54:29", "throughput": 2367.83, "total_tokens": 5380032} {"current_steps": 9340, "total_steps": 67140, "loss": 0.6848, "lr": 4.9767540931618874e-05, "epoch": 1.3911230265117664, "percentage": 13.91, "elapsed_time": "0:37:53", "remaining_time": "3:54:28", "throughput": 2367.99, "total_tokens": 5383200} {"current_steps": 9345, "total_steps": 67140, "loss": 0.6648, "lr": 4.9766655911361e-05, "epoch": 1.3918677390527256, "percentage": 13.92, "elapsed_time": "0:37:54", "remaining_time": "3:54:26", "throughput": 2368.16, "total_tokens": 5386336} {"current_steps": 9350, "total_steps": 67140, "loss": 0.8842, "lr": 4.976576921747322e-05, "epoch": 1.3926124515936849, "percentage": 13.93, "elapsed_time": "0:37:55", "remaining_time": "3:54:24", "throughput": 2368.22, "total_tokens": 5389120} {"current_steps": 9355, "total_steps": 67140, "loss": 0.6631, "lr": 4.976488085001545e-05, "epoch": 1.393357164134644, "percentage": 13.93, "elapsed_time": "0:37:56", "remaining_time": "3:54:23", "throughput": 2368.33, "total_tokens": 5392064} {"current_steps": 9360, "total_steps": 67140, "loss": 0.8132, "lr": 4.976399080904771e-05, "epoch": 1.3941018766756033, "percentage": 13.94, "elapsed_time": "0:37:57", "remaining_time": "3:54:21", "throughput": 2368.39, "total_tokens": 5394880} {"current_steps": 9365, "total_steps": 67140, "loss": 0.4974, "lr": 4.9763099094630164e-05, "epoch": 1.3948465892165625, "percentage": 13.95, "elapsed_time": "0:37:58", "remaining_time": "3:54:19", "throughput": 2368.47, "total_tokens": 5397696} {"current_steps": 9370, "total_steps": 67140, "loss": 0.6916, "lr": 4.976220570682305e-05, "epoch": 1.3955913017575217, "percentage": 13.96, "elapsed_time": "0:38:00", "remaining_time": "3:54:17", "throughput": 2368.54, "total_tokens": 5400480} {"current_steps": 9375, "total_steps": 67140, "loss": 0.779, "lr": 4.976131064568675e-05, "epoch": 1.3963360142984809, "percentage": 13.96, "elapsed_time": "0:38:01", "remaining_time": "3:54:16", "throughput": 2368.65, "total_tokens": 5403488} {"current_steps": 9380, "total_steps": 67140, "loss": 0.6821, "lr": 4.976041391128175e-05, "epoch": 1.39708072683944, "percentage": 13.97, "elapsed_time": "0:38:02", "remaining_time": "3:54:14", "throughput": 2368.7, "total_tokens": 5406240} {"current_steps": 9385, "total_steps": 67140, "loss": 0.5835, "lr": 4.975951550366866e-05, "epoch": 1.3978254393803993, "percentage": 13.98, "elapsed_time": "0:38:03", "remaining_time": "3:54:12", "throughput": 2368.79, "total_tokens": 5409216} {"current_steps": 9390, "total_steps": 67140, "loss": 0.9074, "lr": 4.9758615422908164e-05, "epoch": 1.3985701519213585, "percentage": 13.99, "elapsed_time": "0:38:04", "remaining_time": "3:54:11", "throughput": 2368.87, "total_tokens": 5412064} {"current_steps": 9395, "total_steps": 67140, "loss": 0.7526, "lr": 4.97577136690611e-05, "epoch": 1.3993148644623177, "percentage": 13.99, "elapsed_time": "0:38:05", "remaining_time": "3:54:09", "throughput": 2369.0, "total_tokens": 5415104} {"current_steps": 9400, "total_steps": 67140, "loss": 0.6935, "lr": 4.975681024218841e-05, "epoch": 1.4000595770032767, "percentage": 14.0, "elapsed_time": "0:38:06", "remaining_time": "3:54:07", "throughput": 2369.09, "total_tokens": 5418048} {"current_steps": 9405, "total_steps": 67140, "loss": 0.6601, "lr": 4.9755905142351133e-05, "epoch": 1.4008042895442359, "percentage": 14.01, "elapsed_time": "0:38:08", "remaining_time": "3:54:06", "throughput": 2369.21, "total_tokens": 5421024} {"current_steps": 9410, "total_steps": 67140, "loss": 0.6796, "lr": 4.975499836961044e-05, "epoch": 1.401549002085195, "percentage": 14.02, "elapsed_time": "0:38:09", "remaining_time": "3:54:04", "throughput": 2369.21, "total_tokens": 5423616} {"current_steps": 9415, "total_steps": 67140, "loss": 0.6394, "lr": 4.97540899240276e-05, "epoch": 1.4022937146261543, "percentage": 14.02, "elapsed_time": "0:38:10", "remaining_time": "3:54:02", "throughput": 2369.27, "total_tokens": 5426368} {"current_steps": 9420, "total_steps": 67140, "loss": 0.6186, "lr": 4.9753179805664e-05, "epoch": 1.4030384271671135, "percentage": 14.03, "elapsed_time": "0:38:11", "remaining_time": "3:54:00", "throughput": 2369.32, "total_tokens": 5429120} {"current_steps": 9425, "total_steps": 67140, "loss": 0.8234, "lr": 4.975226801458116e-05, "epoch": 1.4037831397080727, "percentage": 14.04, "elapsed_time": "0:38:12", "remaining_time": "3:53:58", "throughput": 2369.39, "total_tokens": 5431936} {"current_steps": 9430, "total_steps": 67140, "loss": 0.7001, "lr": 4.975135455084067e-05, "epoch": 1.4045278522490319, "percentage": 14.05, "elapsed_time": "0:38:13", "remaining_time": "3:53:56", "throughput": 2369.48, "total_tokens": 5434816} {"current_steps": 9435, "total_steps": 67140, "loss": 0.6618, "lr": 4.975043941450428e-05, "epoch": 1.405272564789991, "percentage": 14.05, "elapsed_time": "0:38:14", "remaining_time": "3:53:55", "throughput": 2369.54, "total_tokens": 5437632} {"current_steps": 9440, "total_steps": 67140, "loss": 0.5752, "lr": 4.9749522605633825e-05, "epoch": 1.4060172773309503, "percentage": 14.06, "elapsed_time": "0:38:15", "remaining_time": "3:53:53", "throughput": 2369.59, "total_tokens": 5440352} {"current_steps": 9445, "total_steps": 67140, "loss": 0.6957, "lr": 4.9748604124291254e-05, "epoch": 1.4067619898719095, "percentage": 14.07, "elapsed_time": "0:38:17", "remaining_time": "3:53:51", "throughput": 2369.72, "total_tokens": 5443424} {"current_steps": 9450, "total_steps": 67140, "loss": 0.5697, "lr": 4.974768397053863e-05, "epoch": 1.4075067024128687, "percentage": 14.08, "elapsed_time": "0:38:18", "remaining_time": "3:53:49", "throughput": 2369.8, "total_tokens": 5446272} {"current_steps": 9455, "total_steps": 67140, "loss": 0.7152, "lr": 4.9746762144438144e-05, "epoch": 1.4082514149538279, "percentage": 14.08, "elapsed_time": "0:38:19", "remaining_time": "3:53:48", "throughput": 2369.93, "total_tokens": 5449344} {"current_steps": 9460, "total_steps": 67140, "loss": 0.6539, "lr": 4.974583864605209e-05, "epoch": 1.408996127494787, "percentage": 14.09, "elapsed_time": "0:38:20", "remaining_time": "3:53:47", "throughput": 2370.1, "total_tokens": 5452544} {"current_steps": 9465, "total_steps": 67140, "loss": 0.8048, "lr": 4.974491347544287e-05, "epoch": 1.409740840035746, "percentage": 14.1, "elapsed_time": "0:38:21", "remaining_time": "3:53:45", "throughput": 2370.14, "total_tokens": 5455200} {"current_steps": 9470, "total_steps": 67140, "loss": 0.5867, "lr": 4.974398663267299e-05, "epoch": 1.4104855525767053, "percentage": 14.1, "elapsed_time": "0:38:22", "remaining_time": "3:53:42", "throughput": 2370.14, "total_tokens": 5457760} {"current_steps": 9475, "total_steps": 67140, "loss": 0.6897, "lr": 4.9743058117805105e-05, "epoch": 1.4112302651176645, "percentage": 14.11, "elapsed_time": "0:38:23", "remaining_time": "3:53:41", "throughput": 2370.2, "total_tokens": 5460576} {"current_steps": 9480, "total_steps": 67140, "loss": 0.6229, "lr": 4.974212793090195e-05, "epoch": 1.4119749776586237, "percentage": 14.12, "elapsed_time": "0:38:24", "remaining_time": "3:53:39", "throughput": 2370.29, "total_tokens": 5463456} {"current_steps": 9485, "total_steps": 67140, "loss": 0.6425, "lr": 4.974119607202638e-05, "epoch": 1.4127196901995829, "percentage": 14.13, "elapsed_time": "0:38:26", "remaining_time": "3:53:37", "throughput": 2370.33, "total_tokens": 5466208} {"current_steps": 9490, "total_steps": 67140, "loss": 0.5896, "lr": 4.974026254124138e-05, "epoch": 1.413464402740542, "percentage": 14.13, "elapsed_time": "0:38:27", "remaining_time": "3:53:36", "throughput": 2370.45, "total_tokens": 5469184} {"current_steps": 9495, "total_steps": 67140, "loss": 0.7589, "lr": 4.973932733861001e-05, "epoch": 1.4142091152815013, "percentage": 14.14, "elapsed_time": "0:38:28", "remaining_time": "3:53:34", "throughput": 2370.54, "total_tokens": 5472096} {"current_steps": 9500, "total_steps": 67140, "loss": 0.6185, "lr": 4.9738390464195486e-05, "epoch": 1.4149538278224605, "percentage": 14.15, "elapsed_time": "0:38:29", "remaining_time": "3:53:32", "throughput": 2370.57, "total_tokens": 5474752} {"current_steps": 9505, "total_steps": 67140, "loss": 0.6476, "lr": 4.973745191806112e-05, "epoch": 1.4156985403634197, "percentage": 14.16, "elapsed_time": "0:38:30", "remaining_time": "3:53:30", "throughput": 2370.69, "total_tokens": 5477792} {"current_steps": 9510, "total_steps": 67140, "loss": 0.7286, "lr": 4.9736511700270324e-05, "epoch": 1.416443252904379, "percentage": 14.16, "elapsed_time": "0:38:31", "remaining_time": "3:53:29", "throughput": 2370.82, "total_tokens": 5480864} {"current_steps": 9515, "total_steps": 67140, "loss": 0.7164, "lr": 4.973556981088664e-05, "epoch": 1.417187965445338, "percentage": 14.17, "elapsed_time": "0:38:32", "remaining_time": "3:53:27", "throughput": 2370.85, "total_tokens": 5483584} {"current_steps": 9520, "total_steps": 67140, "loss": 0.5586, "lr": 4.9734626249973715e-05, "epoch": 1.4179326779862973, "percentage": 14.18, "elapsed_time": "0:38:34", "remaining_time": "3:53:25", "throughput": 2370.9, "total_tokens": 5486368} {"current_steps": 9525, "total_steps": 67140, "loss": 0.819, "lr": 4.973368101759531e-05, "epoch": 1.4186773905272565, "percentage": 14.19, "elapsed_time": "0:38:35", "remaining_time": "3:53:24", "throughput": 2371.0, "total_tokens": 5489344} {"current_steps": 9530, "total_steps": 67140, "loss": 0.7683, "lr": 4.97327341138153e-05, "epoch": 1.4194221030682157, "percentage": 14.19, "elapsed_time": "0:38:36", "remaining_time": "3:53:22", "throughput": 2371.14, "total_tokens": 5492416} {"current_steps": 9535, "total_steps": 67140, "loss": 0.8204, "lr": 4.973178553869767e-05, "epoch": 1.420166815609175, "percentage": 14.2, "elapsed_time": "0:38:37", "remaining_time": "3:53:21", "throughput": 2371.27, "total_tokens": 5495520} {"current_steps": 9540, "total_steps": 67140, "loss": 0.6083, "lr": 4.973083529230654e-05, "epoch": 1.420911528150134, "percentage": 14.21, "elapsed_time": "0:38:38", "remaining_time": "3:53:19", "throughput": 2371.33, "total_tokens": 5498272} {"current_steps": 9545, "total_steps": 67140, "loss": 0.664, "lr": 4.97298833747061e-05, "epoch": 1.4216562406910933, "percentage": 14.22, "elapsed_time": "0:38:39", "remaining_time": "3:53:17", "throughput": 2371.45, "total_tokens": 5501344} {"current_steps": 9550, "total_steps": 67140, "loss": 0.6473, "lr": 4.972892978596069e-05, "epoch": 1.4224009532320525, "percentage": 14.22, "elapsed_time": "0:38:40", "remaining_time": "3:53:16", "throughput": 2371.55, "total_tokens": 5504352} {"current_steps": 9555, "total_steps": 67140, "loss": 0.5693, "lr": 4.972797452613474e-05, "epoch": 1.4231456657730117, "percentage": 14.23, "elapsed_time": "0:38:42", "remaining_time": "3:53:14", "throughput": 2371.64, "total_tokens": 5507232} {"current_steps": 9560, "total_steps": 67140, "loss": 0.8109, "lr": 4.972701759529281e-05, "epoch": 1.423890378313971, "percentage": 14.24, "elapsed_time": "0:38:43", "remaining_time": "3:53:13", "throughput": 2371.75, "total_tokens": 5510208} {"current_steps": 9565, "total_steps": 67140, "loss": 0.5829, "lr": 4.972605899349957e-05, "epoch": 1.4246350908549301, "percentage": 14.25, "elapsed_time": "0:38:44", "remaining_time": "3:53:11", "throughput": 2371.78, "total_tokens": 5512896} {"current_steps": 9570, "total_steps": 67140, "loss": 0.6657, "lr": 4.9725098720819784e-05, "epoch": 1.4253798033958893, "percentage": 14.25, "elapsed_time": "0:38:45", "remaining_time": "3:53:09", "throughput": 2371.86, "total_tokens": 5515808} {"current_steps": 9575, "total_steps": 67140, "loss": 0.6357, "lr": 4.9724136777318354e-05, "epoch": 1.4261245159368483, "percentage": 14.26, "elapsed_time": "0:38:46", "remaining_time": "3:53:07", "throughput": 2371.96, "total_tokens": 5518752} {"current_steps": 9580, "total_steps": 67140, "loss": 0.63, "lr": 4.972317316306028e-05, "epoch": 1.4268692284778075, "percentage": 14.27, "elapsed_time": "0:38:47", "remaining_time": "3:53:06", "throughput": 2372.03, "total_tokens": 5521632} {"current_steps": 9585, "total_steps": 67140, "loss": 0.6404, "lr": 4.972220787811068e-05, "epoch": 1.4276139410187667, "percentage": 14.28, "elapsed_time": "0:38:48", "remaining_time": "3:53:04", "throughput": 2372.15, "total_tokens": 5524704} {"current_steps": 9590, "total_steps": 67140, "loss": 0.6806, "lr": 4.972124092253479e-05, "epoch": 1.428358653559726, "percentage": 14.28, "elapsed_time": "0:38:50", "remaining_time": "3:53:03", "throughput": 2372.23, "total_tokens": 5527584} {"current_steps": 9595, "total_steps": 67140, "loss": 0.8443, "lr": 4.9720272296397946e-05, "epoch": 1.4291033661006851, "percentage": 14.29, "elapsed_time": "0:38:51", "remaining_time": "3:53:01", "throughput": 2372.26, "total_tokens": 5530240} {"current_steps": 9600, "total_steps": 67140, "loss": 0.7161, "lr": 4.9719301999765605e-05, "epoch": 1.4298480786416443, "percentage": 14.3, "elapsed_time": "0:38:52", "remaining_time": "3:52:59", "throughput": 2372.32, "total_tokens": 5532992} {"current_steps": 9605, "total_steps": 67140, "loss": 0.6329, "lr": 4.971833003270333e-05, "epoch": 1.4305927911826035, "percentage": 14.31, "elapsed_time": "0:38:53", "remaining_time": "3:52:57", "throughput": 2372.36, "total_tokens": 5535712} {"current_steps": 9610, "total_steps": 67140, "loss": 0.7237, "lr": 4.9717356395276814e-05, "epoch": 1.4313375037235627, "percentage": 14.31, "elapsed_time": "0:38:54", "remaining_time": "3:52:56", "throughput": 2372.59, "total_tokens": 5539168} {"current_steps": 9615, "total_steps": 67140, "loss": 0.6502, "lr": 4.971638108755186e-05, "epoch": 1.432082216264522, "percentage": 14.32, "elapsed_time": "0:38:55", "remaining_time": "3:52:54", "throughput": 2372.69, "total_tokens": 5542112} {"current_steps": 9620, "total_steps": 67140, "loss": 0.6917, "lr": 4.9715404109594347e-05, "epoch": 1.4328269288054811, "percentage": 14.33, "elapsed_time": "0:38:56", "remaining_time": "3:52:53", "throughput": 2372.83, "total_tokens": 5545248} {"current_steps": 9625, "total_steps": 67140, "loss": 0.6438, "lr": 4.971442546147031e-05, "epoch": 1.4335716413464403, "percentage": 14.34, "elapsed_time": "0:38:58", "remaining_time": "3:52:51", "throughput": 2372.92, "total_tokens": 5548128} {"current_steps": 9630, "total_steps": 67140, "loss": 0.634, "lr": 4.9713445143245876e-05, "epoch": 1.4343163538873995, "percentage": 14.34, "elapsed_time": "0:38:59", "remaining_time": "3:52:49", "throughput": 2372.91, "total_tokens": 5550720} {"current_steps": 9635, "total_steps": 67140, "loss": 0.8276, "lr": 4.9712463154987305e-05, "epoch": 1.4350610664283587, "percentage": 14.35, "elapsed_time": "0:39:00", "remaining_time": "3:52:47", "throughput": 2372.99, "total_tokens": 5553600} {"current_steps": 9640, "total_steps": 67140, "loss": 0.6343, "lr": 4.9711479496760947e-05, "epoch": 1.4358057789693177, "percentage": 14.36, "elapsed_time": "0:39:01", "remaining_time": "3:52:46", "throughput": 2373.13, "total_tokens": 5556768} {"current_steps": 9645, "total_steps": 67140, "loss": 0.6709, "lr": 4.971049416863327e-05, "epoch": 1.436550491510277, "percentage": 14.37, "elapsed_time": "0:39:02", "remaining_time": "3:52:44", "throughput": 2373.21, "total_tokens": 5559648} {"current_steps": 9650, "total_steps": 67140, "loss": 0.5009, "lr": 4.9709507170670866e-05, "epoch": 1.4372952040512361, "percentage": 14.37, "elapsed_time": "0:39:03", "remaining_time": "3:52:43", "throughput": 2373.24, "total_tokens": 5562368} {"current_steps": 9655, "total_steps": 67140, "loss": 0.6582, "lr": 4.970851850294043e-05, "epoch": 1.4380399165921953, "percentage": 14.38, "elapsed_time": "0:39:04", "remaining_time": "3:52:41", "throughput": 2373.3, "total_tokens": 5565184} {"current_steps": 9660, "total_steps": 67140, "loss": 0.499, "lr": 4.970752816550877e-05, "epoch": 1.4387846291331545, "percentage": 14.39, "elapsed_time": "0:39:06", "remaining_time": "3:52:39", "throughput": 2373.47, "total_tokens": 5568352} {"current_steps": 9665, "total_steps": 67140, "loss": 0.7235, "lr": 4.970653615844281e-05, "epoch": 1.4395293416741137, "percentage": 14.4, "elapsed_time": "0:39:07", "remaining_time": "3:52:38", "throughput": 2373.52, "total_tokens": 5571136} {"current_steps": 9670, "total_steps": 67140, "loss": 0.74, "lr": 4.970554248180959e-05, "epoch": 1.440274054215073, "percentage": 14.4, "elapsed_time": "0:39:08", "remaining_time": "3:52:36", "throughput": 2373.59, "total_tokens": 5573952} {"current_steps": 9675, "total_steps": 67140, "loss": 0.7041, "lr": 4.970454713567625e-05, "epoch": 1.4410187667560321, "percentage": 14.41, "elapsed_time": "0:39:09", "remaining_time": "3:52:34", "throughput": 2373.74, "total_tokens": 5577056} {"current_steps": 9680, "total_steps": 67140, "loss": 0.7301, "lr": 4.970355012011005e-05, "epoch": 1.4417634792969913, "percentage": 14.42, "elapsed_time": "0:39:10", "remaining_time": "3:52:32", "throughput": 2373.7, "total_tokens": 5579520} {"current_steps": 9685, "total_steps": 67140, "loss": 0.5669, "lr": 4.970255143517838e-05, "epoch": 1.4425081918379505, "percentage": 14.43, "elapsed_time": "0:39:11", "remaining_time": "3:52:31", "throughput": 2373.82, "total_tokens": 5582496} {"current_steps": 9690, "total_steps": 67140, "loss": 0.6093, "lr": 4.9701551080948714e-05, "epoch": 1.4432529043789097, "percentage": 14.43, "elapsed_time": "0:39:12", "remaining_time": "3:52:29", "throughput": 2373.87, "total_tokens": 5585280} {"current_steps": 9695, "total_steps": 67140, "loss": 0.6805, "lr": 4.970054905748865e-05, "epoch": 1.443997616919869, "percentage": 14.44, "elapsed_time": "0:39:13", "remaining_time": "3:52:27", "throughput": 2373.87, "total_tokens": 5587872} {"current_steps": 9700, "total_steps": 67140, "loss": 0.5886, "lr": 4.969954536486592e-05, "epoch": 1.4447423294608281, "percentage": 14.45, "elapsed_time": "0:39:15", "remaining_time": "3:52:25", "throughput": 2373.96, "total_tokens": 5590784} {"current_steps": 9705, "total_steps": 67140, "loss": 0.7456, "lr": 4.969854000314833e-05, "epoch": 1.4454870420017873, "percentage": 14.45, "elapsed_time": "0:39:16", "remaining_time": "3:52:23", "throughput": 2373.97, "total_tokens": 5593408} {"current_steps": 9710, "total_steps": 67140, "loss": 0.6217, "lr": 4.9697532972403816e-05, "epoch": 1.4462317545427466, "percentage": 14.46, "elapsed_time": "0:39:17", "remaining_time": "3:52:22", "throughput": 2374.1, "total_tokens": 5596448} {"current_steps": 9715, "total_steps": 67140, "loss": 0.8271, "lr": 4.969652427270044e-05, "epoch": 1.4469764670837058, "percentage": 14.47, "elapsed_time": "0:39:18", "remaining_time": "3:52:20", "throughput": 2374.15, "total_tokens": 5599232} {"current_steps": 9720, "total_steps": 67140, "loss": 0.5927, "lr": 4.969551390410636e-05, "epoch": 1.447721179624665, "percentage": 14.48, "elapsed_time": "0:39:19", "remaining_time": "3:52:18", "throughput": 2374.21, "total_tokens": 5601984} {"current_steps": 9725, "total_steps": 67140, "loss": 0.8584, "lr": 4.969450186668986e-05, "epoch": 1.4484658921656242, "percentage": 14.48, "elapsed_time": "0:39:20", "remaining_time": "3:52:16", "throughput": 2374.3, "total_tokens": 5604896} {"current_steps": 9730, "total_steps": 67140, "loss": 0.7003, "lr": 4.969348816051932e-05, "epoch": 1.4492106047065834, "percentage": 14.49, "elapsed_time": "0:39:21", "remaining_time": "3:52:15", "throughput": 2374.47, "total_tokens": 5608096} {"current_steps": 9735, "total_steps": 67140, "loss": 0.6461, "lr": 4.9692472785663244e-05, "epoch": 1.4499553172475426, "percentage": 14.5, "elapsed_time": "0:39:22", "remaining_time": "3:52:13", "throughput": 2374.54, "total_tokens": 5610912} {"current_steps": 9740, "total_steps": 67140, "loss": 0.646, "lr": 4.9691455742190266e-05, "epoch": 1.4507000297885018, "percentage": 14.51, "elapsed_time": "0:39:24", "remaining_time": "3:52:12", "throughput": 2374.7, "total_tokens": 5614080} {"current_steps": 9745, "total_steps": 67140, "loss": 0.6848, "lr": 4.969043703016908e-05, "epoch": 1.4514447423294607, "percentage": 14.51, "elapsed_time": "0:39:25", "remaining_time": "3:52:10", "throughput": 2374.7, "total_tokens": 5616704} {"current_steps": 9750, "total_steps": 67140, "loss": 0.6535, "lr": 4.9689416649668554e-05, "epoch": 1.45218945487042, "percentage": 14.52, "elapsed_time": "0:39:26", "remaining_time": "3:52:08", "throughput": 2374.8, "total_tokens": 5619648} {"current_steps": 9755, "total_steps": 67140, "loss": 0.596, "lr": 4.9688394600757624e-05, "epoch": 1.4529341674113792, "percentage": 14.53, "elapsed_time": "0:39:27", "remaining_time": "3:52:07", "throughput": 2374.85, "total_tokens": 5622432} {"current_steps": 9760, "total_steps": 67140, "loss": 0.638, "lr": 4.968737088350536e-05, "epoch": 1.4536788799523384, "percentage": 14.54, "elapsed_time": "0:39:28", "remaining_time": "3:52:05", "throughput": 2374.85, "total_tokens": 5624992} {"current_steps": 9765, "total_steps": 67140, "loss": 0.5836, "lr": 4.9686345497980945e-05, "epoch": 1.4544235924932976, "percentage": 14.54, "elapsed_time": "0:39:29", "remaining_time": "3:52:03", "throughput": 2374.93, "total_tokens": 5627872} {"current_steps": 9770, "total_steps": 67140, "loss": 0.604, "lr": 4.968531844425367e-05, "epoch": 1.4551683050342568, "percentage": 14.55, "elapsed_time": "0:39:30", "remaining_time": "3:52:01", "throughput": 2374.98, "total_tokens": 5630688} {"current_steps": 9775, "total_steps": 67140, "loss": 0.8111, "lr": 4.968428972239294e-05, "epoch": 1.455913017575216, "percentage": 14.56, "elapsed_time": "0:39:31", "remaining_time": "3:52:00", "throughput": 2375.05, "total_tokens": 5633568} {"current_steps": 9780, "total_steps": 67140, "loss": 0.7386, "lr": 4.9683259332468265e-05, "epoch": 1.4566577301161752, "percentage": 14.57, "elapsed_time": "0:39:33", "remaining_time": "3:51:58", "throughput": 2375.08, "total_tokens": 5636288} {"current_steps": 9785, "total_steps": 67140, "loss": 0.6128, "lr": 4.968222727454929e-05, "epoch": 1.4574024426571344, "percentage": 14.57, "elapsed_time": "0:39:34", "remaining_time": "3:51:56", "throughput": 2375.16, "total_tokens": 5639200} {"current_steps": 9790, "total_steps": 67140, "loss": 0.5823, "lr": 4.9681193548705736e-05, "epoch": 1.4581471551980936, "percentage": 14.58, "elapsed_time": "0:39:35", "remaining_time": "3:51:55", "throughput": 2375.26, "total_tokens": 5642176} {"current_steps": 9795, "total_steps": 67140, "loss": 0.6598, "lr": 4.9680158155007474e-05, "epoch": 1.4588918677390528, "percentage": 14.59, "elapsed_time": "0:39:36", "remaining_time": "3:51:53", "throughput": 2375.44, "total_tokens": 5645472} {"current_steps": 9800, "total_steps": 67140, "loss": 0.6758, "lr": 4.967912109352446e-05, "epoch": 1.459636580280012, "percentage": 14.6, "elapsed_time": "0:39:37", "remaining_time": "3:51:52", "throughput": 2375.53, "total_tokens": 5648384} {"current_steps": 9805, "total_steps": 67140, "loss": 0.6704, "lr": 4.9678082364326786e-05, "epoch": 1.4603812928209712, "percentage": 14.6, "elapsed_time": "0:39:38", "remaining_time": "3:51:50", "throughput": 2375.61, "total_tokens": 5651296} {"current_steps": 9810, "total_steps": 67140, "loss": 0.7082, "lr": 4.9677041967484635e-05, "epoch": 1.4611260053619302, "percentage": 14.61, "elapsed_time": "0:39:40", "remaining_time": "3:51:48", "throughput": 2375.66, "total_tokens": 5654080} {"current_steps": 9815, "total_steps": 67140, "loss": 0.6893, "lr": 4.967599990306832e-05, "epoch": 1.4618707179028894, "percentage": 14.62, "elapsed_time": "0:39:41", "remaining_time": "3:51:46", "throughput": 2375.65, "total_tokens": 5656608} {"current_steps": 9820, "total_steps": 67140, "loss": 0.7881, "lr": 4.967495617114826e-05, "epoch": 1.4626154304438486, "percentage": 14.63, "elapsed_time": "0:39:42", "remaining_time": "3:51:45", "throughput": 2375.68, "total_tokens": 5659328} {"current_steps": 9825, "total_steps": 67140, "loss": 0.6365, "lr": 4.9673910771794974e-05, "epoch": 1.4633601429848078, "percentage": 14.63, "elapsed_time": "0:39:43", "remaining_time": "3:51:43", "throughput": 2375.77, "total_tokens": 5662240} {"current_steps": 9830, "total_steps": 67140, "loss": 0.6961, "lr": 4.967286370507912e-05, "epoch": 1.464104855525767, "percentage": 14.64, "elapsed_time": "0:39:44", "remaining_time": "3:51:41", "throughput": 2375.91, "total_tokens": 5665376} {"current_steps": 9835, "total_steps": 67140, "loss": 0.6834, "lr": 4.967181497107145e-05, "epoch": 1.4648495680667262, "percentage": 14.65, "elapsed_time": "0:39:45", "remaining_time": "3:51:40", "throughput": 2376.05, "total_tokens": 5668480} {"current_steps": 9840, "total_steps": 67140, "loss": 0.7333, "lr": 4.967076456984283e-05, "epoch": 1.4655942806076854, "percentage": 14.66, "elapsed_time": "0:39:46", "remaining_time": "3:51:38", "throughput": 2376.11, "total_tokens": 5671296} {"current_steps": 9845, "total_steps": 67140, "loss": 0.7823, "lr": 4.966971250146425e-05, "epoch": 1.4663389931486446, "percentage": 14.66, "elapsed_time": "0:39:47", "remaining_time": "3:51:36", "throughput": 2376.15, "total_tokens": 5674048} {"current_steps": 9850, "total_steps": 67140, "loss": 0.5135, "lr": 4.966865876600679e-05, "epoch": 1.4670837056896038, "percentage": 14.67, "elapsed_time": "0:39:48", "remaining_time": "3:51:34", "throughput": 2376.13, "total_tokens": 5676544} {"current_steps": 9855, "total_steps": 67140, "loss": 0.6441, "lr": 4.9667603363541676e-05, "epoch": 1.467828418230563, "percentage": 14.68, "elapsed_time": "0:39:50", "remaining_time": "3:51:33", "throughput": 2376.18, "total_tokens": 5679296} {"current_steps": 9860, "total_steps": 67140, "loss": 0.5325, "lr": 4.9666546294140216e-05, "epoch": 1.4685731307715222, "percentage": 14.69, "elapsed_time": "0:39:51", "remaining_time": "3:51:31", "throughput": 2376.22, "total_tokens": 5682016} {"current_steps": 9865, "total_steps": 67140, "loss": 0.6886, "lr": 4.9665487557873834e-05, "epoch": 1.4693178433124814, "percentage": 14.69, "elapsed_time": "0:39:52", "remaining_time": "3:51:30", "throughput": 2376.42, "total_tokens": 5685376} {"current_steps": 9870, "total_steps": 67140, "loss": 0.6655, "lr": 4.9664427154814094e-05, "epoch": 1.4700625558534406, "percentage": 14.7, "elapsed_time": "0:39:53", "remaining_time": "3:51:28", "throughput": 2376.49, "total_tokens": 5688256} {"current_steps": 9875, "total_steps": 67140, "loss": 0.8039, "lr": 4.966336508503265e-05, "epoch": 1.4708072683943998, "percentage": 14.71, "elapsed_time": "0:39:54", "remaining_time": "3:51:27", "throughput": 2376.63, "total_tokens": 5691392} {"current_steps": 9880, "total_steps": 67140, "loss": 0.8597, "lr": 4.966230134860126e-05, "epoch": 1.471551980935359, "percentage": 14.72, "elapsed_time": "0:39:55", "remaining_time": "3:51:25", "throughput": 2376.7, "total_tokens": 5694176} {"current_steps": 9885, "total_steps": 67140, "loss": 0.7226, "lr": 4.966123594559182e-05, "epoch": 1.4722966934763182, "percentage": 14.72, "elapsed_time": "0:39:56", "remaining_time": "3:51:23", "throughput": 2376.79, "total_tokens": 5697088} {"current_steps": 9890, "total_steps": 67140, "loss": 0.7238, "lr": 4.966016887607631e-05, "epoch": 1.4730414060172774, "percentage": 14.73, "elapsed_time": "0:39:58", "remaining_time": "3:51:21", "throughput": 2376.8, "total_tokens": 5699776} {"current_steps": 9895, "total_steps": 67140, "loss": 0.7223, "lr": 4.9659100140126856e-05, "epoch": 1.4737861185582366, "percentage": 14.74, "elapsed_time": "0:39:59", "remaining_time": "3:51:20", "throughput": 2376.95, "total_tokens": 5702912} {"current_steps": 9900, "total_steps": 67140, "loss": 0.7983, "lr": 4.965802973781567e-05, "epoch": 1.4745308310991958, "percentage": 14.75, "elapsed_time": "0:40:00", "remaining_time": "3:51:18", "throughput": 2376.99, "total_tokens": 5705664} {"current_steps": 9905, "total_steps": 67140, "loss": 0.5791, "lr": 4.965695766921509e-05, "epoch": 1.475275543640155, "percentage": 14.75, "elapsed_time": "0:40:01", "remaining_time": "3:51:16", "throughput": 2377.05, "total_tokens": 5708512} {"current_steps": 9910, "total_steps": 67140, "loss": 0.7057, "lr": 4.965588393439755e-05, "epoch": 1.4760202561811142, "percentage": 14.76, "elapsed_time": "0:40:02", "remaining_time": "3:51:15", "throughput": 2377.12, "total_tokens": 5711360} {"current_steps": 9915, "total_steps": 67140, "loss": 0.8039, "lr": 4.965480853343563e-05, "epoch": 1.4767649687220734, "percentage": 14.77, "elapsed_time": "0:40:03", "remaining_time": "3:51:13", "throughput": 2377.08, "total_tokens": 5713792} {"current_steps": 9920, "total_steps": 67140, "loss": 0.6789, "lr": 4.9653731466401975e-05, "epoch": 1.4775096812630324, "percentage": 14.78, "elapsed_time": "0:40:04", "remaining_time": "3:51:11", "throughput": 2377.03, "total_tokens": 5716256} {"current_steps": 9925, "total_steps": 67140, "loss": 0.6133, "lr": 4.965265273336939e-05, "epoch": 1.4782543938039916, "percentage": 14.78, "elapsed_time": "0:40:05", "remaining_time": "3:51:09", "throughput": 2377.05, "total_tokens": 5718912} {"current_steps": 9930, "total_steps": 67140, "loss": 0.6971, "lr": 4.9651572334410757e-05, "epoch": 1.4789991063449508, "percentage": 14.79, "elapsed_time": "0:40:06", "remaining_time": "3:51:07", "throughput": 2377.09, "total_tokens": 5721632} {"current_steps": 9935, "total_steps": 67140, "loss": 0.7198, "lr": 4.9650490269599096e-05, "epoch": 1.47974381888591, "percentage": 14.8, "elapsed_time": "0:40:08", "remaining_time": "3:51:05", "throughput": 2377.17, "total_tokens": 5724544} {"current_steps": 9940, "total_steps": 67140, "loss": 0.6158, "lr": 4.964940653900753e-05, "epoch": 1.4804885314268692, "percentage": 14.8, "elapsed_time": "0:40:09", "remaining_time": "3:51:04", "throughput": 2377.23, "total_tokens": 5727328} {"current_steps": 9945, "total_steps": 67140, "loss": 0.7004, "lr": 4.964832114270928e-05, "epoch": 1.4812332439678284, "percentage": 14.81, "elapsed_time": "0:40:10", "remaining_time": "3:51:02", "throughput": 2377.28, "total_tokens": 5730144} {"current_steps": 9950, "total_steps": 67140, "loss": 0.6387, "lr": 4.96472340807777e-05, "epoch": 1.4819779565087876, "percentage": 14.82, "elapsed_time": "0:40:11", "remaining_time": "3:51:00", "throughput": 2377.31, "total_tokens": 5732864} {"current_steps": 9955, "total_steps": 67140, "loss": 0.8926, "lr": 4.964614535328626e-05, "epoch": 1.4827226690497468, "percentage": 14.83, "elapsed_time": "0:40:12", "remaining_time": "3:50:59", "throughput": 2377.44, "total_tokens": 5735904} {"current_steps": 9960, "total_steps": 67140, "loss": 0.6896, "lr": 4.9645054960308504e-05, "epoch": 1.483467381590706, "percentage": 14.83, "elapsed_time": "0:40:13", "remaining_time": "3:50:57", "throughput": 2377.51, "total_tokens": 5738752} {"current_steps": 9965, "total_steps": 67140, "loss": 0.6388, "lr": 4.964396290191814e-05, "epoch": 1.4842120941316652, "percentage": 14.84, "elapsed_time": "0:40:14", "remaining_time": "3:50:55", "throughput": 2377.55, "total_tokens": 5741504} {"current_steps": 9970, "total_steps": 67140, "loss": 0.8229, "lr": 4.964286917818895e-05, "epoch": 1.4849568066726244, "percentage": 14.85, "elapsed_time": "0:40:15", "remaining_time": "3:50:53", "throughput": 2377.52, "total_tokens": 5743968} {"current_steps": 9975, "total_steps": 67140, "loss": 0.628, "lr": 4.964177378919487e-05, "epoch": 1.4857015192135836, "percentage": 14.86, "elapsed_time": "0:40:17", "remaining_time": "3:50:52", "throughput": 2377.6, "total_tokens": 5746912} {"current_steps": 9980, "total_steps": 67140, "loss": 0.691, "lr": 4.9640676735009894e-05, "epoch": 1.4864462317545428, "percentage": 14.86, "elapsed_time": "0:40:18", "remaining_time": "3:50:50", "throughput": 2377.61, "total_tokens": 5749536} {"current_steps": 9985, "total_steps": 67140, "loss": 0.5998, "lr": 4.963957801570816e-05, "epoch": 1.4871909442955018, "percentage": 14.87, "elapsed_time": "0:40:19", "remaining_time": "3:50:48", "throughput": 2377.6, "total_tokens": 5752096} {"current_steps": 9990, "total_steps": 67140, "loss": 0.676, "lr": 4.963847763136393e-05, "epoch": 1.487935656836461, "percentage": 14.88, "elapsed_time": "0:40:20", "remaining_time": "3:50:46", "throughput": 2377.69, "total_tokens": 5755040} {"current_steps": 9995, "total_steps": 67140, "loss": 0.5711, "lr": 4.9637375582051556e-05, "epoch": 1.4886803693774202, "percentage": 14.89, "elapsed_time": "0:40:21", "remaining_time": "3:50:45", "throughput": 2377.79, "total_tokens": 5758016} {"current_steps": 10000, "total_steps": 67140, "loss": 0.5853, "lr": 4.96362718678455e-05, "epoch": 1.4894250819183794, "percentage": 14.89, "elapsed_time": "0:40:22", "remaining_time": "3:50:43", "throughput": 2377.85, "total_tokens": 5760832} {"current_steps": 10005, "total_steps": 67140, "loss": 0.5085, "lr": 4.9635166488820365e-05, "epoch": 1.4901697944593386, "percentage": 14.9, "elapsed_time": "0:40:23", "remaining_time": "3:50:41", "throughput": 2377.9, "total_tokens": 5763584} {"current_steps": 10010, "total_steps": 67140, "loss": 0.6364, "lr": 4.963405944505083e-05, "epoch": 1.4909145070002978, "percentage": 14.91, "elapsed_time": "0:40:24", "remaining_time": "3:50:39", "throughput": 2377.96, "total_tokens": 5766400} {"current_steps": 10015, "total_steps": 67140, "loss": 0.6549, "lr": 4.9632950736611713e-05, "epoch": 1.491659219541257, "percentage": 14.92, "elapsed_time": "0:40:26", "remaining_time": "3:50:38", "throughput": 2378.13, "total_tokens": 5769664} {"current_steps": 10020, "total_steps": 67140, "loss": 0.6802, "lr": 4.963184036357793e-05, "epoch": 1.4924039320822162, "percentage": 14.92, "elapsed_time": "0:40:27", "remaining_time": "3:50:36", "throughput": 2378.14, "total_tokens": 5772288} {"current_steps": 10025, "total_steps": 67140, "loss": 0.6325, "lr": 4.9630728326024535e-05, "epoch": 1.4931486446231754, "percentage": 14.93, "elapsed_time": "0:40:28", "remaining_time": "3:50:35", "throughput": 2378.22, "total_tokens": 5775232} {"current_steps": 10030, "total_steps": 67140, "loss": 0.7314, "lr": 4.962961462402666e-05, "epoch": 1.4938933571641346, "percentage": 14.94, "elapsed_time": "0:40:29", "remaining_time": "3:50:33", "throughput": 2378.23, "total_tokens": 5777856} {"current_steps": 10035, "total_steps": 67140, "loss": 0.6791, "lr": 4.9628499257659553e-05, "epoch": 1.4946380697050938, "percentage": 14.95, "elapsed_time": "0:40:30", "remaining_time": "3:50:31", "throughput": 2378.37, "total_tokens": 5780960} {"current_steps": 10040, "total_steps": 67140, "loss": 0.6553, "lr": 4.9627382226998605e-05, "epoch": 1.495382782246053, "percentage": 14.95, "elapsed_time": "0:40:31", "remaining_time": "3:50:30", "throughput": 2378.46, "total_tokens": 5783936} {"current_steps": 10045, "total_steps": 67140, "loss": 0.5511, "lr": 4.9626263532119286e-05, "epoch": 1.4961274947870122, "percentage": 14.96, "elapsed_time": "0:40:32", "remaining_time": "3:50:28", "throughput": 2378.51, "total_tokens": 5786720} {"current_steps": 10050, "total_steps": 67140, "loss": 0.7447, "lr": 4.962514317309721e-05, "epoch": 1.4968722073279714, "percentage": 14.97, "elapsed_time": "0:40:34", "remaining_time": "3:50:26", "throughput": 2378.55, "total_tokens": 5789472} {"current_steps": 10055, "total_steps": 67140, "loss": 0.6587, "lr": 4.962402115000808e-05, "epoch": 1.4976169198689306, "percentage": 14.98, "elapsed_time": "0:40:35", "remaining_time": "3:50:25", "throughput": 2378.58, "total_tokens": 5792192} {"current_steps": 10060, "total_steps": 67140, "loss": 0.6537, "lr": 4.962289746292771e-05, "epoch": 1.4983616324098898, "percentage": 14.98, "elapsed_time": "0:40:36", "remaining_time": "3:50:23", "throughput": 2378.71, "total_tokens": 5795264} {"current_steps": 10065, "total_steps": 67140, "loss": 0.6843, "lr": 4.962177211193203e-05, "epoch": 1.499106344950849, "percentage": 14.99, "elapsed_time": "0:40:37", "remaining_time": "3:50:21", "throughput": 2378.78, "total_tokens": 5798112} {"current_steps": 10070, "total_steps": 67140, "loss": 0.6583, "lr": 4.962064509709711e-05, "epoch": 1.4998510574918082, "percentage": 15.0, "elapsed_time": "0:40:38", "remaining_time": "3:50:20", "throughput": 2378.87, "total_tokens": 5801088} {"current_steps": 10071, "total_steps": 67140, "eval_loss": 0.6765435338020325, "epoch": 1.5, "percentage": 15.0, "elapsed_time": "0:41:53", "remaining_time": "3:57:20", "throughput": 2308.59, "total_tokens": 5801696} {"current_steps": 10075, "total_steps": 67140, "loss": 0.6595, "lr": 4.961951641849909e-05, "epoch": 1.5005957700327675, "percentage": 15.01, "elapsed_time": "0:41:55", "remaining_time": "3:57:28", "throughput": 2307.26, "total_tokens": 5804000} {"current_steps": 10080, "total_steps": 67140, "loss": 0.7563, "lr": 4.961838607621424e-05, "epoch": 1.5013404825737267, "percentage": 15.01, "elapsed_time": "0:41:56", "remaining_time": "3:57:26", "throughput": 2307.51, "total_tokens": 5807488} {"current_steps": 10085, "total_steps": 67140, "loss": 0.7024, "lr": 4.961725407031896e-05, "epoch": 1.5020851951146859, "percentage": 15.02, "elapsed_time": "0:41:57", "remaining_time": "3:57:24", "throughput": 2307.53, "total_tokens": 5810016} {"current_steps": 10090, "total_steps": 67140, "loss": 0.6738, "lr": 4.961612040088973e-05, "epoch": 1.502829907655645, "percentage": 15.03, "elapsed_time": "0:41:58", "remaining_time": "3:57:22", "throughput": 2307.62, "total_tokens": 5812800} {"current_steps": 10095, "total_steps": 67140, "loss": 0.6019, "lr": 4.9614985068003163e-05, "epoch": 1.5035746201966043, "percentage": 15.04, "elapsed_time": "0:42:00", "remaining_time": "3:57:20", "throughput": 2307.68, "total_tokens": 5815552} {"current_steps": 10100, "total_steps": 67140, "loss": 0.7591, "lr": 4.9613848071735987e-05, "epoch": 1.5043193327375635, "percentage": 15.04, "elapsed_time": "0:42:01", "remaining_time": "3:57:18", "throughput": 2307.84, "total_tokens": 5818656} {"current_steps": 10105, "total_steps": 67140, "loss": 0.73, "lr": 4.9612709412165024e-05, "epoch": 1.5050640452785224, "percentage": 15.05, "elapsed_time": "0:42:02", "remaining_time": "3:57:16", "throughput": 2307.97, "total_tokens": 5821600} {"current_steps": 10110, "total_steps": 67140, "loss": 0.9076, "lr": 4.961156908936724e-05, "epoch": 1.5058087578194816, "percentage": 15.06, "elapsed_time": "0:42:03", "remaining_time": "3:57:15", "throughput": 2308.06, "total_tokens": 5824448} {"current_steps": 10115, "total_steps": 67140, "loss": 0.6961, "lr": 4.961042710341967e-05, "epoch": 1.5065534703604408, "percentage": 15.07, "elapsed_time": "0:42:04", "remaining_time": "3:57:13", "throughput": 2308.17, "total_tokens": 5827328} {"current_steps": 10120, "total_steps": 67140, "loss": 0.6576, "lr": 4.96092834543995e-05, "epoch": 1.5072981829014, "percentage": 15.07, "elapsed_time": "0:42:05", "remaining_time": "3:57:11", "throughput": 2308.3, "total_tokens": 5830304} {"current_steps": 10125, "total_steps": 67140, "loss": 0.7196, "lr": 4.9608138142384e-05, "epoch": 1.5080428954423593, "percentage": 15.08, "elapsed_time": "0:42:06", "remaining_time": "3:57:09", "throughput": 2308.39, "total_tokens": 5833120} {"current_steps": 10130, "total_steps": 67140, "loss": 0.5851, "lr": 4.9606991167450584e-05, "epoch": 1.5087876079833185, "percentage": 15.09, "elapsed_time": "0:42:08", "remaining_time": "3:57:07", "throughput": 2308.45, "total_tokens": 5835840} {"current_steps": 10135, "total_steps": 67140, "loss": 0.8727, "lr": 4.9605842529676746e-05, "epoch": 1.5095323205242777, "percentage": 15.1, "elapsed_time": "0:42:09", "remaining_time": "3:57:05", "throughput": 2308.55, "total_tokens": 5838752} {"current_steps": 10140, "total_steps": 67140, "loss": 0.7526, "lr": 4.9604692229140106e-05, "epoch": 1.5102770330652369, "percentage": 15.1, "elapsed_time": "0:42:10", "remaining_time": "3:57:03", "throughput": 2308.7, "total_tokens": 5841792} {"current_steps": 10145, "total_steps": 67140, "loss": 0.8503, "lr": 4.96035402659184e-05, "epoch": 1.5110217456061958, "percentage": 15.11, "elapsed_time": "0:42:11", "remaining_time": "3:57:01", "throughput": 2308.81, "total_tokens": 5844672} {"current_steps": 10150, "total_steps": 67140, "loss": 0.6876, "lr": 4.960238664008948e-05, "epoch": 1.511766458147155, "percentage": 15.12, "elapsed_time": "0:42:12", "remaining_time": "3:57:00", "throughput": 2308.9, "total_tokens": 5847552} {"current_steps": 10155, "total_steps": 67140, "loss": 0.6927, "lr": 4.960123135173129e-05, "epoch": 1.5125111706881142, "percentage": 15.13, "elapsed_time": "0:42:13", "remaining_time": "3:56:58", "throughput": 2309.07, "total_tokens": 5850688} {"current_steps": 10160, "total_steps": 67140, "loss": 0.6265, "lr": 4.960007440092191e-05, "epoch": 1.5132558832290735, "percentage": 15.13, "elapsed_time": "0:42:14", "remaining_time": "3:56:56", "throughput": 2309.17, "total_tokens": 5853536} {"current_steps": 10165, "total_steps": 67140, "loss": 0.6975, "lr": 4.959891578773953e-05, "epoch": 1.5140005957700327, "percentage": 15.14, "elapsed_time": "0:42:16", "remaining_time": "3:56:54", "throughput": 2309.27, "total_tokens": 5856480} {"current_steps": 10170, "total_steps": 67140, "loss": 0.7044, "lr": 4.959775551226242e-05, "epoch": 1.5147453083109919, "percentage": 15.15, "elapsed_time": "0:42:17", "remaining_time": "3:56:52", "throughput": 2309.34, "total_tokens": 5859264} {"current_steps": 10175, "total_steps": 67140, "loss": 0.6806, "lr": 4.9596593574569e-05, "epoch": 1.515490020851951, "percentage": 15.15, "elapsed_time": "0:42:18", "remaining_time": "3:56:50", "throughput": 2309.45, "total_tokens": 5862112} {"current_steps": 10180, "total_steps": 67140, "loss": 0.585, "lr": 4.9595429974737796e-05, "epoch": 1.5162347333929103, "percentage": 15.16, "elapsed_time": "0:42:19", "remaining_time": "3:56:49", "throughput": 2309.6, "total_tokens": 5865216} {"current_steps": 10185, "total_steps": 67140, "loss": 0.6015, "lr": 4.959426471284742e-05, "epoch": 1.5169794459338695, "percentage": 15.17, "elapsed_time": "0:42:20", "remaining_time": "3:56:47", "throughput": 2309.64, "total_tokens": 5867872} {"current_steps": 10190, "total_steps": 67140, "loss": 0.6906, "lr": 4.959309778897664e-05, "epoch": 1.5177241584748287, "percentage": 15.18, "elapsed_time": "0:42:21", "remaining_time": "3:56:45", "throughput": 2309.77, "total_tokens": 5870880} {"current_steps": 10195, "total_steps": 67140, "loss": 0.6517, "lr": 4.959192920320429e-05, "epoch": 1.5184688710157879, "percentage": 15.18, "elapsed_time": "0:42:22", "remaining_time": "3:56:43", "throughput": 2309.92, "total_tokens": 5873920} {"current_steps": 10200, "total_steps": 67140, "loss": 0.6196, "lr": 4.959075895560935e-05, "epoch": 1.519213583556747, "percentage": 15.19, "elapsed_time": "0:42:24", "remaining_time": "3:56:41", "throughput": 2310.05, "total_tokens": 5876928} {"current_steps": 10205, "total_steps": 67140, "loss": 0.6644, "lr": 4.9589587046270904e-05, "epoch": 1.5199582960977063, "percentage": 15.2, "elapsed_time": "0:42:25", "remaining_time": "3:56:40", "throughput": 2310.19, "total_tokens": 5879936} {"current_steps": 10210, "total_steps": 67140, "loss": 0.7835, "lr": 4.958841347526814e-05, "epoch": 1.5207030086386655, "percentage": 15.21, "elapsed_time": "0:42:26", "remaining_time": "3:56:38", "throughput": 2310.35, "total_tokens": 5883072} {"current_steps": 10215, "total_steps": 67140, "loss": 0.6223, "lr": 4.9587238242680356e-05, "epoch": 1.5214477211796247, "percentage": 15.21, "elapsed_time": "0:42:27", "remaining_time": "3:56:36", "throughput": 2310.46, "total_tokens": 5885984} {"current_steps": 10220, "total_steps": 67140, "loss": 0.7387, "lr": 4.958606134858697e-05, "epoch": 1.5221924337205839, "percentage": 15.22, "elapsed_time": "0:42:28", "remaining_time": "3:56:34", "throughput": 2310.51, "total_tokens": 5888704} {"current_steps": 10225, "total_steps": 67140, "loss": 0.7155, "lr": 4.9584882793067534e-05, "epoch": 1.522937146261543, "percentage": 15.23, "elapsed_time": "0:42:29", "remaining_time": "3:56:32", "throughput": 2310.6, "total_tokens": 5891488} {"current_steps": 10230, "total_steps": 67140, "loss": 0.691, "lr": 4.958370257620166e-05, "epoch": 1.5236818588025023, "percentage": 15.24, "elapsed_time": "0:42:30", "remaining_time": "3:56:30", "throughput": 2310.64, "total_tokens": 5894176} {"current_steps": 10235, "total_steps": 67140, "loss": 0.6278, "lr": 4.958252069806912e-05, "epoch": 1.5244265713434615, "percentage": 15.24, "elapsed_time": "0:42:32", "remaining_time": "3:56:28", "throughput": 2310.74, "total_tokens": 5897088} {"current_steps": 10240, "total_steps": 67140, "loss": 0.6982, "lr": 4.9581337158749784e-05, "epoch": 1.5251712838844207, "percentage": 15.25, "elapsed_time": "0:42:33", "remaining_time": "3:56:26", "throughput": 2310.81, "total_tokens": 5899840} {"current_steps": 10245, "total_steps": 67140, "loss": 0.7561, "lr": 4.958015195832362e-05, "epoch": 1.52591599642538, "percentage": 15.26, "elapsed_time": "0:42:34", "remaining_time": "3:56:25", "throughput": 2310.93, "total_tokens": 5902816} {"current_steps": 10250, "total_steps": 67140, "loss": 0.6683, "lr": 4.957896509687072e-05, "epoch": 1.526660708966339, "percentage": 15.27, "elapsed_time": "0:42:35", "remaining_time": "3:56:23", "throughput": 2311.06, "total_tokens": 5905792} {"current_steps": 10255, "total_steps": 67140, "loss": 0.817, "lr": 4.957777657447128e-05, "epoch": 1.5274054215072983, "percentage": 15.27, "elapsed_time": "0:42:36", "remaining_time": "3:56:21", "throughput": 2311.28, "total_tokens": 5909152} {"current_steps": 10260, "total_steps": 67140, "loss": 0.6928, "lr": 4.957658639120564e-05, "epoch": 1.5281501340482575, "percentage": 15.28, "elapsed_time": "0:42:37", "remaining_time": "3:56:20", "throughput": 2311.46, "total_tokens": 5912352} {"current_steps": 10265, "total_steps": 67140, "loss": 0.747, "lr": 4.957539454715421e-05, "epoch": 1.5288948465892167, "percentage": 15.29, "elapsed_time": "0:42:38", "remaining_time": "3:56:18", "throughput": 2311.58, "total_tokens": 5915264} {"current_steps": 10270, "total_steps": 67140, "loss": 0.7773, "lr": 4.957420104239753e-05, "epoch": 1.529639559130176, "percentage": 15.3, "elapsed_time": "0:42:40", "remaining_time": "3:56:16", "throughput": 2311.67, "total_tokens": 5918144} {"current_steps": 10275, "total_steps": 67140, "loss": 0.6781, "lr": 4.9573005877016255e-05, "epoch": 1.5303842716711349, "percentage": 15.3, "elapsed_time": "0:42:41", "remaining_time": "3:56:14", "throughput": 2311.73, "total_tokens": 5920896} {"current_steps": 10280, "total_steps": 67140, "loss": 0.8415, "lr": 4.957180905109115e-05, "epoch": 1.531128984212094, "percentage": 15.31, "elapsed_time": "0:42:42", "remaining_time": "3:56:12", "throughput": 2311.87, "total_tokens": 5923904} {"current_steps": 10285, "total_steps": 67140, "loss": 0.7079, "lr": 4.9570610564703086e-05, "epoch": 1.5318736967530533, "percentage": 15.32, "elapsed_time": "0:42:43", "remaining_time": "3:56:10", "throughput": 2311.95, "total_tokens": 5926688} {"current_steps": 10290, "total_steps": 67140, "loss": 0.6106, "lr": 4.956941041793306e-05, "epoch": 1.5326184092940125, "percentage": 15.33, "elapsed_time": "0:42:44", "remaining_time": "3:56:09", "throughput": 2312.04, "total_tokens": 5929536} {"current_steps": 10295, "total_steps": 67140, "loss": 0.7348, "lr": 4.956820861086217e-05, "epoch": 1.5333631218349717, "percentage": 15.33, "elapsed_time": "0:42:45", "remaining_time": "3:56:07", "throughput": 2312.13, "total_tokens": 5932352} {"current_steps": 10300, "total_steps": 67140, "loss": 0.6873, "lr": 4.956700514357163e-05, "epoch": 1.534107834375931, "percentage": 15.34, "elapsed_time": "0:42:46", "remaining_time": "3:56:05", "throughput": 2312.19, "total_tokens": 5935136} {"current_steps": 10305, "total_steps": 67140, "loss": 0.7385, "lr": 4.956580001614277e-05, "epoch": 1.53485254691689, "percentage": 15.35, "elapsed_time": "0:42:48", "remaining_time": "3:56:03", "throughput": 2312.3, "total_tokens": 5938048} {"current_steps": 10310, "total_steps": 67140, "loss": 0.6977, "lr": 4.9564593228657016e-05, "epoch": 1.5355972594578493, "percentage": 15.36, "elapsed_time": "0:42:49", "remaining_time": "3:56:01", "throughput": 2312.37, "total_tokens": 5940768} {"current_steps": 10315, "total_steps": 67140, "loss": 0.7001, "lr": 4.956338478119592e-05, "epoch": 1.5363419719988085, "percentage": 15.36, "elapsed_time": "0:42:50", "remaining_time": "3:55:59", "throughput": 2312.44, "total_tokens": 5943552} {"current_steps": 10320, "total_steps": 67140, "loss": 0.6975, "lr": 4.956217467384116e-05, "epoch": 1.5370866845397675, "percentage": 15.37, "elapsed_time": "0:42:51", "remaining_time": "3:55:57", "throughput": 2312.59, "total_tokens": 5946624} {"current_steps": 10325, "total_steps": 67140, "loss": 0.6937, "lr": 4.9560962906674493e-05, "epoch": 1.5378313970807267, "percentage": 15.38, "elapsed_time": "0:42:52", "remaining_time": "3:55:55", "throughput": 2312.67, "total_tokens": 5949440} {"current_steps": 10330, "total_steps": 67140, "loss": 0.6189, "lr": 4.9559749479777805e-05, "epoch": 1.538576109621686, "percentage": 15.39, "elapsed_time": "0:42:53", "remaining_time": "3:55:54", "throughput": 2312.84, "total_tokens": 5952576} {"current_steps": 10335, "total_steps": 67140, "loss": 0.7837, "lr": 4.9558534393233104e-05, "epoch": 1.539320822162645, "percentage": 15.39, "elapsed_time": "0:42:54", "remaining_time": "3:55:52", "throughput": 2312.99, "total_tokens": 5955680} {"current_steps": 10340, "total_steps": 67140, "loss": 0.6618, "lr": 4.955731764712249e-05, "epoch": 1.5400655347036043, "percentage": 15.4, "elapsed_time": "0:42:55", "remaining_time": "3:55:50", "throughput": 2313.05, "total_tokens": 5958368} {"current_steps": 10345, "total_steps": 67140, "loss": 0.7658, "lr": 4.9556099241528194e-05, "epoch": 1.5408102472445635, "percentage": 15.41, "elapsed_time": "0:42:57", "remaining_time": "3:55:48", "throughput": 2313.11, "total_tokens": 5961120} {"current_steps": 10350, "total_steps": 67140, "loss": 0.6942, "lr": 4.955487917653256e-05, "epoch": 1.5415549597855227, "percentage": 15.42, "elapsed_time": "0:42:58", "remaining_time": "3:55:46", "throughput": 2313.28, "total_tokens": 5964288} {"current_steps": 10355, "total_steps": 67140, "loss": 0.6513, "lr": 4.955365745221802e-05, "epoch": 1.542299672326482, "percentage": 15.42, "elapsed_time": "0:42:59", "remaining_time": "3:55:44", "throughput": 2313.33, "total_tokens": 5966944} {"current_steps": 10360, "total_steps": 67140, "loss": 0.7285, "lr": 4.955243406866713e-05, "epoch": 1.543044384867441, "percentage": 15.43, "elapsed_time": "0:43:00", "remaining_time": "3:55:42", "throughput": 2313.42, "total_tokens": 5969792} {"current_steps": 10365, "total_steps": 67140, "loss": 0.7643, "lr": 4.9551209025962575e-05, "epoch": 1.5437890974084003, "percentage": 15.44, "elapsed_time": "0:43:01", "remaining_time": "3:55:41", "throughput": 2313.55, "total_tokens": 5972800} {"current_steps": 10370, "total_steps": 67140, "loss": 0.6897, "lr": 4.9549982324187125e-05, "epoch": 1.5445338099493595, "percentage": 15.45, "elapsed_time": "0:43:02", "remaining_time": "3:55:39", "throughput": 2313.63, "total_tokens": 5975616} {"current_steps": 10375, "total_steps": 67140, "loss": 0.7474, "lr": 4.954875396342369e-05, "epoch": 1.5452785224903187, "percentage": 15.45, "elapsed_time": "0:43:03", "remaining_time": "3:55:37", "throughput": 2313.69, "total_tokens": 5978368} {"current_steps": 10380, "total_steps": 67140, "loss": 0.6899, "lr": 4.954752394375527e-05, "epoch": 1.546023235031278, "percentage": 15.46, "elapsed_time": "0:43:05", "remaining_time": "3:55:35", "throughput": 2313.77, "total_tokens": 5981152} {"current_steps": 10385, "total_steps": 67140, "loss": 0.6051, "lr": 4.9546292265264985e-05, "epoch": 1.5467679475722371, "percentage": 15.47, "elapsed_time": "0:43:06", "remaining_time": "3:55:33", "throughput": 2313.91, "total_tokens": 5984224} {"current_steps": 10390, "total_steps": 67140, "loss": 0.6561, "lr": 4.9545058928036056e-05, "epoch": 1.5475126601131963, "percentage": 15.48, "elapsed_time": "0:43:07", "remaining_time": "3:55:31", "throughput": 2313.99, "total_tokens": 5987072} {"current_steps": 10395, "total_steps": 67140, "loss": 0.7573, "lr": 4.9543823932151845e-05, "epoch": 1.5482573726541555, "percentage": 15.48, "elapsed_time": "0:43:08", "remaining_time": "3:55:30", "throughput": 2314.11, "total_tokens": 5990048} {"current_steps": 10400, "total_steps": 67140, "loss": 0.6049, "lr": 4.954258727769581e-05, "epoch": 1.5490020851951147, "percentage": 15.49, "elapsed_time": "0:43:09", "remaining_time": "3:55:28", "throughput": 2314.23, "total_tokens": 5993024} {"current_steps": 10405, "total_steps": 67140, "loss": 0.6434, "lr": 4.9541348964751497e-05, "epoch": 1.549746797736074, "percentage": 15.5, "elapsed_time": "0:43:10", "remaining_time": "3:55:26", "throughput": 2314.35, "total_tokens": 5995968} {"current_steps": 10410, "total_steps": 67140, "loss": 0.6383, "lr": 4.95401089934026e-05, "epoch": 1.5504915102770331, "percentage": 15.5, "elapsed_time": "0:43:11", "remaining_time": "3:55:24", "throughput": 2314.44, "total_tokens": 5998848} {"current_steps": 10415, "total_steps": 67140, "loss": 0.7208, "lr": 4.953886736373291e-05, "epoch": 1.5512362228179923, "percentage": 15.51, "elapsed_time": "0:43:13", "remaining_time": "3:55:23", "throughput": 2314.53, "total_tokens": 6001760} {"current_steps": 10420, "total_steps": 67140, "loss": 0.6701, "lr": 4.953762407582634e-05, "epoch": 1.5519809353589515, "percentage": 15.52, "elapsed_time": "0:43:14", "remaining_time": "3:55:21", "throughput": 2314.67, "total_tokens": 6004768} {"current_steps": 10425, "total_steps": 67140, "loss": 0.6194, "lr": 4.953637912976688e-05, "epoch": 1.5527256478999107, "percentage": 15.53, "elapsed_time": "0:43:15", "remaining_time": "3:55:19", "throughput": 2314.74, "total_tokens": 6007552} {"current_steps": 10430, "total_steps": 67140, "loss": 0.6124, "lr": 4.9535132525638696e-05, "epoch": 1.55347036044087, "percentage": 15.53, "elapsed_time": "0:43:16", "remaining_time": "3:55:17", "throughput": 2314.84, "total_tokens": 6010464} {"current_steps": 10435, "total_steps": 67140, "loss": 0.6681, "lr": 4.9533884263526e-05, "epoch": 1.5542150729818291, "percentage": 15.54, "elapsed_time": "0:43:17", "remaining_time": "3:55:16", "throughput": 2315.05, "total_tokens": 6013792} {"current_steps": 10440, "total_steps": 67140, "loss": 0.7649, "lr": 4.953263434351315e-05, "epoch": 1.5549597855227884, "percentage": 15.55, "elapsed_time": "0:43:18", "remaining_time": "3:55:14", "throughput": 2315.09, "total_tokens": 6016480} {"current_steps": 10445, "total_steps": 67140, "loss": 0.6979, "lr": 4.953138276568462e-05, "epoch": 1.5557044980637476, "percentage": 15.56, "elapsed_time": "0:43:19", "remaining_time": "3:55:12", "throughput": 2315.11, "total_tokens": 6019072} {"current_steps": 10450, "total_steps": 67140, "loss": 0.6581, "lr": 4.953012953012498e-05, "epoch": 1.5564492106047065, "percentage": 15.56, "elapsed_time": "0:43:21", "remaining_time": "3:55:10", "throughput": 2315.23, "total_tokens": 6022048} {"current_steps": 10455, "total_steps": 67140, "loss": 0.792, "lr": 4.952887463691891e-05, "epoch": 1.5571939231456657, "percentage": 15.57, "elapsed_time": "0:43:22", "remaining_time": "3:55:08", "throughput": 2315.31, "total_tokens": 6024896} {"current_steps": 10460, "total_steps": 67140, "loss": 0.7771, "lr": 4.9527618086151226e-05, "epoch": 1.557938635686625, "percentage": 15.58, "elapsed_time": "0:43:23", "remaining_time": "3:55:06", "throughput": 2315.39, "total_tokens": 6027744} {"current_steps": 10465, "total_steps": 67140, "loss": 0.7575, "lr": 4.952635987790683e-05, "epoch": 1.5586833482275841, "percentage": 15.59, "elapsed_time": "0:43:24", "remaining_time": "3:55:04", "throughput": 2315.45, "total_tokens": 6030464} {"current_steps": 10470, "total_steps": 67140, "loss": 0.7447, "lr": 4.9525100012270754e-05, "epoch": 1.5594280607685433, "percentage": 15.59, "elapsed_time": "0:43:25", "remaining_time": "3:55:02", "throughput": 2315.54, "total_tokens": 6033344} {"current_steps": 10475, "total_steps": 67140, "loss": 0.6665, "lr": 4.9523838489328134e-05, "epoch": 1.5601727733095025, "percentage": 15.6, "elapsed_time": "0:43:26", "remaining_time": "3:55:01", "throughput": 2315.65, "total_tokens": 6036256} {"current_steps": 10480, "total_steps": 67140, "loss": 0.7118, "lr": 4.952257530916421e-05, "epoch": 1.5609174858504618, "percentage": 15.61, "elapsed_time": "0:43:27", "remaining_time": "3:54:59", "throughput": 2315.71, "total_tokens": 6039008} {"current_steps": 10485, "total_steps": 67140, "loss": 0.6457, "lr": 4.9521310471864346e-05, "epoch": 1.561662198391421, "percentage": 15.62, "elapsed_time": "0:43:28", "remaining_time": "3:54:57", "throughput": 2315.78, "total_tokens": 6041792} {"current_steps": 10490, "total_steps": 67140, "loss": 0.6789, "lr": 4.952004397751402e-05, "epoch": 1.5624069109323802, "percentage": 15.62, "elapsed_time": "0:43:30", "remaining_time": "3:54:55", "throughput": 2315.9, "total_tokens": 6044768} {"current_steps": 10495, "total_steps": 67140, "loss": 0.5982, "lr": 4.951877582619881e-05, "epoch": 1.5631516234733391, "percentage": 15.63, "elapsed_time": "0:43:31", "remaining_time": "3:54:53", "throughput": 2316.04, "total_tokens": 6047808} {"current_steps": 10500, "total_steps": 67140, "loss": 0.653, "lr": 4.951750601800442e-05, "epoch": 1.5638963360142983, "percentage": 15.64, "elapsed_time": "0:43:32", "remaining_time": "3:54:52", "throughput": 2316.14, "total_tokens": 6050720} {"current_steps": 10505, "total_steps": 67140, "loss": 0.684, "lr": 4.9516234553016656e-05, "epoch": 1.5646410485552575, "percentage": 15.65, "elapsed_time": "0:43:33", "remaining_time": "3:54:50", "throughput": 2316.27, "total_tokens": 6053760} {"current_steps": 10510, "total_steps": 67140, "loss": 0.7162, "lr": 4.951496143132143e-05, "epoch": 1.5653857610962167, "percentage": 15.65, "elapsed_time": "0:43:34", "remaining_time": "3:54:48", "throughput": 2316.37, "total_tokens": 6056704} {"current_steps": 10515, "total_steps": 67140, "loss": 0.5892, "lr": 4.9513686653004785e-05, "epoch": 1.566130473637176, "percentage": 15.66, "elapsed_time": "0:43:35", "remaining_time": "3:54:46", "throughput": 2316.41, "total_tokens": 6059424} {"current_steps": 10520, "total_steps": 67140, "loss": 0.5595, "lr": 4.951241021815286e-05, "epoch": 1.5668751861781351, "percentage": 15.67, "elapsed_time": "0:43:36", "remaining_time": "3:54:44", "throughput": 2316.47, "total_tokens": 6062144} {"current_steps": 10525, "total_steps": 67140, "loss": 0.7531, "lr": 4.9511132126851914e-05, "epoch": 1.5676198987190944, "percentage": 15.68, "elapsed_time": "0:43:38", "remaining_time": "3:54:43", "throughput": 2316.62, "total_tokens": 6065248} {"current_steps": 10530, "total_steps": 67140, "loss": 0.7217, "lr": 4.950985237918831e-05, "epoch": 1.5683646112600536, "percentage": 15.68, "elapsed_time": "0:43:39", "remaining_time": "3:54:41", "throughput": 2316.73, "total_tokens": 6068128} {"current_steps": 10535, "total_steps": 67140, "loss": 0.7606, "lr": 4.950857097524854e-05, "epoch": 1.5691093238010128, "percentage": 15.69, "elapsed_time": "0:43:40", "remaining_time": "3:54:39", "throughput": 2316.79, "total_tokens": 6070848} {"current_steps": 10540, "total_steps": 67140, "loss": 0.6112, "lr": 4.950728791511918e-05, "epoch": 1.569854036341972, "percentage": 15.7, "elapsed_time": "0:43:41", "remaining_time": "3:54:37", "throughput": 2316.94, "total_tokens": 6073952} {"current_steps": 10545, "total_steps": 67140, "loss": 0.7524, "lr": 4.950600319888695e-05, "epoch": 1.5705987488829312, "percentage": 15.71, "elapsed_time": "0:43:42", "remaining_time": "3:54:36", "throughput": 2317.07, "total_tokens": 6076960} {"current_steps": 10550, "total_steps": 67140, "loss": 0.6428, "lr": 4.9504716826638655e-05, "epoch": 1.5713434614238904, "percentage": 15.71, "elapsed_time": "0:43:43", "remaining_time": "3:54:34", "throughput": 2317.14, "total_tokens": 6079712} {"current_steps": 10555, "total_steps": 67140, "loss": 0.6413, "lr": 4.9503428798461226e-05, "epoch": 1.5720881739648496, "percentage": 15.72, "elapsed_time": "0:43:44", "remaining_time": "3:54:31", "throughput": 2317.16, "total_tokens": 6082272} {"current_steps": 10560, "total_steps": 67140, "loss": 0.6213, "lr": 4.95021391144417e-05, "epoch": 1.5728328865058088, "percentage": 15.73, "elapsed_time": "0:43:45", "remaining_time": "3:54:29", "throughput": 2317.21, "total_tokens": 6084960} {"current_steps": 10565, "total_steps": 67140, "loss": 0.6316, "lr": 4.950084777466724e-05, "epoch": 1.573577599046768, "percentage": 15.74, "elapsed_time": "0:43:47", "remaining_time": "3:54:28", "throughput": 2317.3, "total_tokens": 6087808} {"current_steps": 10570, "total_steps": 67140, "loss": 0.6608, "lr": 4.949955477922509e-05, "epoch": 1.5743223115877272, "percentage": 15.74, "elapsed_time": "0:43:48", "remaining_time": "3:54:26", "throughput": 2317.34, "total_tokens": 6090496} {"current_steps": 10575, "total_steps": 67140, "loss": 0.7144, "lr": 4.9498260128202635e-05, "epoch": 1.5750670241286864, "percentage": 15.75, "elapsed_time": "0:43:49", "remaining_time": "3:54:24", "throughput": 2317.48, "total_tokens": 6093600} {"current_steps": 10580, "total_steps": 67140, "loss": 0.5463, "lr": 4.949696382168737e-05, "epoch": 1.5758117366696456, "percentage": 15.76, "elapsed_time": "0:43:50", "remaining_time": "3:54:22", "throughput": 2317.55, "total_tokens": 6096352} {"current_steps": 10585, "total_steps": 67140, "loss": 0.542, "lr": 4.949566585976688e-05, "epoch": 1.5765564492106048, "percentage": 15.77, "elapsed_time": "0:43:51", "remaining_time": "3:54:20", "throughput": 2317.58, "total_tokens": 6098976} {"current_steps": 10590, "total_steps": 67140, "loss": 0.5642, "lr": 4.949436624252889e-05, "epoch": 1.577301161751564, "percentage": 15.77, "elapsed_time": "0:43:52", "remaining_time": "3:54:18", "throughput": 2317.63, "total_tokens": 6101600} {"current_steps": 10595, "total_steps": 67140, "loss": 0.7082, "lr": 4.949306497006121e-05, "epoch": 1.5780458742925232, "percentage": 15.78, "elapsed_time": "0:43:53", "remaining_time": "3:54:16", "throughput": 2317.67, "total_tokens": 6104256} {"current_steps": 10600, "total_steps": 67140, "loss": 0.6332, "lr": 4.949176204245178e-05, "epoch": 1.5787905868334824, "percentage": 15.79, "elapsed_time": "0:43:54", "remaining_time": "3:54:14", "throughput": 2317.73, "total_tokens": 6107040} {"current_steps": 10605, "total_steps": 67140, "loss": 0.7149, "lr": 4.949045745978866e-05, "epoch": 1.5795352993744416, "percentage": 15.8, "elapsed_time": "0:43:56", "remaining_time": "3:54:12", "throughput": 2317.84, "total_tokens": 6109984} {"current_steps": 10610, "total_steps": 67140, "loss": 0.7562, "lr": 4.9489151222159984e-05, "epoch": 1.5802800119154008, "percentage": 15.8, "elapsed_time": "0:43:57", "remaining_time": "3:54:11", "throughput": 2317.96, "total_tokens": 6112960} {"current_steps": 10615, "total_steps": 67140, "loss": 0.6919, "lr": 4.948784332965404e-05, "epoch": 1.58102472445636, "percentage": 15.81, "elapsed_time": "0:43:58", "remaining_time": "3:54:09", "throughput": 2318.05, "total_tokens": 6115840} {"current_steps": 10620, "total_steps": 67140, "loss": 0.7302, "lr": 4.94865337823592e-05, "epoch": 1.5817694369973192, "percentage": 15.82, "elapsed_time": "0:43:59", "remaining_time": "3:54:07", "throughput": 2318.17, "total_tokens": 6118848} {"current_steps": 10625, "total_steps": 67140, "loss": 0.6539, "lr": 4.948522258036397e-05, "epoch": 1.5825141495382782, "percentage": 15.83, "elapsed_time": "0:44:00", "remaining_time": "3:54:05", "throughput": 2318.27, "total_tokens": 6121760} {"current_steps": 10630, "total_steps": 67140, "loss": 0.7273, "lr": 4.948390972375694e-05, "epoch": 1.5832588620792374, "percentage": 15.83, "elapsed_time": "0:44:01", "remaining_time": "3:54:04", "throughput": 2318.37, "total_tokens": 6124672} {"current_steps": 10635, "total_steps": 67140, "loss": 0.6432, "lr": 4.948259521262684e-05, "epoch": 1.5840035746201966, "percentage": 15.84, "elapsed_time": "0:44:02", "remaining_time": "3:54:02", "throughput": 2318.43, "total_tokens": 6127392} {"current_steps": 10640, "total_steps": 67140, "loss": 0.6957, "lr": 4.948127904706249e-05, "epoch": 1.5847482871611558, "percentage": 15.85, "elapsed_time": "0:44:04", "remaining_time": "3:54:00", "throughput": 2318.53, "total_tokens": 6130368} {"current_steps": 10645, "total_steps": 67140, "loss": 0.742, "lr": 4.947996122715283e-05, "epoch": 1.585492999702115, "percentage": 15.85, "elapsed_time": "0:44:05", "remaining_time": "3:53:58", "throughput": 2318.62, "total_tokens": 6133216} {"current_steps": 10650, "total_steps": 67140, "loss": 0.6615, "lr": 4.947864175298693e-05, "epoch": 1.5862377122430742, "percentage": 15.86, "elapsed_time": "0:44:06", "remaining_time": "3:53:56", "throughput": 2318.75, "total_tokens": 6136224} {"current_steps": 10655, "total_steps": 67140, "loss": 0.6838, "lr": 4.9477320624653937e-05, "epoch": 1.5869824247840334, "percentage": 15.87, "elapsed_time": "0:44:07", "remaining_time": "3:53:55", "throughput": 2318.86, "total_tokens": 6139168} {"current_steps": 10660, "total_steps": 67140, "loss": 0.6796, "lr": 4.9475997842243136e-05, "epoch": 1.5877271373249926, "percentage": 15.88, "elapsed_time": "0:44:08", "remaining_time": "3:53:53", "throughput": 2318.98, "total_tokens": 6142144} {"current_steps": 10665, "total_steps": 67140, "loss": 0.7408, "lr": 4.947467340584391e-05, "epoch": 1.5884718498659516, "percentage": 15.88, "elapsed_time": "0:44:09", "remaining_time": "3:53:51", "throughput": 2319.08, "total_tokens": 6145056} {"current_steps": 10670, "total_steps": 67140, "loss": 0.6772, "lr": 4.947334731554577e-05, "epoch": 1.5892165624069108, "percentage": 15.89, "elapsed_time": "0:44:10", "remaining_time": "3:53:49", "throughput": 2319.14, "total_tokens": 6147776} {"current_steps": 10675, "total_steps": 67140, "loss": 0.7521, "lr": 4.947201957143831e-05, "epoch": 1.58996127494787, "percentage": 15.9, "elapsed_time": "0:44:12", "remaining_time": "3:53:47", "throughput": 2319.25, "total_tokens": 6150752} {"current_steps": 10680, "total_steps": 67140, "loss": 0.6865, "lr": 4.947069017361127e-05, "epoch": 1.5907059874888292, "percentage": 15.91, "elapsed_time": "0:44:13", "remaining_time": "3:53:46", "throughput": 2319.3, "total_tokens": 6153504} {"current_steps": 10685, "total_steps": 67140, "loss": 0.6728, "lr": 4.9469359122154476e-05, "epoch": 1.5914507000297884, "percentage": 15.91, "elapsed_time": "0:44:14", "remaining_time": "3:53:44", "throughput": 2319.44, "total_tokens": 6156576} {"current_steps": 10690, "total_steps": 67140, "loss": 0.667, "lr": 4.946802641715788e-05, "epoch": 1.5921954125707476, "percentage": 15.92, "elapsed_time": "0:44:15", "remaining_time": "3:53:42", "throughput": 2319.48, "total_tokens": 6159232} {"current_steps": 10695, "total_steps": 67140, "loss": 0.9304, "lr": 4.9466692058711536e-05, "epoch": 1.5929401251117068, "percentage": 15.93, "elapsed_time": "0:44:16", "remaining_time": "3:53:40", "throughput": 2319.64, "total_tokens": 6162400} {"current_steps": 10700, "total_steps": 67140, "loss": 0.6787, "lr": 4.946535604690562e-05, "epoch": 1.593684837652666, "percentage": 15.94, "elapsed_time": "0:44:17", "remaining_time": "3:53:39", "throughput": 2319.78, "total_tokens": 6165536} {"current_steps": 10705, "total_steps": 67140, "loss": 0.667, "lr": 4.94640183818304e-05, "epoch": 1.5944295501936252, "percentage": 15.94, "elapsed_time": "0:44:18", "remaining_time": "3:53:37", "throughput": 2319.86, "total_tokens": 6168352} {"current_steps": 10710, "total_steps": 67140, "loss": 0.69, "lr": 4.9462679063576286e-05, "epoch": 1.5951742627345844, "percentage": 15.95, "elapsed_time": "0:44:20", "remaining_time": "3:53:35", "throughput": 2319.95, "total_tokens": 6171232} {"current_steps": 10715, "total_steps": 67140, "loss": 0.7345, "lr": 4.946133809223379e-05, "epoch": 1.5959189752755436, "percentage": 15.96, "elapsed_time": "0:44:21", "remaining_time": "3:53:33", "throughput": 2320.06, "total_tokens": 6174176} {"current_steps": 10720, "total_steps": 67140, "loss": 0.751, "lr": 4.945999546789351e-05, "epoch": 1.5966636878165028, "percentage": 15.97, "elapsed_time": "0:44:22", "remaining_time": "3:53:32", "throughput": 2320.31, "total_tokens": 6177728} {"current_steps": 10725, "total_steps": 67140, "loss": 0.7303, "lr": 4.9458651190646185e-05, "epoch": 1.597408400357462, "percentage": 15.97, "elapsed_time": "0:44:23", "remaining_time": "3:53:30", "throughput": 2320.39, "total_tokens": 6180576} {"current_steps": 10730, "total_steps": 67140, "loss": 0.8036, "lr": 4.945730526058265e-05, "epoch": 1.5981531128984212, "percentage": 15.98, "elapsed_time": "0:44:24", "remaining_time": "3:53:29", "throughput": 2320.55, "total_tokens": 6183776} {"current_steps": 10735, "total_steps": 67140, "loss": 0.674, "lr": 4.9455957677793865e-05, "epoch": 1.5988978254393804, "percentage": 15.99, "elapsed_time": "0:44:25", "remaining_time": "3:53:27", "throughput": 2320.58, "total_tokens": 6186368} {"current_steps": 10740, "total_steps": 67140, "loss": 0.4324, "lr": 4.94546084423709e-05, "epoch": 1.5996425379803396, "percentage": 16.0, "elapsed_time": "0:44:26", "remaining_time": "3:53:25", "throughput": 2320.64, "total_tokens": 6189120} {"current_steps": 10745, "total_steps": 67140, "loss": 0.5535, "lr": 4.945325755440491e-05, "epoch": 1.6003872505212988, "percentage": 16.0, "elapsed_time": "0:44:28", "remaining_time": "3:53:23", "throughput": 2320.7, "total_tokens": 6191872} {"current_steps": 10750, "total_steps": 67140, "loss": 0.6776, "lr": 4.945190501398719e-05, "epoch": 1.601131963062258, "percentage": 16.01, "elapsed_time": "0:44:29", "remaining_time": "3:53:21", "throughput": 2320.81, "total_tokens": 6194816} {"current_steps": 10755, "total_steps": 67140, "loss": 0.7219, "lr": 4.945055082120915e-05, "epoch": 1.6018766756032172, "percentage": 16.02, "elapsed_time": "0:44:30", "remaining_time": "3:53:19", "throughput": 2320.89, "total_tokens": 6197664} {"current_steps": 10760, "total_steps": 67140, "loss": 0.7269, "lr": 4.94491949761623e-05, "epoch": 1.6026213881441764, "percentage": 16.03, "elapsed_time": "0:44:31", "remaining_time": "3:53:18", "throughput": 2321.0, "total_tokens": 6200640} {"current_steps": 10765, "total_steps": 67140, "loss": 0.5965, "lr": 4.944783747893825e-05, "epoch": 1.6033661006851356, "percentage": 16.03, "elapsed_time": "0:44:32", "remaining_time": "3:53:16", "throughput": 2321.11, "total_tokens": 6203552} {"current_steps": 10770, "total_steps": 67140, "loss": 0.5349, "lr": 4.944647832962874e-05, "epoch": 1.6041108132260948, "percentage": 16.04, "elapsed_time": "0:44:33", "remaining_time": "3:53:14", "throughput": 2321.17, "total_tokens": 6206336} {"current_steps": 10775, "total_steps": 67140, "loss": 0.6599, "lr": 4.9445117528325625e-05, "epoch": 1.604855525767054, "percentage": 16.05, "elapsed_time": "0:44:34", "remaining_time": "3:53:12", "throughput": 2321.26, "total_tokens": 6209216} {"current_steps": 10780, "total_steps": 67140, "loss": 0.6831, "lr": 4.9443755075120844e-05, "epoch": 1.6056002383080132, "percentage": 16.06, "elapsed_time": "0:44:36", "remaining_time": "3:53:11", "throughput": 2321.39, "total_tokens": 6212192} {"current_steps": 10785, "total_steps": 67140, "loss": 0.6065, "lr": 4.944239097010648e-05, "epoch": 1.6063449508489724, "percentage": 16.06, "elapsed_time": "0:44:37", "remaining_time": "3:53:09", "throughput": 2321.57, "total_tokens": 6215424} {"current_steps": 10790, "total_steps": 67140, "loss": 0.6292, "lr": 4.9441025213374706e-05, "epoch": 1.6070896633899316, "percentage": 16.07, "elapsed_time": "0:44:38", "remaining_time": "3:53:07", "throughput": 2321.72, "total_tokens": 6218528} {"current_steps": 10795, "total_steps": 67140, "loss": 0.766, "lr": 4.9439657805017825e-05, "epoch": 1.6078343759308906, "percentage": 16.08, "elapsed_time": "0:44:39", "remaining_time": "3:53:06", "throughput": 2321.89, "total_tokens": 6221760} {"current_steps": 10800, "total_steps": 67140, "loss": 0.5393, "lr": 4.9438288745128234e-05, "epoch": 1.6085790884718498, "percentage": 16.09, "elapsed_time": "0:44:40", "remaining_time": "3:53:04", "throughput": 2321.91, "total_tokens": 6224320} {"current_steps": 10805, "total_steps": 67140, "loss": 0.5379, "lr": 4.943691803379844e-05, "epoch": 1.609323801012809, "percentage": 16.09, "elapsed_time": "0:44:41", "remaining_time": "3:53:02", "throughput": 2322.02, "total_tokens": 6227296} {"current_steps": 10810, "total_steps": 67140, "loss": 0.5795, "lr": 4.9435545671121085e-05, "epoch": 1.6100685135537682, "percentage": 16.1, "elapsed_time": "0:44:42", "remaining_time": "3:53:00", "throughput": 2322.09, "total_tokens": 6230048} {"current_steps": 10815, "total_steps": 67140, "loss": 0.689, "lr": 4.94341716571889e-05, "epoch": 1.6108132260947274, "percentage": 16.11, "elapsed_time": "0:44:44", "remaining_time": "3:52:58", "throughput": 2322.23, "total_tokens": 6233120} {"current_steps": 10820, "total_steps": 67140, "loss": 0.776, "lr": 4.943279599209474e-05, "epoch": 1.6115579386356866, "percentage": 16.12, "elapsed_time": "0:44:45", "remaining_time": "3:52:57", "throughput": 2322.31, "total_tokens": 6235936} {"current_steps": 10825, "total_steps": 67140, "loss": 0.7111, "lr": 4.943141867593155e-05, "epoch": 1.6123026511766458, "percentage": 16.12, "elapsed_time": "0:44:46", "remaining_time": "3:52:55", "throughput": 2322.42, "total_tokens": 6238848} {"current_steps": 10830, "total_steps": 67140, "loss": 0.7269, "lr": 4.943003970879243e-05, "epoch": 1.613047363717605, "percentage": 16.13, "elapsed_time": "0:44:47", "remaining_time": "3:52:53", "throughput": 2322.46, "total_tokens": 6241504} {"current_steps": 10835, "total_steps": 67140, "loss": 0.804, "lr": 4.942865909077055e-05, "epoch": 1.6137920762585642, "percentage": 16.14, "elapsed_time": "0:44:48", "remaining_time": "3:52:51", "throughput": 2322.49, "total_tokens": 6244160} {"current_steps": 10840, "total_steps": 67140, "loss": 0.579, "lr": 4.942727682195921e-05, "epoch": 1.6145367887995232, "percentage": 16.15, "elapsed_time": "0:44:49", "remaining_time": "3:52:49", "throughput": 2322.59, "total_tokens": 6247072} {"current_steps": 10845, "total_steps": 67140, "loss": 0.723, "lr": 4.942589290245181e-05, "epoch": 1.6152815013404824, "percentage": 16.15, "elapsed_time": "0:44:50", "remaining_time": "3:52:47", "throughput": 2322.63, "total_tokens": 6249792} {"current_steps": 10850, "total_steps": 67140, "loss": 0.7545, "lr": 4.9424507332341874e-05, "epoch": 1.6160262138814416, "percentage": 16.16, "elapsed_time": "0:44:51", "remaining_time": "3:52:45", "throughput": 2322.74, "total_tokens": 6252736} {"current_steps": 10855, "total_steps": 67140, "loss": 0.7344, "lr": 4.942312011172304e-05, "epoch": 1.6167709264224008, "percentage": 16.17, "elapsed_time": "0:44:53", "remaining_time": "3:52:44", "throughput": 2322.85, "total_tokens": 6255744} {"current_steps": 10860, "total_steps": 67140, "loss": 0.6013, "lr": 4.942173124068905e-05, "epoch": 1.61751563896336, "percentage": 16.18, "elapsed_time": "0:44:54", "remaining_time": "3:52:42", "throughput": 2322.95, "total_tokens": 6258688} {"current_steps": 10865, "total_steps": 67140, "loss": 0.7495, "lr": 4.9420340719333746e-05, "epoch": 1.6182603515043192, "percentage": 16.18, "elapsed_time": "0:44:55", "remaining_time": "3:52:40", "throughput": 2323.0, "total_tokens": 6261440} {"current_steps": 10870, "total_steps": 67140, "loss": 0.6796, "lr": 4.941894854775111e-05, "epoch": 1.6190050640452784, "percentage": 16.19, "elapsed_time": "0:44:56", "remaining_time": "3:52:39", "throughput": 2323.11, "total_tokens": 6264416} {"current_steps": 10875, "total_steps": 67140, "loss": 0.7426, "lr": 4.9417554726035206e-05, "epoch": 1.6197497765862376, "percentage": 16.2, "elapsed_time": "0:44:57", "remaining_time": "3:52:37", "throughput": 2323.21, "total_tokens": 6267360} {"current_steps": 10880, "total_steps": 67140, "loss": 0.7274, "lr": 4.941615925428024e-05, "epoch": 1.6204944891271968, "percentage": 16.2, "elapsed_time": "0:44:58", "remaining_time": "3:52:35", "throughput": 2323.32, "total_tokens": 6270304} {"current_steps": 10885, "total_steps": 67140, "loss": 0.5259, "lr": 4.9414762132580486e-05, "epoch": 1.621239201668156, "percentage": 16.21, "elapsed_time": "0:44:59", "remaining_time": "3:52:33", "throughput": 2323.42, "total_tokens": 6273216} {"current_steps": 10890, "total_steps": 67140, "loss": 0.689, "lr": 4.9413363361030374e-05, "epoch": 1.6219839142091153, "percentage": 16.22, "elapsed_time": "0:45:01", "remaining_time": "3:52:31", "throughput": 2323.47, "total_tokens": 6275936} {"current_steps": 10895, "total_steps": 67140, "loss": 0.6746, "lr": 4.941196293972442e-05, "epoch": 1.6227286267500745, "percentage": 16.23, "elapsed_time": "0:45:02", "remaining_time": "3:52:30", "throughput": 2323.54, "total_tokens": 6278720} {"current_steps": 10900, "total_steps": 67140, "loss": 0.73, "lr": 4.941056086875727e-05, "epoch": 1.6234733392910337, "percentage": 16.23, "elapsed_time": "0:45:03", "remaining_time": "3:52:28", "throughput": 2323.63, "total_tokens": 6281568} {"current_steps": 10905, "total_steps": 67140, "loss": 0.7956, "lr": 4.940915714822366e-05, "epoch": 1.6242180518319929, "percentage": 16.24, "elapsed_time": "0:45:04", "remaining_time": "3:52:26", "throughput": 2323.76, "total_tokens": 6284608} {"current_steps": 10910, "total_steps": 67140, "loss": 0.6479, "lr": 4.940775177821845e-05, "epoch": 1.624962764372952, "percentage": 16.25, "elapsed_time": "0:45:05", "remaining_time": "3:52:24", "throughput": 2323.79, "total_tokens": 6287264} {"current_steps": 10915, "total_steps": 67140, "loss": 0.7896, "lr": 4.9406344758836606e-05, "epoch": 1.6257074769139113, "percentage": 16.26, "elapsed_time": "0:45:06", "remaining_time": "3:52:22", "throughput": 2323.91, "total_tokens": 6290208} {"current_steps": 10920, "total_steps": 67140, "loss": 0.6528, "lr": 4.9404936090173214e-05, "epoch": 1.6264521894548705, "percentage": 16.26, "elapsed_time": "0:45:07", "remaining_time": "3:52:21", "throughput": 2324.05, "total_tokens": 6293280} {"current_steps": 10925, "total_steps": 67140, "loss": 0.8767, "lr": 4.9403525772323466e-05, "epoch": 1.6271969019958297, "percentage": 16.27, "elapsed_time": "0:45:08", "remaining_time": "3:52:19", "throughput": 2324.11, "total_tokens": 6296000} {"current_steps": 10930, "total_steps": 67140, "loss": 0.7496, "lr": 4.9402113805382665e-05, "epoch": 1.6279416145367889, "percentage": 16.28, "elapsed_time": "0:45:10", "remaining_time": "3:52:17", "throughput": 2324.22, "total_tokens": 6298976} {"current_steps": 10935, "total_steps": 67140, "loss": 0.6777, "lr": 4.9400700189446226e-05, "epoch": 1.628686327077748, "percentage": 16.29, "elapsed_time": "0:45:11", "remaining_time": "3:52:16", "throughput": 2324.42, "total_tokens": 6302304} {"current_steps": 10940, "total_steps": 67140, "loss": 0.7205, "lr": 4.939928492460967e-05, "epoch": 1.6294310396187073, "percentage": 16.29, "elapsed_time": "0:45:12", "remaining_time": "3:52:14", "throughput": 2324.53, "total_tokens": 6305312} {"current_steps": 10945, "total_steps": 67140, "loss": 0.7092, "lr": 4.939786801096864e-05, "epoch": 1.6301757521596665, "percentage": 16.3, "elapsed_time": "0:45:13", "remaining_time": "3:52:12", "throughput": 2324.62, "total_tokens": 6308128} {"current_steps": 10950, "total_steps": 67140, "loss": 0.7504, "lr": 4.9396449448618886e-05, "epoch": 1.6309204647006257, "percentage": 16.31, "elapsed_time": "0:45:14", "remaining_time": "3:52:10", "throughput": 2324.62, "total_tokens": 6310656} {"current_steps": 10955, "total_steps": 67140, "loss": 0.7131, "lr": 4.9395029237656266e-05, "epoch": 1.6316651772415849, "percentage": 16.32, "elapsed_time": "0:45:15", "remaining_time": "3:52:08", "throughput": 2324.66, "total_tokens": 6313312} {"current_steps": 10960, "total_steps": 67140, "loss": 0.7079, "lr": 4.939360737817675e-05, "epoch": 1.632409889782544, "percentage": 16.32, "elapsed_time": "0:45:16", "remaining_time": "3:52:06", "throughput": 2324.77, "total_tokens": 6316288} {"current_steps": 10965, "total_steps": 67140, "loss": 0.7036, "lr": 4.939218387027643e-05, "epoch": 1.6331546023235033, "percentage": 16.33, "elapsed_time": "0:45:18", "remaining_time": "3:52:04", "throughput": 2324.81, "total_tokens": 6318976} {"current_steps": 10970, "total_steps": 67140, "loss": 0.5316, "lr": 4.939075871405149e-05, "epoch": 1.6338993148644623, "percentage": 16.34, "elapsed_time": "0:45:19", "remaining_time": "3:52:03", "throughput": 2324.91, "total_tokens": 6321888} {"current_steps": 10975, "total_steps": 67140, "loss": 0.6885, "lr": 4.9389331909598246e-05, "epoch": 1.6346440274054215, "percentage": 16.35, "elapsed_time": "0:45:20", "remaining_time": "3:52:01", "throughput": 2325.0, "total_tokens": 6324800} {"current_steps": 10980, "total_steps": 67140, "loss": 0.5896, "lr": 4.938790345701311e-05, "epoch": 1.6353887399463807, "percentage": 16.35, "elapsed_time": "0:45:21", "remaining_time": "3:51:59", "throughput": 2325.03, "total_tokens": 6327424} {"current_steps": 10985, "total_steps": 67140, "loss": 0.6751, "lr": 4.9386473356392614e-05, "epoch": 1.6361334524873399, "percentage": 16.36, "elapsed_time": "0:45:22", "remaining_time": "3:51:57", "throughput": 2325.05, "total_tokens": 6330016} {"current_steps": 10990, "total_steps": 67140, "loss": 0.6446, "lr": 4.93850416078334e-05, "epoch": 1.636878165028299, "percentage": 16.37, "elapsed_time": "0:45:23", "remaining_time": "3:51:55", "throughput": 2325.09, "total_tokens": 6332736} {"current_steps": 10995, "total_steps": 67140, "loss": 0.6724, "lr": 4.938360821143221e-05, "epoch": 1.6376228775692583, "percentage": 16.38, "elapsed_time": "0:45:24", "remaining_time": "3:51:54", "throughput": 2325.18, "total_tokens": 6335680} {"current_steps": 11000, "total_steps": 67140, "loss": 0.761, "lr": 4.938217316728592e-05, "epoch": 1.6383675901102175, "percentage": 16.38, "elapsed_time": "0:45:25", "remaining_time": "3:51:52", "throughput": 2325.22, "total_tokens": 6338400} {"current_steps": 11005, "total_steps": 67140, "loss": 0.6041, "lr": 4.9380736475491484e-05, "epoch": 1.6391123026511767, "percentage": 16.39, "elapsed_time": "0:45:27", "remaining_time": "3:51:50", "throughput": 2325.23, "total_tokens": 6340928} {"current_steps": 11010, "total_steps": 67140, "loss": 0.6664, "lr": 4.9379298136146016e-05, "epoch": 1.6398570151921357, "percentage": 16.4, "elapsed_time": "0:45:28", "remaining_time": "3:51:48", "throughput": 2325.25, "total_tokens": 6343520} {"current_steps": 11015, "total_steps": 67140, "loss": 0.7335, "lr": 4.9377858149346686e-05, "epoch": 1.6406017277330949, "percentage": 16.41, "elapsed_time": "0:45:29", "remaining_time": "3:51:46", "throughput": 2325.33, "total_tokens": 6346304} {"current_steps": 11020, "total_steps": 67140, "loss": 0.6745, "lr": 4.937641651519083e-05, "epoch": 1.641346440274054, "percentage": 16.41, "elapsed_time": "0:45:30", "remaining_time": "3:51:44", "throughput": 2325.37, "total_tokens": 6348992} {"current_steps": 11025, "total_steps": 67140, "loss": 0.6553, "lr": 4.937497323377584e-05, "epoch": 1.6420911528150133, "percentage": 16.42, "elapsed_time": "0:45:31", "remaining_time": "3:51:42", "throughput": 2325.45, "total_tokens": 6351776} {"current_steps": 11030, "total_steps": 67140, "loss": 0.7963, "lr": 4.9373528305199273e-05, "epoch": 1.6428358653559725, "percentage": 16.43, "elapsed_time": "0:45:32", "remaining_time": "3:51:40", "throughput": 2325.47, "total_tokens": 6354368} {"current_steps": 11035, "total_steps": 67140, "loss": 0.5684, "lr": 4.937208172955876e-05, "epoch": 1.6435805778969317, "percentage": 16.44, "elapsed_time": "0:45:33", "remaining_time": "3:51:38", "throughput": 2325.6, "total_tokens": 6357440} {"current_steps": 11040, "total_steps": 67140, "loss": 0.6542, "lr": 4.937063350695204e-05, "epoch": 1.6443252904378909, "percentage": 16.44, "elapsed_time": "0:45:34", "remaining_time": "3:51:36", "throughput": 2325.6, "total_tokens": 6359968} {"current_steps": 11045, "total_steps": 67140, "loss": 0.6907, "lr": 4.9369183637477e-05, "epoch": 1.64507000297885, "percentage": 16.45, "elapsed_time": "0:45:35", "remaining_time": "3:51:35", "throughput": 2325.68, "total_tokens": 6362848} {"current_steps": 11050, "total_steps": 67140, "loss": 0.7326, "lr": 4.93677321212316e-05, "epoch": 1.6458147155198093, "percentage": 16.46, "elapsed_time": "0:45:37", "remaining_time": "3:51:33", "throughput": 2325.79, "total_tokens": 6365792} {"current_steps": 11055, "total_steps": 67140, "loss": 0.8775, "lr": 4.936627895831394e-05, "epoch": 1.6465594280607685, "percentage": 16.47, "elapsed_time": "0:45:38", "remaining_time": "3:51:31", "throughput": 2325.83, "total_tokens": 6368480} {"current_steps": 11060, "total_steps": 67140, "loss": 0.6412, "lr": 4.936482414882222e-05, "epoch": 1.6473041406017277, "percentage": 16.47, "elapsed_time": "0:45:39", "remaining_time": "3:51:29", "throughput": 2326.0, "total_tokens": 6371712} {"current_steps": 11065, "total_steps": 67140, "loss": 0.8859, "lr": 4.9363367692854735e-05, "epoch": 1.648048853142687, "percentage": 16.48, "elapsed_time": "0:45:40", "remaining_time": "3:51:28", "throughput": 2326.11, "total_tokens": 6374688} {"current_steps": 11070, "total_steps": 67140, "loss": 0.6578, "lr": 4.9361909590509924e-05, "epoch": 1.648793565683646, "percentage": 16.49, "elapsed_time": "0:45:41", "remaining_time": "3:51:26", "throughput": 2326.19, "total_tokens": 6377504} {"current_steps": 11075, "total_steps": 67140, "loss": 0.7646, "lr": 4.9360449841886304e-05, "epoch": 1.6495382782246053, "percentage": 16.5, "elapsed_time": "0:45:42", "remaining_time": "3:51:24", "throughput": 2326.22, "total_tokens": 6380160} {"current_steps": 11080, "total_steps": 67140, "loss": 0.5537, "lr": 4.935898844708253e-05, "epoch": 1.6502829907655645, "percentage": 16.5, "elapsed_time": "0:45:43", "remaining_time": "3:51:22", "throughput": 2326.35, "total_tokens": 6383200} {"current_steps": 11085, "total_steps": 67140, "loss": 0.7101, "lr": 4.9357525406197345e-05, "epoch": 1.6510277033065237, "percentage": 16.51, "elapsed_time": "0:45:44", "remaining_time": "3:51:20", "throughput": 2326.4, "total_tokens": 6385952} {"current_steps": 11090, "total_steps": 67140, "loss": 0.5985, "lr": 4.9356060719329636e-05, "epoch": 1.651772415847483, "percentage": 16.52, "elapsed_time": "0:45:46", "remaining_time": "3:51:19", "throughput": 2326.47, "total_tokens": 6388736} {"current_steps": 11095, "total_steps": 67140, "loss": 0.7357, "lr": 4.935459438657836e-05, "epoch": 1.6525171283884421, "percentage": 16.53, "elapsed_time": "0:45:47", "remaining_time": "3:51:17", "throughput": 2326.53, "total_tokens": 6391456} {"current_steps": 11100, "total_steps": 67140, "loss": 0.5544, "lr": 4.9353126408042616e-05, "epoch": 1.6532618409294013, "percentage": 16.53, "elapsed_time": "0:45:48", "remaining_time": "3:51:15", "throughput": 2326.61, "total_tokens": 6394336} {"current_steps": 11105, "total_steps": 67140, "loss": 0.8429, "lr": 4.9351656783821606e-05, "epoch": 1.6540065534703605, "percentage": 16.54, "elapsed_time": "0:45:49", "remaining_time": "3:51:13", "throughput": 2326.68, "total_tokens": 6397120} {"current_steps": 11110, "total_steps": 67140, "loss": 0.6191, "lr": 4.935018551401463e-05, "epoch": 1.6547512660113197, "percentage": 16.55, "elapsed_time": "0:45:50", "remaining_time": "3:51:11", "throughput": 2326.77, "total_tokens": 6400000} {"current_steps": 11115, "total_steps": 67140, "loss": 0.6624, "lr": 4.934871259872112e-05, "epoch": 1.655495978552279, "percentage": 16.55, "elapsed_time": "0:45:51", "remaining_time": "3:51:10", "throughput": 2326.92, "total_tokens": 6403168} {"current_steps": 11120, "total_steps": 67140, "loss": 0.7868, "lr": 4.9347238038040614e-05, "epoch": 1.6562406910932381, "percentage": 16.56, "elapsed_time": "0:45:52", "remaining_time": "3:51:08", "throughput": 2326.98, "total_tokens": 6405952} {"current_steps": 11125, "total_steps": 67140, "loss": 0.7024, "lr": 4.934576183207274e-05, "epoch": 1.6569854036341973, "percentage": 16.57, "elapsed_time": "0:45:54", "remaining_time": "3:51:06", "throughput": 2327.11, "total_tokens": 6408992} {"current_steps": 11130, "total_steps": 67140, "loss": 0.7536, "lr": 4.9344283980917273e-05, "epoch": 1.6577301161751565, "percentage": 16.58, "elapsed_time": "0:45:55", "remaining_time": "3:51:04", "throughput": 2327.16, "total_tokens": 6411680} {"current_steps": 11135, "total_steps": 67140, "loss": 0.5893, "lr": 4.9342804484674064e-05, "epoch": 1.6584748287161157, "percentage": 16.58, "elapsed_time": "0:45:56", "remaining_time": "3:51:03", "throughput": 2327.27, "total_tokens": 6414624} {"current_steps": 11140, "total_steps": 67140, "loss": 0.593, "lr": 4.93413233434431e-05, "epoch": 1.6592195412570747, "percentage": 16.59, "elapsed_time": "0:45:57", "remaining_time": "3:51:01", "throughput": 2327.35, "total_tokens": 6417504} {"current_steps": 11145, "total_steps": 67140, "loss": 0.7078, "lr": 4.933984055732447e-05, "epoch": 1.659964253798034, "percentage": 16.6, "elapsed_time": "0:45:58", "remaining_time": "3:50:59", "throughput": 2327.39, "total_tokens": 6420192} {"current_steps": 11150, "total_steps": 67140, "loss": 0.6106, "lr": 4.9338356126418375e-05, "epoch": 1.6607089663389931, "percentage": 16.61, "elapsed_time": "0:45:59", "remaining_time": "3:50:57", "throughput": 2327.5, "total_tokens": 6423136} {"current_steps": 11155, "total_steps": 67140, "loss": 0.6813, "lr": 4.9336870050825124e-05, "epoch": 1.6614536788799523, "percentage": 16.61, "elapsed_time": "0:46:00", "remaining_time": "3:50:55", "throughput": 2327.57, "total_tokens": 6425920} {"current_steps": 11160, "total_steps": 67140, "loss": 0.834, "lr": 4.933538233064514e-05, "epoch": 1.6621983914209115, "percentage": 16.62, "elapsed_time": "0:46:01", "remaining_time": "3:50:54", "throughput": 2327.68, "total_tokens": 6428896} {"current_steps": 11165, "total_steps": 67140, "loss": 0.609, "lr": 4.9333892965978955e-05, "epoch": 1.6629431039618707, "percentage": 16.63, "elapsed_time": "0:46:03", "remaining_time": "3:50:52", "throughput": 2327.81, "total_tokens": 6432032} {"current_steps": 11170, "total_steps": 67140, "loss": 0.4773, "lr": 4.9332401956927224e-05, "epoch": 1.66368781650283, "percentage": 16.64, "elapsed_time": "0:46:04", "remaining_time": "3:50:51", "throughput": 2327.92, "total_tokens": 6435008} {"current_steps": 11175, "total_steps": 67140, "loss": 0.6344, "lr": 4.93309093035907e-05, "epoch": 1.6644325290437891, "percentage": 16.64, "elapsed_time": "0:46:05", "remaining_time": "3:50:49", "throughput": 2328.08, "total_tokens": 6438176} {"current_steps": 11180, "total_steps": 67140, "loss": 0.5735, "lr": 4.932941500607025e-05, "epoch": 1.6651772415847483, "percentage": 16.65, "elapsed_time": "0:46:06", "remaining_time": "3:50:47", "throughput": 2328.18, "total_tokens": 6441088} {"current_steps": 11185, "total_steps": 67140, "loss": 0.6907, "lr": 4.9327919064466835e-05, "epoch": 1.6659219541257073, "percentage": 16.66, "elapsed_time": "0:46:07", "remaining_time": "3:50:46", "throughput": 2328.38, "total_tokens": 6444448} {"current_steps": 11190, "total_steps": 67140, "loss": 0.9732, "lr": 4.932642147888157e-05, "epoch": 1.6666666666666665, "percentage": 16.67, "elapsed_time": "0:46:08", "remaining_time": "3:50:44", "throughput": 2328.43, "total_tokens": 6447136} {"current_steps": 11195, "total_steps": 67140, "loss": 0.7544, "lr": 4.932492224941565e-05, "epoch": 1.6674113792076257, "percentage": 16.67, "elapsed_time": "0:46:09", "remaining_time": "3:50:42", "throughput": 2328.43, "total_tokens": 6449696} {"current_steps": 11200, "total_steps": 67140, "loss": 0.6389, "lr": 4.932342137617037e-05, "epoch": 1.668156091748585, "percentage": 16.68, "elapsed_time": "0:46:11", "remaining_time": "3:50:40", "throughput": 2328.57, "total_tokens": 6452736} {"current_steps": 11205, "total_steps": 67140, "loss": 0.5284, "lr": 4.932191885924717e-05, "epoch": 1.6689008042895441, "percentage": 16.69, "elapsed_time": "0:46:12", "remaining_time": "3:50:39", "throughput": 2328.68, "total_tokens": 6455712} {"current_steps": 11210, "total_steps": 67140, "loss": 0.6714, "lr": 4.9320414698747586e-05, "epoch": 1.6696455168305033, "percentage": 16.7, "elapsed_time": "0:46:13", "remaining_time": "3:50:37", "throughput": 2328.74, "total_tokens": 6458464} {"current_steps": 11215, "total_steps": 67140, "loss": 0.606, "lr": 4.931890889477325e-05, "epoch": 1.6703902293714625, "percentage": 16.7, "elapsed_time": "0:46:14", "remaining_time": "3:50:35", "throughput": 2328.91, "total_tokens": 6461696} {"current_steps": 11220, "total_steps": 67140, "loss": 0.6093, "lr": 4.931740144742593e-05, "epoch": 1.6711349419124217, "percentage": 16.71, "elapsed_time": "0:46:15", "remaining_time": "3:50:34", "throughput": 2329.08, "total_tokens": 6464896} {"current_steps": 11225, "total_steps": 67140, "loss": 0.7897, "lr": 4.931589235680748e-05, "epoch": 1.671879654453381, "percentage": 16.72, "elapsed_time": "0:46:16", "remaining_time": "3:50:32", "throughput": 2329.2, "total_tokens": 6467904} {"current_steps": 11230, "total_steps": 67140, "loss": 0.6223, "lr": 4.931438162301989e-05, "epoch": 1.6726243669943401, "percentage": 16.73, "elapsed_time": "0:46:18", "remaining_time": "3:50:30", "throughput": 2329.26, "total_tokens": 6470688} {"current_steps": 11235, "total_steps": 67140, "loss": 0.5521, "lr": 4.931286924616524e-05, "epoch": 1.6733690795352993, "percentage": 16.73, "elapsed_time": "0:46:19", "remaining_time": "3:50:28", "throughput": 2329.33, "total_tokens": 6473536} {"current_steps": 11240, "total_steps": 67140, "loss": 0.4608, "lr": 4.931135522634574e-05, "epoch": 1.6741137920762585, "percentage": 16.74, "elapsed_time": "0:46:20", "remaining_time": "3:50:27", "throughput": 2329.4, "total_tokens": 6476352} {"current_steps": 11245, "total_steps": 67140, "loss": 0.7015, "lr": 4.930983956366369e-05, "epoch": 1.6748585046172177, "percentage": 16.75, "elapsed_time": "0:46:21", "remaining_time": "3:50:25", "throughput": 2329.44, "total_tokens": 6479008} {"current_steps": 11250, "total_steps": 67140, "loss": 0.5678, "lr": 4.930832225822153e-05, "epoch": 1.675603217158177, "percentage": 16.76, "elapsed_time": "0:46:22", "remaining_time": "3:50:23", "throughput": 2329.56, "total_tokens": 6482016} {"current_steps": 11255, "total_steps": 67140, "loss": 0.6148, "lr": 4.9306803310121776e-05, "epoch": 1.6763479296991362, "percentage": 16.76, "elapsed_time": "0:46:23", "remaining_time": "3:50:21", "throughput": 2329.59, "total_tokens": 6484672} {"current_steps": 11260, "total_steps": 67140, "loss": 0.7585, "lr": 4.9305282719467076e-05, "epoch": 1.6770926422400954, "percentage": 16.77, "elapsed_time": "0:46:24", "remaining_time": "3:50:19", "throughput": 2329.69, "total_tokens": 6487584} {"current_steps": 11265, "total_steps": 67140, "loss": 0.792, "lr": 4.93037604863602e-05, "epoch": 1.6778373547810546, "percentage": 16.78, "elapsed_time": "0:46:25", "remaining_time": "3:50:18", "throughput": 2329.75, "total_tokens": 6490400} {"current_steps": 11270, "total_steps": 67140, "loss": 0.7321, "lr": 4.930223661090398e-05, "epoch": 1.6785820673220138, "percentage": 16.79, "elapsed_time": "0:46:27", "remaining_time": "3:50:16", "throughput": 2329.87, "total_tokens": 6493440} {"current_steps": 11275, "total_steps": 67140, "loss": 0.7353, "lr": 4.930071109320144e-05, "epoch": 1.679326779862973, "percentage": 16.79, "elapsed_time": "0:46:28", "remaining_time": "3:50:14", "throughput": 2329.9, "total_tokens": 6496096} {"current_steps": 11280, "total_steps": 67140, "loss": 0.6476, "lr": 4.929918393335563e-05, "epoch": 1.6800714924039322, "percentage": 16.8, "elapsed_time": "0:46:29", "remaining_time": "3:50:12", "throughput": 2329.97, "total_tokens": 6498880} {"current_steps": 11285, "total_steps": 67140, "loss": 0.6687, "lr": 4.9297655131469763e-05, "epoch": 1.6808162049448914, "percentage": 16.81, "elapsed_time": "0:46:30", "remaining_time": "3:50:10", "throughput": 2329.98, "total_tokens": 6501440} {"current_steps": 11290, "total_steps": 67140, "loss": 0.71, "lr": 4.929612468764715e-05, "epoch": 1.6815609174858506, "percentage": 16.82, "elapsed_time": "0:46:31", "remaining_time": "3:50:09", "throughput": 2330.15, "total_tokens": 6504736} {"current_steps": 11295, "total_steps": 67140, "loss": 0.6503, "lr": 4.929459260199122e-05, "epoch": 1.6823056300268098, "percentage": 16.82, "elapsed_time": "0:46:32", "remaining_time": "3:50:07", "throughput": 2330.19, "total_tokens": 6507424} {"current_steps": 11300, "total_steps": 67140, "loss": 0.6046, "lr": 4.9293058874605485e-05, "epoch": 1.683050342567769, "percentage": 16.83, "elapsed_time": "0:46:33", "remaining_time": "3:50:05", "throughput": 2330.34, "total_tokens": 6510560} {"current_steps": 11305, "total_steps": 67140, "loss": 0.6738, "lr": 4.9291523505593604e-05, "epoch": 1.6837950551087282, "percentage": 16.84, "elapsed_time": "0:46:35", "remaining_time": "3:50:04", "throughput": 2330.47, "total_tokens": 6513696} {"current_steps": 11310, "total_steps": 67140, "loss": 0.7647, "lr": 4.928998649505933e-05, "epoch": 1.6845397676496874, "percentage": 16.85, "elapsed_time": "0:46:36", "remaining_time": "3:50:02", "throughput": 2330.6, "total_tokens": 6516800} {"current_steps": 11315, "total_steps": 67140, "loss": 0.5716, "lr": 4.9288447843106525e-05, "epoch": 1.6852844801906464, "percentage": 16.85, "elapsed_time": "0:46:37", "remaining_time": "3:50:01", "throughput": 2330.72, "total_tokens": 6519840} {"current_steps": 11320, "total_steps": 67140, "loss": 0.5939, "lr": 4.9286907549839156e-05, "epoch": 1.6860291927316056, "percentage": 16.86, "elapsed_time": "0:46:38", "remaining_time": "3:49:59", "throughput": 2330.84, "total_tokens": 6522816} {"current_steps": 11325, "total_steps": 67140, "loss": 0.624, "lr": 4.928536561536132e-05, "epoch": 1.6867739052725648, "percentage": 16.87, "elapsed_time": "0:46:39", "remaining_time": "3:49:57", "throughput": 2330.91, "total_tokens": 6525664} {"current_steps": 11330, "total_steps": 67140, "loss": 0.7794, "lr": 4.928382203977722e-05, "epoch": 1.687518617813524, "percentage": 16.88, "elapsed_time": "0:46:40", "remaining_time": "3:49:56", "throughput": 2331.11, "total_tokens": 6529088} {"current_steps": 11335, "total_steps": 67140, "loss": 0.6622, "lr": 4.9282276823191154e-05, "epoch": 1.6882633303544832, "percentage": 16.88, "elapsed_time": "0:46:41", "remaining_time": "3:49:54", "throughput": 2331.16, "total_tokens": 6531840} {"current_steps": 11340, "total_steps": 67140, "loss": 0.7172, "lr": 4.9280729965707545e-05, "epoch": 1.6890080428954424, "percentage": 16.89, "elapsed_time": "0:46:43", "remaining_time": "3:49:52", "throughput": 2331.24, "total_tokens": 6534688} {"current_steps": 11345, "total_steps": 67140, "loss": 0.7606, "lr": 4.9279181467430926e-05, "epoch": 1.6897527554364016, "percentage": 16.9, "elapsed_time": "0:46:44", "remaining_time": "3:49:51", "throughput": 2331.36, "total_tokens": 6537664} {"current_steps": 11350, "total_steps": 67140, "loss": 0.7438, "lr": 4.927763132846593e-05, "epoch": 1.6904974679773608, "percentage": 16.9, "elapsed_time": "0:46:45", "remaining_time": "3:49:49", "throughput": 2331.44, "total_tokens": 6540544} {"current_steps": 11355, "total_steps": 67140, "loss": 0.7779, "lr": 4.927607954891732e-05, "epoch": 1.69124218051832, "percentage": 16.91, "elapsed_time": "0:46:46", "remaining_time": "3:49:48", "throughput": 2331.56, "total_tokens": 6543648} {"current_steps": 11360, "total_steps": 67140, "loss": 0.6872, "lr": 4.927452612888994e-05, "epoch": 1.691986893059279, "percentage": 16.92, "elapsed_time": "0:46:47", "remaining_time": "3:49:46", "throughput": 2331.63, "total_tokens": 6546496} {"current_steps": 11365, "total_steps": 67140, "loss": 0.6472, "lr": 4.9272971068488795e-05, "epoch": 1.6927316056002382, "percentage": 16.93, "elapsed_time": "0:46:48", "remaining_time": "3:49:44", "throughput": 2331.74, "total_tokens": 6549568} {"current_steps": 11370, "total_steps": 67140, "loss": 0.5791, "lr": 4.9271414367818944e-05, "epoch": 1.6934763181411974, "percentage": 16.93, "elapsed_time": "0:46:50", "remaining_time": "3:49:43", "throughput": 2331.87, "total_tokens": 6552672} {"current_steps": 11375, "total_steps": 67140, "loss": 0.6944, "lr": 4.926985602698559e-05, "epoch": 1.6942210306821566, "percentage": 16.94, "elapsed_time": "0:46:51", "remaining_time": "3:49:41", "throughput": 2331.92, "total_tokens": 6555424} {"current_steps": 11380, "total_steps": 67140, "loss": 0.5204, "lr": 4.926829604609404e-05, "epoch": 1.6949657432231158, "percentage": 16.95, "elapsed_time": "0:46:52", "remaining_time": "3:49:39", "throughput": 2332.0, "total_tokens": 6558304} {"current_steps": 11385, "total_steps": 67140, "loss": 0.6462, "lr": 4.926673442524971e-05, "epoch": 1.695710455764075, "percentage": 16.96, "elapsed_time": "0:46:53", "remaining_time": "3:49:38", "throughput": 2332.06, "total_tokens": 6561120} {"current_steps": 11390, "total_steps": 67140, "loss": 0.6723, "lr": 4.926517116455813e-05, "epoch": 1.6964551683050342, "percentage": 16.96, "elapsed_time": "0:46:54", "remaining_time": "3:49:36", "throughput": 2332.13, "total_tokens": 6563968} {"current_steps": 11395, "total_steps": 67140, "loss": 0.6043, "lr": 4.926360626412494e-05, "epoch": 1.6971998808459934, "percentage": 16.97, "elapsed_time": "0:46:55", "remaining_time": "3:49:34", "throughput": 2332.17, "total_tokens": 6566656} {"current_steps": 11400, "total_steps": 67140, "loss": 0.672, "lr": 4.926203972405588e-05, "epoch": 1.6979445933869526, "percentage": 16.98, "elapsed_time": "0:46:56", "remaining_time": "3:49:32", "throughput": 2332.3, "total_tokens": 6569696} {"current_steps": 11405, "total_steps": 67140, "loss": 0.6371, "lr": 4.926047154445683e-05, "epoch": 1.6986893059279118, "percentage": 16.99, "elapsed_time": "0:46:57", "remaining_time": "3:49:31", "throughput": 2332.39, "total_tokens": 6572608} {"current_steps": 11410, "total_steps": 67140, "loss": 0.6398, "lr": 4.925890172543374e-05, "epoch": 1.699434018468871, "percentage": 16.99, "elapsed_time": "0:46:59", "remaining_time": "3:49:29", "throughput": 2332.6, "total_tokens": 6576096} {"current_steps": 11415, "total_steps": 67140, "loss": 0.7107, "lr": 4.92573302670927e-05, "epoch": 1.7001787310098302, "percentage": 17.0, "elapsed_time": "0:47:00", "remaining_time": "3:49:27", "throughput": 2332.64, "total_tokens": 6578752} {"current_steps": 11420, "total_steps": 67140, "loss": 0.6043, "lr": 4.9255757169539905e-05, "epoch": 1.7009234435507894, "percentage": 17.01, "elapsed_time": "0:47:01", "remaining_time": "3:49:26", "throughput": 2332.67, "total_tokens": 6581376} {"current_steps": 11425, "total_steps": 67140, "loss": 0.5682, "lr": 4.9254182432881654e-05, "epoch": 1.7016681560917486, "percentage": 17.02, "elapsed_time": "0:47:02", "remaining_time": "3:49:24", "throughput": 2332.79, "total_tokens": 6584352} {"current_steps": 11430, "total_steps": 67140, "loss": 0.5853, "lr": 4.9252606057224373e-05, "epoch": 1.7024128686327078, "percentage": 17.02, "elapsed_time": "0:47:03", "remaining_time": "3:49:22", "throughput": 2332.86, "total_tokens": 6587168} {"current_steps": 11435, "total_steps": 67140, "loss": 0.7753, "lr": 4.9251028042674573e-05, "epoch": 1.703157581173667, "percentage": 17.03, "elapsed_time": "0:47:04", "remaining_time": "3:49:20", "throughput": 2332.96, "total_tokens": 6590144} {"current_steps": 11440, "total_steps": 67140, "loss": 0.7015, "lr": 4.9249448389338905e-05, "epoch": 1.7039022937146262, "percentage": 17.04, "elapsed_time": "0:47:05", "remaining_time": "3:49:19", "throughput": 2333.04, "total_tokens": 6593024} {"current_steps": 11445, "total_steps": 67140, "loss": 0.806, "lr": 4.9247867097324095e-05, "epoch": 1.7046470062555854, "percentage": 17.05, "elapsed_time": "0:47:07", "remaining_time": "3:49:17", "throughput": 2333.15, "total_tokens": 6596032} {"current_steps": 11450, "total_steps": 67140, "loss": 0.6495, "lr": 4.924628416673701e-05, "epoch": 1.7053917187965446, "percentage": 17.05, "elapsed_time": "0:47:08", "remaining_time": "3:49:15", "throughput": 2333.19, "total_tokens": 6598752} {"current_steps": 11455, "total_steps": 67140, "loss": 0.6839, "lr": 4.9244699597684625e-05, "epoch": 1.7061364313375038, "percentage": 17.06, "elapsed_time": "0:47:09", "remaining_time": "3:49:14", "throughput": 2333.44, "total_tokens": 6602528} {"current_steps": 11460, "total_steps": 67140, "loss": 0.5302, "lr": 4.924311339027401e-05, "epoch": 1.706881143878463, "percentage": 17.07, "elapsed_time": "0:47:10", "remaining_time": "3:49:13", "throughput": 2333.54, "total_tokens": 6605472} {"current_steps": 11465, "total_steps": 67140, "loss": 0.6707, "lr": 4.924152554461236e-05, "epoch": 1.7076258564194222, "percentage": 17.08, "elapsed_time": "0:47:11", "remaining_time": "3:49:11", "throughput": 2333.65, "total_tokens": 6608512} {"current_steps": 11470, "total_steps": 67140, "loss": 0.6439, "lr": 4.9239936060806965e-05, "epoch": 1.7083705689603814, "percentage": 17.08, "elapsed_time": "0:47:12", "remaining_time": "3:49:09", "throughput": 2333.74, "total_tokens": 6611392} {"current_steps": 11475, "total_steps": 67140, "loss": 0.8797, "lr": 4.9238344938965254e-05, "epoch": 1.7091152815013406, "percentage": 17.09, "elapsed_time": "0:47:14", "remaining_time": "3:49:08", "throughput": 2333.9, "total_tokens": 6614624} {"current_steps": 11480, "total_steps": 67140, "loss": 0.6451, "lr": 4.923675217919473e-05, "epoch": 1.7098599940422998, "percentage": 17.1, "elapsed_time": "0:47:15", "remaining_time": "3:49:06", "throughput": 2333.98, "total_tokens": 6617536} {"current_steps": 11485, "total_steps": 67140, "loss": 0.6641, "lr": 4.923515778160304e-05, "epoch": 1.710604706583259, "percentage": 17.11, "elapsed_time": "0:47:16", "remaining_time": "3:49:05", "throughput": 2334.07, "total_tokens": 6620448} {"current_steps": 11490, "total_steps": 67140, "loss": 0.5876, "lr": 4.9233561746297917e-05, "epoch": 1.711349419124218, "percentage": 17.11, "elapsed_time": "0:47:17", "remaining_time": "3:49:03", "throughput": 2334.13, "total_tokens": 6623264} {"current_steps": 11495, "total_steps": 67140, "loss": 0.6484, "lr": 4.923196407338721e-05, "epoch": 1.7120941316651772, "percentage": 17.12, "elapsed_time": "0:47:18", "remaining_time": "3:49:01", "throughput": 2334.26, "total_tokens": 6626368} {"current_steps": 11500, "total_steps": 67140, "loss": 0.766, "lr": 4.923036476297891e-05, "epoch": 1.7128388442061364, "percentage": 17.13, "elapsed_time": "0:47:19", "remaining_time": "3:49:00", "throughput": 2334.38, "total_tokens": 6629408} {"current_steps": 11505, "total_steps": 67140, "loss": 0.7042, "lr": 4.922876381518106e-05, "epoch": 1.7135835567470956, "percentage": 17.14, "elapsed_time": "0:47:21", "remaining_time": "3:48:58", "throughput": 2334.45, "total_tokens": 6632256} {"current_steps": 11510, "total_steps": 67140, "loss": 0.6305, "lr": 4.922716123010186e-05, "epoch": 1.7143282692880548, "percentage": 17.14, "elapsed_time": "0:47:22", "remaining_time": "3:48:56", "throughput": 2334.55, "total_tokens": 6635232} {"current_steps": 11515, "total_steps": 67140, "loss": 0.6327, "lr": 4.92255570078496e-05, "epoch": 1.715072981829014, "percentage": 17.15, "elapsed_time": "0:47:23", "remaining_time": "3:48:55", "throughput": 2334.6, "total_tokens": 6638016} {"current_steps": 11520, "total_steps": 67140, "loss": 0.6636, "lr": 4.92239511485327e-05, "epoch": 1.7158176943699732, "percentage": 17.16, "elapsed_time": "0:47:24", "remaining_time": "3:48:53", "throughput": 2334.71, "total_tokens": 6641024} {"current_steps": 11525, "total_steps": 67140, "loss": 0.8138, "lr": 4.922234365225966e-05, "epoch": 1.7165624069109324, "percentage": 17.17, "elapsed_time": "0:47:25", "remaining_time": "3:48:51", "throughput": 2334.78, "total_tokens": 6643840} {"current_steps": 11530, "total_steps": 67140, "loss": 0.8605, "lr": 4.922073451913912e-05, "epoch": 1.7173071194518914, "percentage": 17.17, "elapsed_time": "0:47:26", "remaining_time": "3:48:49", "throughput": 2334.87, "total_tokens": 6646720} {"current_steps": 11535, "total_steps": 67140, "loss": 0.6931, "lr": 4.9219123749279816e-05, "epoch": 1.7180518319928506, "percentage": 17.18, "elapsed_time": "0:47:27", "remaining_time": "3:48:48", "throughput": 2335.0, "total_tokens": 6649760} {"current_steps": 11540, "total_steps": 67140, "loss": 0.5301, "lr": 4.92175113427906e-05, "epoch": 1.7187965445338098, "percentage": 17.19, "elapsed_time": "0:47:28", "remaining_time": "3:48:46", "throughput": 2335.03, "total_tokens": 6652448} {"current_steps": 11545, "total_steps": 67140, "loss": 0.662, "lr": 4.9215897299780426e-05, "epoch": 1.719541257074769, "percentage": 17.2, "elapsed_time": "0:47:30", "remaining_time": "3:48:44", "throughput": 2335.11, "total_tokens": 6655328} {"current_steps": 11550, "total_steps": 67140, "loss": 0.6598, "lr": 4.9214281620358374e-05, "epoch": 1.7202859696157282, "percentage": 17.2, "elapsed_time": "0:47:31", "remaining_time": "3:48:43", "throughput": 2335.24, "total_tokens": 6658368} {"current_steps": 11555, "total_steps": 67140, "loss": 0.8595, "lr": 4.92126643046336e-05, "epoch": 1.7210306821566874, "percentage": 17.21, "elapsed_time": "0:47:32", "remaining_time": "3:48:41", "throughput": 2335.33, "total_tokens": 6661344} {"current_steps": 11560, "total_steps": 67140, "loss": 0.7019, "lr": 4.921104535271543e-05, "epoch": 1.7217753946976466, "percentage": 17.22, "elapsed_time": "0:47:33", "remaining_time": "3:48:39", "throughput": 2335.43, "total_tokens": 6664320} {"current_steps": 11565, "total_steps": 67140, "loss": 0.56, "lr": 4.9209424764713246e-05, "epoch": 1.7225201072386058, "percentage": 17.23, "elapsed_time": "0:47:34", "remaining_time": "3:48:38", "throughput": 2335.54, "total_tokens": 6667296} {"current_steps": 11570, "total_steps": 67140, "loss": 0.7653, "lr": 4.920780254073656e-05, "epoch": 1.723264819779565, "percentage": 17.23, "elapsed_time": "0:47:35", "remaining_time": "3:48:36", "throughput": 2335.56, "total_tokens": 6669952} {"current_steps": 11575, "total_steps": 67140, "loss": 0.5581, "lr": 4.920617868089501e-05, "epoch": 1.7240095323205242, "percentage": 17.24, "elapsed_time": "0:47:36", "remaining_time": "3:48:34", "throughput": 2335.69, "total_tokens": 6673056} {"current_steps": 11580, "total_steps": 67140, "loss": 0.6423, "lr": 4.9204553185298315e-05, "epoch": 1.7247542448614834, "percentage": 17.25, "elapsed_time": "0:47:38", "remaining_time": "3:48:33", "throughput": 2335.75, "total_tokens": 6675840} {"current_steps": 11585, "total_steps": 67140, "loss": 0.7316, "lr": 4.920292605405632e-05, "epoch": 1.7254989574024426, "percentage": 17.25, "elapsed_time": "0:47:39", "remaining_time": "3:48:31", "throughput": 2335.77, "total_tokens": 6678464} {"current_steps": 11590, "total_steps": 67140, "loss": 0.6642, "lr": 4.9201297287278994e-05, "epoch": 1.7262436699434018, "percentage": 17.26, "elapsed_time": "0:47:40", "remaining_time": "3:48:29", "throughput": 2335.8, "total_tokens": 6681120} {"current_steps": 11595, "total_steps": 67140, "loss": 0.4941, "lr": 4.919966688507638e-05, "epoch": 1.726988382484361, "percentage": 17.27, "elapsed_time": "0:47:41", "remaining_time": "3:48:27", "throughput": 2335.86, "total_tokens": 6683872} {"current_steps": 11600, "total_steps": 67140, "loss": 0.8621, "lr": 4.919803484755867e-05, "epoch": 1.7277330950253202, "percentage": 17.28, "elapsed_time": "0:47:42", "remaining_time": "3:48:25", "throughput": 2335.97, "total_tokens": 6686912} {"current_steps": 11605, "total_steps": 67140, "loss": 0.5383, "lr": 4.919640117483616e-05, "epoch": 1.7284778075662794, "percentage": 17.28, "elapsed_time": "0:47:43", "remaining_time": "3:48:24", "throughput": 2336.06, "total_tokens": 6689792} {"current_steps": 11610, "total_steps": 67140, "loss": 0.6574, "lr": 4.9194765867019214e-05, "epoch": 1.7292225201072386, "percentage": 17.29, "elapsed_time": "0:47:44", "remaining_time": "3:48:22", "throughput": 2336.09, "total_tokens": 6692448} {"current_steps": 11615, "total_steps": 67140, "loss": 0.4967, "lr": 4.919312892421837e-05, "epoch": 1.7299672326481979, "percentage": 17.3, "elapsed_time": "0:47:45", "remaining_time": "3:48:20", "throughput": 2336.15, "total_tokens": 6695264} {"current_steps": 11620, "total_steps": 67140, "loss": 0.5784, "lr": 4.9191490346544236e-05, "epoch": 1.730711945189157, "percentage": 17.31, "elapsed_time": "0:47:47", "remaining_time": "3:48:18", "throughput": 2336.22, "total_tokens": 6698112} {"current_steps": 11625, "total_steps": 67140, "loss": 0.52, "lr": 4.918985013410754e-05, "epoch": 1.7314566577301163, "percentage": 17.31, "elapsed_time": "0:47:48", "remaining_time": "3:48:16", "throughput": 2336.27, "total_tokens": 6700864} {"current_steps": 11630, "total_steps": 67140, "loss": 0.6771, "lr": 4.918820828701912e-05, "epoch": 1.7322013702710755, "percentage": 17.32, "elapsed_time": "0:47:49", "remaining_time": "3:48:15", "throughput": 2336.37, "total_tokens": 6703808} {"current_steps": 11635, "total_steps": 67140, "loss": 0.6564, "lr": 4.9186564805389923e-05, "epoch": 1.7329460828120347, "percentage": 17.33, "elapsed_time": "0:47:50", "remaining_time": "3:48:13", "throughput": 2336.54, "total_tokens": 6707072} {"current_steps": 11640, "total_steps": 67140, "loss": 0.5228, "lr": 4.918491968933101e-05, "epoch": 1.7336907953529939, "percentage": 17.34, "elapsed_time": "0:47:51", "remaining_time": "3:48:12", "throughput": 2336.56, "total_tokens": 6709728} {"current_steps": 11645, "total_steps": 67140, "loss": 0.9388, "lr": 4.918327293895356e-05, "epoch": 1.734435507893953, "percentage": 17.34, "elapsed_time": "0:47:52", "remaining_time": "3:48:10", "throughput": 2336.61, "total_tokens": 6712480} {"current_steps": 11650, "total_steps": 67140, "loss": 0.5951, "lr": 4.918162455436884e-05, "epoch": 1.7351802204349123, "percentage": 17.35, "elapsed_time": "0:47:53", "remaining_time": "3:48:08", "throughput": 2336.69, "total_tokens": 6715328} {"current_steps": 11655, "total_steps": 67140, "loss": 0.684, "lr": 4.9179974535688256e-05, "epoch": 1.7359249329758715, "percentage": 17.36, "elapsed_time": "0:47:54", "remaining_time": "3:48:06", "throughput": 2336.76, "total_tokens": 6718176} {"current_steps": 11660, "total_steps": 67140, "loss": 0.8016, "lr": 4.91783228830233e-05, "epoch": 1.7366696455168305, "percentage": 17.37, "elapsed_time": "0:47:56", "remaining_time": "3:48:05", "throughput": 2336.91, "total_tokens": 6721408} {"current_steps": 11665, "total_steps": 67140, "loss": 0.7214, "lr": 4.9176669596485584e-05, "epoch": 1.7374143580577897, "percentage": 17.37, "elapsed_time": "0:47:57", "remaining_time": "3:48:03", "throughput": 2336.95, "total_tokens": 6724096} {"current_steps": 11670, "total_steps": 67140, "loss": 0.6435, "lr": 4.917501467618682e-05, "epoch": 1.7381590705987489, "percentage": 17.38, "elapsed_time": "0:47:58", "remaining_time": "3:48:01", "throughput": 2337.01, "total_tokens": 6726944} {"current_steps": 11675, "total_steps": 67140, "loss": 0.5605, "lr": 4.917335812223887e-05, "epoch": 1.738903783139708, "percentage": 17.39, "elapsed_time": "0:47:59", "remaining_time": "3:48:00", "throughput": 2337.11, "total_tokens": 6729888} {"current_steps": 11680, "total_steps": 67140, "loss": 0.7331, "lr": 4.917169993475366e-05, "epoch": 1.7396484956806673, "percentage": 17.4, "elapsed_time": "0:48:00", "remaining_time": "3:47:58", "throughput": 2337.12, "total_tokens": 6732544} {"current_steps": 11685, "total_steps": 67140, "loss": 0.5593, "lr": 4.917004011384323e-05, "epoch": 1.7403932082216265, "percentage": 17.4, "elapsed_time": "0:48:01", "remaining_time": "3:47:56", "throughput": 2337.22, "total_tokens": 6735488} {"current_steps": 11690, "total_steps": 67140, "loss": 0.7188, "lr": 4.916837865961976e-05, "epoch": 1.7411379207625857, "percentage": 17.41, "elapsed_time": "0:48:02", "remaining_time": "3:47:54", "throughput": 2337.29, "total_tokens": 6738304} {"current_steps": 11695, "total_steps": 67140, "loss": 0.8134, "lr": 4.916671557219553e-05, "epoch": 1.7418826333035449, "percentage": 17.42, "elapsed_time": "0:48:04", "remaining_time": "3:47:53", "throughput": 2337.38, "total_tokens": 6741280} {"current_steps": 11700, "total_steps": 67140, "loss": 0.7116, "lr": 4.916505085168291e-05, "epoch": 1.742627345844504, "percentage": 17.43, "elapsed_time": "0:48:05", "remaining_time": "3:47:51", "throughput": 2337.42, "total_tokens": 6744000} {"current_steps": 11705, "total_steps": 67140, "loss": 0.5316, "lr": 4.91633844981944e-05, "epoch": 1.743372058385463, "percentage": 17.43, "elapsed_time": "0:48:06", "remaining_time": "3:47:49", "throughput": 2337.46, "total_tokens": 6746720} {"current_steps": 11710, "total_steps": 67140, "loss": 0.7808, "lr": 4.9161716511842614e-05, "epoch": 1.7441167709264223, "percentage": 17.44, "elapsed_time": "0:48:07", "remaining_time": "3:47:48", "throughput": 2337.6, "total_tokens": 6749856} {"current_steps": 11715, "total_steps": 67140, "loss": 0.6816, "lr": 4.916004689274026e-05, "epoch": 1.7448614834673815, "percentage": 17.45, "elapsed_time": "0:48:08", "remaining_time": "3:47:46", "throughput": 2337.66, "total_tokens": 6752640} {"current_steps": 11720, "total_steps": 67140, "loss": 0.6847, "lr": 4.915837564100016e-05, "epoch": 1.7456061960083407, "percentage": 17.46, "elapsed_time": "0:48:09", "remaining_time": "3:47:44", "throughput": 2337.73, "total_tokens": 6755520} {"current_steps": 11725, "total_steps": 67140, "loss": 0.5277, "lr": 4.915670275673525e-05, "epoch": 1.7463509085492999, "percentage": 17.46, "elapsed_time": "0:48:10", "remaining_time": "3:47:43", "throughput": 2337.81, "total_tokens": 6758368} {"current_steps": 11730, "total_steps": 67140, "loss": 0.7394, "lr": 4.915502824005859e-05, "epoch": 1.747095621090259, "percentage": 17.47, "elapsed_time": "0:48:12", "remaining_time": "3:47:41", "throughput": 2337.92, "total_tokens": 6761408} {"current_steps": 11735, "total_steps": 67140, "loss": 0.6275, "lr": 4.915335209108333e-05, "epoch": 1.7478403336312183, "percentage": 17.48, "elapsed_time": "0:48:13", "remaining_time": "3:47:39", "throughput": 2338.09, "total_tokens": 6764640} {"current_steps": 11740, "total_steps": 67140, "loss": 0.5597, "lr": 4.9151674309922736e-05, "epoch": 1.7485850461721775, "percentage": 17.49, "elapsed_time": "0:48:14", "remaining_time": "3:47:38", "throughput": 2338.16, "total_tokens": 6767456} {"current_steps": 11745, "total_steps": 67140, "loss": 0.7335, "lr": 4.914999489669018e-05, "epoch": 1.7493297587131367, "percentage": 17.49, "elapsed_time": "0:48:15", "remaining_time": "3:47:36", "throughput": 2338.23, "total_tokens": 6770336} {"current_steps": 11750, "total_steps": 67140, "loss": 0.6716, "lr": 4.9148313851499156e-05, "epoch": 1.7500744712540959, "percentage": 17.5, "elapsed_time": "0:48:16", "remaining_time": "3:47:34", "throughput": 2338.26, "total_tokens": 6772992} {"current_steps": 11755, "total_steps": 67140, "loss": 0.548, "lr": 4.914663117446327e-05, "epoch": 1.750819183795055, "percentage": 17.51, "elapsed_time": "0:48:17", "remaining_time": "3:47:32", "throughput": 2338.31, "total_tokens": 6775744} {"current_steps": 11760, "total_steps": 67140, "loss": 0.6231, "lr": 4.9144946865696204e-05, "epoch": 1.7515638963360143, "percentage": 17.52, "elapsed_time": "0:48:18", "remaining_time": "3:47:31", "throughput": 2338.39, "total_tokens": 6778688} {"current_steps": 11765, "total_steps": 67140, "loss": 0.7204, "lr": 4.9143260925311814e-05, "epoch": 1.7523086088769735, "percentage": 17.52, "elapsed_time": "0:48:20", "remaining_time": "3:47:29", "throughput": 2338.47, "total_tokens": 6781568} {"current_steps": 11770, "total_steps": 67140, "loss": 0.7337, "lr": 4.9141573353424e-05, "epoch": 1.7530533214179327, "percentage": 17.53, "elapsed_time": "0:48:21", "remaining_time": "3:47:28", "throughput": 2338.64, "total_tokens": 6784960} {"current_steps": 11775, "total_steps": 67140, "loss": 0.7208, "lr": 4.913988415014681e-05, "epoch": 1.7537980339588919, "percentage": 17.54, "elapsed_time": "0:48:22", "remaining_time": "3:47:26", "throughput": 2338.76, "total_tokens": 6788032} {"current_steps": 11780, "total_steps": 67140, "loss": 0.6424, "lr": 4.9138193315594404e-05, "epoch": 1.754542746499851, "percentage": 17.55, "elapsed_time": "0:48:23", "remaining_time": "3:47:25", "throughput": 2338.82, "total_tokens": 6790880} {"current_steps": 11785, "total_steps": 67140, "loss": 0.8032, "lr": 4.913650084988103e-05, "epoch": 1.7552874590408103, "percentage": 17.55, "elapsed_time": "0:48:24", "remaining_time": "3:47:23", "throughput": 2338.89, "total_tokens": 6793696} {"current_steps": 11790, "total_steps": 67140, "loss": 0.6472, "lr": 4.9134806753121055e-05, "epoch": 1.7560321715817695, "percentage": 17.56, "elapsed_time": "0:48:25", "remaining_time": "3:47:21", "throughput": 2338.91, "total_tokens": 6796352} {"current_steps": 11795, "total_steps": 67140, "loss": 0.7312, "lr": 4.913311102542897e-05, "epoch": 1.7567768841227287, "percentage": 17.57, "elapsed_time": "0:48:26", "remaining_time": "3:47:19", "throughput": 2338.97, "total_tokens": 6799168} {"current_steps": 11800, "total_steps": 67140, "loss": 0.6638, "lr": 4.913141366691936e-05, "epoch": 1.757521596663688, "percentage": 17.58, "elapsed_time": "0:48:28", "remaining_time": "3:47:18", "throughput": 2339.12, "total_tokens": 6802432} {"current_steps": 11805, "total_steps": 67140, "loss": 0.5651, "lr": 4.912971467770692e-05, "epoch": 1.758266309204647, "percentage": 17.58, "elapsed_time": "0:48:29", "remaining_time": "3:47:17", "throughput": 2339.24, "total_tokens": 6805504} {"current_steps": 11810, "total_steps": 67140, "loss": 0.6669, "lr": 4.912801405790647e-05, "epoch": 1.7590110217456063, "percentage": 17.59, "elapsed_time": "0:48:30", "remaining_time": "3:47:15", "throughput": 2339.33, "total_tokens": 6808448} {"current_steps": 11815, "total_steps": 67140, "loss": 0.5244, "lr": 4.9126311807632926e-05, "epoch": 1.7597557342865655, "percentage": 17.6, "elapsed_time": "0:48:31", "remaining_time": "3:47:13", "throughput": 2339.43, "total_tokens": 6811424} {"current_steps": 11820, "total_steps": 67140, "loss": 0.7023, "lr": 4.912460792700132e-05, "epoch": 1.7605004468275247, "percentage": 17.61, "elapsed_time": "0:48:32", "remaining_time": "3:47:11", "throughput": 2339.43, "total_tokens": 6813984} {"current_steps": 11825, "total_steps": 67140, "loss": 0.4803, "lr": 4.912290241612679e-05, "epoch": 1.761245159368484, "percentage": 17.61, "elapsed_time": "0:48:33", "remaining_time": "3:47:10", "throughput": 2339.53, "total_tokens": 6816928} {"current_steps": 11830, "total_steps": 67140, "loss": 0.7325, "lr": 4.91211952751246e-05, "epoch": 1.7619898719094431, "percentage": 17.62, "elapsed_time": "0:48:34", "remaining_time": "3:47:08", "throughput": 2339.59, "total_tokens": 6819776} {"current_steps": 11835, "total_steps": 67140, "loss": 0.7534, "lr": 4.9119486504110105e-05, "epoch": 1.762734584450402, "percentage": 17.63, "elapsed_time": "0:48:36", "remaining_time": "3:47:06", "throughput": 2339.65, "total_tokens": 6822496} {"current_steps": 11840, "total_steps": 67140, "loss": 0.6892, "lr": 4.911777610319877e-05, "epoch": 1.7634792969913613, "percentage": 17.63, "elapsed_time": "0:48:37", "remaining_time": "3:47:04", "throughput": 2339.76, "total_tokens": 6825472} {"current_steps": 11845, "total_steps": 67140, "loss": 0.7433, "lr": 4.911606407250617e-05, "epoch": 1.7642240095323205, "percentage": 17.64, "elapsed_time": "0:48:38", "remaining_time": "3:47:03", "throughput": 2339.84, "total_tokens": 6828352} {"current_steps": 11850, "total_steps": 67140, "loss": 0.8106, "lr": 4.9114350412148026e-05, "epoch": 1.7649687220732797, "percentage": 17.65, "elapsed_time": "0:48:39", "remaining_time": "3:47:01", "throughput": 2339.89, "total_tokens": 6831104} {"current_steps": 11855, "total_steps": 67140, "loss": 0.777, "lr": 4.911263512224011e-05, "epoch": 1.765713434614239, "percentage": 17.66, "elapsed_time": "0:48:40", "remaining_time": "3:46:59", "throughput": 2340.06, "total_tokens": 6834336} {"current_steps": 11860, "total_steps": 67140, "loss": 0.8059, "lr": 4.911091820289836e-05, "epoch": 1.766458147155198, "percentage": 17.66, "elapsed_time": "0:48:41", "remaining_time": "3:46:58", "throughput": 2340.09, "total_tokens": 6836992} {"current_steps": 11865, "total_steps": 67140, "loss": 0.6248, "lr": 4.910919965423878e-05, "epoch": 1.7672028596961573, "percentage": 17.67, "elapsed_time": "0:48:42", "remaining_time": "3:46:56", "throughput": 2340.13, "total_tokens": 6839744} {"current_steps": 11870, "total_steps": 67140, "loss": 0.6786, "lr": 4.91074794763775e-05, "epoch": 1.7679475722371165, "percentage": 17.68, "elapsed_time": "0:48:43", "remaining_time": "3:46:54", "throughput": 2340.2, "total_tokens": 6842528} {"current_steps": 11875, "total_steps": 67140, "loss": 0.7714, "lr": 4.910575766943079e-05, "epoch": 1.7686922847780755, "percentage": 17.69, "elapsed_time": "0:48:45", "remaining_time": "3:46:53", "throughput": 2340.31, "total_tokens": 6845600} {"current_steps": 11880, "total_steps": 67140, "loss": 0.7949, "lr": 4.9104034233514965e-05, "epoch": 1.7694369973190347, "percentage": 17.69, "elapsed_time": "0:48:46", "remaining_time": "3:46:51", "throughput": 2340.36, "total_tokens": 6848384} {"current_steps": 11885, "total_steps": 67140, "loss": 0.6234, "lr": 4.910230916874651e-05, "epoch": 1.770181709859994, "percentage": 17.7, "elapsed_time": "0:48:47", "remaining_time": "3:46:49", "throughput": 2340.41, "total_tokens": 6851072} {"current_steps": 11890, "total_steps": 67140, "loss": 0.71, "lr": 4.9100582475242004e-05, "epoch": 1.770926422400953, "percentage": 17.71, "elapsed_time": "0:48:48", "remaining_time": "3:46:47", "throughput": 2340.49, "total_tokens": 6853984} {"current_steps": 11895, "total_steps": 67140, "loss": 0.7902, "lr": 4.909885415311811e-05, "epoch": 1.7716711349419123, "percentage": 17.72, "elapsed_time": "0:48:49", "remaining_time": "3:46:45", "throughput": 2340.47, "total_tokens": 6856416} {"current_steps": 11900, "total_steps": 67140, "loss": 0.7531, "lr": 4.9097124202491636e-05, "epoch": 1.7724158474828715, "percentage": 17.72, "elapsed_time": "0:48:50", "remaining_time": "3:46:44", "throughput": 2340.57, "total_tokens": 6859456} {"current_steps": 11905, "total_steps": 67140, "loss": 0.6041, "lr": 4.9095392623479474e-05, "epoch": 1.7731605600238307, "percentage": 17.73, "elapsed_time": "0:48:51", "remaining_time": "3:46:42", "throughput": 2340.62, "total_tokens": 6862208} {"current_steps": 11910, "total_steps": 67140, "loss": 0.7679, "lr": 4.909365941619866e-05, "epoch": 1.77390527256479, "percentage": 17.74, "elapsed_time": "0:48:52", "remaining_time": "3:46:40", "throughput": 2340.71, "total_tokens": 6865152} {"current_steps": 11915, "total_steps": 67140, "loss": 0.6975, "lr": 4.909192458076628e-05, "epoch": 1.7746499851057491, "percentage": 17.75, "elapsed_time": "0:48:54", "remaining_time": "3:46:38", "throughput": 2340.74, "total_tokens": 6867776} {"current_steps": 11920, "total_steps": 67140, "loss": 0.7454, "lr": 4.9090188117299596e-05, "epoch": 1.7753946976467083, "percentage": 17.75, "elapsed_time": "0:48:55", "remaining_time": "3:46:37", "throughput": 2340.85, "total_tokens": 6870848} {"current_steps": 11925, "total_steps": 67140, "loss": 0.6988, "lr": 4.908845002591594e-05, "epoch": 1.7761394101876675, "percentage": 17.76, "elapsed_time": "0:48:56", "remaining_time": "3:46:35", "throughput": 2340.93, "total_tokens": 6873696} {"current_steps": 11930, "total_steps": 67140, "loss": 0.8362, "lr": 4.9086710306732775e-05, "epoch": 1.7768841227286267, "percentage": 17.77, "elapsed_time": "0:48:57", "remaining_time": "3:46:34", "throughput": 2341.08, "total_tokens": 6876928} {"current_steps": 11935, "total_steps": 67140, "loss": 0.676, "lr": 4.908496895986765e-05, "epoch": 1.777628835269586, "percentage": 17.78, "elapsed_time": "0:48:58", "remaining_time": "3:46:32", "throughput": 2341.1, "total_tokens": 6879584} {"current_steps": 11940, "total_steps": 67140, "loss": 0.6991, "lr": 4.908322598543825e-05, "epoch": 1.7783735478105451, "percentage": 17.78, "elapsed_time": "0:48:59", "remaining_time": "3:46:30", "throughput": 2341.26, "total_tokens": 6882784} {"current_steps": 11945, "total_steps": 67140, "loss": 0.7365, "lr": 4.908148138356235e-05, "epoch": 1.7791182603515043, "percentage": 17.79, "elapsed_time": "0:49:00", "remaining_time": "3:46:29", "throughput": 2341.34, "total_tokens": 6885632} {"current_steps": 11950, "total_steps": 67140, "loss": 0.7588, "lr": 4.907973515435784e-05, "epoch": 1.7798629728924635, "percentage": 17.8, "elapsed_time": "0:49:02", "remaining_time": "3:46:27", "throughput": 2341.47, "total_tokens": 6888736} {"current_steps": 11955, "total_steps": 67140, "loss": 0.7245, "lr": 4.907798729794274e-05, "epoch": 1.7806076854334227, "percentage": 17.81, "elapsed_time": "0:49:03", "remaining_time": "3:46:26", "throughput": 2341.6, "total_tokens": 6891840} {"current_steps": 11960, "total_steps": 67140, "loss": 0.6941, "lr": 4.907623781443515e-05, "epoch": 1.781352397974382, "percentage": 17.81, "elapsed_time": "0:49:04", "remaining_time": "3:46:24", "throughput": 2341.65, "total_tokens": 6894592} {"current_steps": 11965, "total_steps": 67140, "loss": 0.5143, "lr": 4.9074486703953295e-05, "epoch": 1.7820971105153411, "percentage": 17.82, "elapsed_time": "0:49:05", "remaining_time": "3:46:22", "throughput": 2341.7, "total_tokens": 6897376} {"current_steps": 11970, "total_steps": 67140, "loss": 0.716, "lr": 4.9072733966615506e-05, "epoch": 1.7828418230563003, "percentage": 17.83, "elapsed_time": "0:49:06", "remaining_time": "3:46:20", "throughput": 2341.74, "total_tokens": 6900096} {"current_steps": 11975, "total_steps": 67140, "loss": 0.7479, "lr": 4.907097960254023e-05, "epoch": 1.7835865355972595, "percentage": 17.84, "elapsed_time": "0:49:07", "remaining_time": "3:46:19", "throughput": 2341.84, "total_tokens": 6903008} {"current_steps": 11980, "total_steps": 67140, "loss": 0.6826, "lr": 4.9069223611846014e-05, "epoch": 1.7843312481382188, "percentage": 17.84, "elapsed_time": "0:49:08", "remaining_time": "3:46:17", "throughput": 2341.97, "total_tokens": 6906144} {"current_steps": 11985, "total_steps": 67140, "loss": 0.5686, "lr": 4.906746599465153e-05, "epoch": 1.785075960679178, "percentage": 17.85, "elapsed_time": "0:49:10", "remaining_time": "3:46:15", "throughput": 2342.07, "total_tokens": 6909152} {"current_steps": 11990, "total_steps": 67140, "loss": 0.6774, "lr": 4.906570675107555e-05, "epoch": 1.7858206732201372, "percentage": 17.86, "elapsed_time": "0:49:11", "remaining_time": "3:46:14", "throughput": 2342.21, "total_tokens": 6912320} {"current_steps": 11995, "total_steps": 67140, "loss": 0.6049, "lr": 4.906394588123694e-05, "epoch": 1.7865653857610964, "percentage": 17.87, "elapsed_time": "0:49:12", "remaining_time": "3:46:12", "throughput": 2342.3, "total_tokens": 6915232} {"current_steps": 12000, "total_steps": 67140, "loss": 0.6405, "lr": 4.9062183385254714e-05, "epoch": 1.7873100983020556, "percentage": 17.87, "elapsed_time": "0:49:13", "remaining_time": "3:46:11", "throughput": 2342.36, "total_tokens": 6918048} {"current_steps": 12005, "total_steps": 67140, "loss": 0.6925, "lr": 4.9060419263247954e-05, "epoch": 1.7880548108430145, "percentage": 17.88, "elapsed_time": "0:49:14", "remaining_time": "3:46:09", "throughput": 2342.4, "total_tokens": 6920832} {"current_steps": 12010, "total_steps": 67140, "loss": 0.7075, "lr": 4.905865351533589e-05, "epoch": 1.7887995233839737, "percentage": 17.89, "elapsed_time": "0:49:15", "remaining_time": "3:46:07", "throughput": 2342.48, "total_tokens": 6923712} {"current_steps": 12015, "total_steps": 67140, "loss": 0.559, "lr": 4.905688614163784e-05, "epoch": 1.789544235924933, "percentage": 17.9, "elapsed_time": "0:49:16", "remaining_time": "3:46:05", "throughput": 2342.52, "total_tokens": 6926432} {"current_steps": 12020, "total_steps": 67140, "loss": 0.7022, "lr": 4.905511714227322e-05, "epoch": 1.7902889484658921, "percentage": 17.9, "elapsed_time": "0:49:17", "remaining_time": "3:46:04", "throughput": 2342.63, "total_tokens": 6929440} {"current_steps": 12025, "total_steps": 67140, "loss": 0.8476, "lr": 4.905334651736159e-05, "epoch": 1.7910336610068514, "percentage": 17.91, "elapsed_time": "0:49:19", "remaining_time": "3:46:02", "throughput": 2342.77, "total_tokens": 6932608} {"current_steps": 12030, "total_steps": 67140, "loss": 0.7652, "lr": 4.90515742670226e-05, "epoch": 1.7917783735478106, "percentage": 17.92, "elapsed_time": "0:49:20", "remaining_time": "3:46:01", "throughput": 2342.87, "total_tokens": 6935616} {"current_steps": 12035, "total_steps": 67140, "loss": 0.5321, "lr": 4.904980039137601e-05, "epoch": 1.7925230860887698, "percentage": 17.93, "elapsed_time": "0:49:21", "remaining_time": "3:45:59", "throughput": 2342.92, "total_tokens": 6938400} {"current_steps": 12040, "total_steps": 67140, "loss": 0.548, "lr": 4.904802489054168e-05, "epoch": 1.793267798629729, "percentage": 17.93, "elapsed_time": "0:49:22", "remaining_time": "3:45:58", "throughput": 2343.0, "total_tokens": 6941344} {"current_steps": 12045, "total_steps": 67140, "loss": 0.6968, "lr": 4.9046247764639606e-05, "epoch": 1.7940125111706882, "percentage": 17.94, "elapsed_time": "0:49:23", "remaining_time": "3:45:56", "throughput": 2343.03, "total_tokens": 6944032} {"current_steps": 12050, "total_steps": 67140, "loss": 0.6976, "lr": 4.9044469013789876e-05, "epoch": 1.7947572237116471, "percentage": 17.95, "elapsed_time": "0:49:24", "remaining_time": "3:45:54", "throughput": 2343.13, "total_tokens": 6947040} {"current_steps": 12055, "total_steps": 67140, "loss": 0.5981, "lr": 4.904268863811268e-05, "epoch": 1.7955019362526063, "percentage": 17.96, "elapsed_time": "0:49:25", "remaining_time": "3:45:52", "throughput": 2343.18, "total_tokens": 6949824} {"current_steps": 12060, "total_steps": 67140, "loss": 0.7357, "lr": 4.9040906637728344e-05, "epoch": 1.7962466487935655, "percentage": 17.96, "elapsed_time": "0:49:27", "remaining_time": "3:45:51", "throughput": 2343.27, "total_tokens": 6952768} {"current_steps": 12065, "total_steps": 67140, "loss": 0.6687, "lr": 4.903912301275728e-05, "epoch": 1.7969913613345248, "percentage": 17.97, "elapsed_time": "0:49:28", "remaining_time": "3:45:49", "throughput": 2343.33, "total_tokens": 6955616} {"current_steps": 12070, "total_steps": 67140, "loss": 0.736, "lr": 4.903733776332001e-05, "epoch": 1.797736073875484, "percentage": 17.98, "elapsed_time": "0:49:29", "remaining_time": "3:45:48", "throughput": 2343.42, "total_tokens": 6958528} {"current_steps": 12075, "total_steps": 67140, "loss": 0.5241, "lr": 4.903555088953719e-05, "epoch": 1.7984807864164432, "percentage": 17.98, "elapsed_time": "0:49:30", "remaining_time": "3:45:46", "throughput": 2343.5, "total_tokens": 6961472} {"current_steps": 12080, "total_steps": 67140, "loss": 0.6973, "lr": 4.9033762391529556e-05, "epoch": 1.7992254989574024, "percentage": 17.99, "elapsed_time": "0:49:31", "remaining_time": "3:45:44", "throughput": 2343.6, "total_tokens": 6964512} {"current_steps": 12085, "total_steps": 67140, "loss": 0.7785, "lr": 4.903197226941798e-05, "epoch": 1.7999702114983616, "percentage": 18.0, "elapsed_time": "0:49:32", "remaining_time": "3:45:43", "throughput": 2343.67, "total_tokens": 6967456} {"current_steps": 12090, "total_steps": 67140, "loss": 0.8358, "lr": 4.9030180523323425e-05, "epoch": 1.8007149240393208, "percentage": 18.01, "elapsed_time": "0:49:33", "remaining_time": "3:45:41", "throughput": 2343.75, "total_tokens": 6970272} {"current_steps": 12095, "total_steps": 67140, "loss": 0.7042, "lr": 4.902838715336697e-05, "epoch": 1.80145963658028, "percentage": 18.01, "elapsed_time": "0:49:35", "remaining_time": "3:45:39", "throughput": 2343.81, "total_tokens": 6973120} {"current_steps": 12100, "total_steps": 67140, "loss": 0.6241, "lr": 4.90265921596698e-05, "epoch": 1.8022043491212392, "percentage": 18.02, "elapsed_time": "0:49:36", "remaining_time": "3:45:38", "throughput": 2343.86, "total_tokens": 6975904} {"current_steps": 12105, "total_steps": 67140, "loss": 0.6314, "lr": 4.9024795542353216e-05, "epoch": 1.8029490616621984, "percentage": 18.03, "elapsed_time": "0:49:37", "remaining_time": "3:45:36", "throughput": 2344.01, "total_tokens": 6979072} {"current_steps": 12110, "total_steps": 67140, "loss": 0.6929, "lr": 4.902299730153863e-05, "epoch": 1.8036937742031576, "percentage": 18.04, "elapsed_time": "0:49:38", "remaining_time": "3:45:35", "throughput": 2344.11, "total_tokens": 6982112} {"current_steps": 12115, "total_steps": 67140, "loss": 0.757, "lr": 4.9021197437347555e-05, "epoch": 1.8044384867441168, "percentage": 18.04, "elapsed_time": "0:49:39", "remaining_time": "3:45:33", "throughput": 2344.18, "total_tokens": 6984960} {"current_steps": 12120, "total_steps": 67140, "loss": 0.574, "lr": 4.901939594990162e-05, "epoch": 1.805183199285076, "percentage": 18.05, "elapsed_time": "0:49:40", "remaining_time": "3:45:31", "throughput": 2344.25, "total_tokens": 6987808} {"current_steps": 12125, "total_steps": 67140, "loss": 0.6889, "lr": 4.901759283932257e-05, "epoch": 1.8059279118260352, "percentage": 18.06, "elapsed_time": "0:49:41", "remaining_time": "3:45:29", "throughput": 2344.28, "total_tokens": 6990496} {"current_steps": 12130, "total_steps": 67140, "loss": 0.7502, "lr": 4.9015788105732236e-05, "epoch": 1.8066726243669944, "percentage": 18.07, "elapsed_time": "0:49:43", "remaining_time": "3:45:28", "throughput": 2344.3, "total_tokens": 6993120} {"current_steps": 12135, "total_steps": 67140, "loss": 0.6717, "lr": 4.9013981749252585e-05, "epoch": 1.8074173369079536, "percentage": 18.07, "elapsed_time": "0:49:44", "remaining_time": "3:45:26", "throughput": 2344.35, "total_tokens": 6995840} {"current_steps": 12140, "total_steps": 67140, "loss": 0.6701, "lr": 4.901217377000568e-05, "epoch": 1.8081620494489128, "percentage": 18.08, "elapsed_time": "0:49:45", "remaining_time": "3:45:24", "throughput": 2344.38, "total_tokens": 6998496} {"current_steps": 12145, "total_steps": 67140, "loss": 0.5838, "lr": 4.90103641681137e-05, "epoch": 1.808906761989872, "percentage": 18.09, "elapsed_time": "0:49:46", "remaining_time": "3:45:22", "throughput": 2344.46, "total_tokens": 7001376} {"current_steps": 12150, "total_steps": 67140, "loss": 0.906, "lr": 4.900855294369893e-05, "epoch": 1.8096514745308312, "percentage": 18.1, "elapsed_time": "0:49:47", "remaining_time": "3:45:21", "throughput": 2344.59, "total_tokens": 7004544} {"current_steps": 12155, "total_steps": 67140, "loss": 0.6362, "lr": 4.900674009688376e-05, "epoch": 1.8103961870717904, "percentage": 18.1, "elapsed_time": "0:49:48", "remaining_time": "3:45:19", "throughput": 2344.65, "total_tokens": 7007360} {"current_steps": 12160, "total_steps": 67140, "loss": 0.6373, "lr": 4.90049256277907e-05, "epoch": 1.8111408996127496, "percentage": 18.11, "elapsed_time": "0:49:49", "remaining_time": "3:45:17", "throughput": 2344.71, "total_tokens": 7010176} {"current_steps": 12165, "total_steps": 67140, "loss": 0.7333, "lr": 4.900310953654236e-05, "epoch": 1.8118856121537088, "percentage": 18.12, "elapsed_time": "0:49:50", "remaining_time": "3:45:16", "throughput": 2344.84, "total_tokens": 7013280} {"current_steps": 12170, "total_steps": 67140, "loss": 0.658, "lr": 4.900129182326147e-05, "epoch": 1.812630324694668, "percentage": 18.13, "elapsed_time": "0:49:52", "remaining_time": "3:45:14", "throughput": 2344.89, "total_tokens": 7016032} {"current_steps": 12175, "total_steps": 67140, "loss": 0.5744, "lr": 4.899947248807086e-05, "epoch": 1.8133750372356272, "percentage": 18.13, "elapsed_time": "0:49:53", "remaining_time": "3:45:14", "throughput": 2345.18, "total_tokens": 7020128} {"current_steps": 12180, "total_steps": 67140, "loss": 0.7962, "lr": 4.899765153109348e-05, "epoch": 1.8141197497765862, "percentage": 18.14, "elapsed_time": "0:49:54", "remaining_time": "3:45:12", "throughput": 2345.3, "total_tokens": 7023232} {"current_steps": 12185, "total_steps": 67140, "loss": 0.576, "lr": 4.899582895245237e-05, "epoch": 1.8148644623175454, "percentage": 18.15, "elapsed_time": "0:49:55", "remaining_time": "3:45:10", "throughput": 2345.35, "total_tokens": 7026048} {"current_steps": 12190, "total_steps": 67140, "loss": 0.7852, "lr": 4.89940047522707e-05, "epoch": 1.8156091748585046, "percentage": 18.16, "elapsed_time": "0:49:56", "remaining_time": "3:45:09", "throughput": 2345.39, "total_tokens": 7028768} {"current_steps": 12195, "total_steps": 67140, "loss": 0.6928, "lr": 4.899217893067174e-05, "epoch": 1.8163538873994638, "percentage": 18.16, "elapsed_time": "0:49:57", "remaining_time": "3:45:07", "throughput": 2345.48, "total_tokens": 7031712} {"current_steps": 12200, "total_steps": 67140, "loss": 0.7576, "lr": 4.8990351487778875e-05, "epoch": 1.817098599940423, "percentage": 18.17, "elapsed_time": "0:49:59", "remaining_time": "3:45:05", "throughput": 2345.58, "total_tokens": 7034720} {"current_steps": 12205, "total_steps": 67140, "loss": 0.6512, "lr": 4.89885224237156e-05, "epoch": 1.8178433124813822, "percentage": 18.18, "elapsed_time": "0:50:00", "remaining_time": "3:45:04", "throughput": 2345.64, "total_tokens": 7037536} {"current_steps": 12210, "total_steps": 67140, "loss": 0.6506, "lr": 4.89866917386055e-05, "epoch": 1.8185880250223414, "percentage": 18.19, "elapsed_time": "0:50:01", "remaining_time": "3:45:02", "throughput": 2345.72, "total_tokens": 7040480} {"current_steps": 12215, "total_steps": 67140, "loss": 0.6857, "lr": 4.89848594325723e-05, "epoch": 1.8193327375633006, "percentage": 18.19, "elapsed_time": "0:50:02", "remaining_time": "3:45:01", "throughput": 2345.83, "total_tokens": 7043552} {"current_steps": 12220, "total_steps": 67140, "loss": 0.7308, "lr": 4.898302550573981e-05, "epoch": 1.8200774501042598, "percentage": 18.2, "elapsed_time": "0:50:03", "remaining_time": "3:44:59", "throughput": 2345.89, "total_tokens": 7046368} {"current_steps": 12225, "total_steps": 67140, "loss": 0.6789, "lr": 4.898118995823197e-05, "epoch": 1.8208221626452188, "percentage": 18.21, "elapsed_time": "0:50:04", "remaining_time": "3:44:58", "throughput": 2346.0, "total_tokens": 7049472} {"current_steps": 12230, "total_steps": 67140, "loss": 0.6391, "lr": 4.8979352790172814e-05, "epoch": 1.821566875186178, "percentage": 18.22, "elapsed_time": "0:50:05", "remaining_time": "3:44:56", "throughput": 2346.0, "total_tokens": 7052000} {"current_steps": 12235, "total_steps": 67140, "loss": 0.7458, "lr": 4.8977514001686485e-05, "epoch": 1.8223115877271372, "percentage": 18.22, "elapsed_time": "0:50:07", "remaining_time": "3:44:54", "throughput": 2346.08, "total_tokens": 7054880} {"current_steps": 12240, "total_steps": 67140, "loss": 0.6727, "lr": 4.8975673592897244e-05, "epoch": 1.8230563002680964, "percentage": 18.23, "elapsed_time": "0:50:08", "remaining_time": "3:44:52", "throughput": 2346.17, "total_tokens": 7057824} {"current_steps": 12245, "total_steps": 67140, "loss": 0.5984, "lr": 4.897383156392947e-05, "epoch": 1.8238010128090556, "percentage": 18.24, "elapsed_time": "0:50:09", "remaining_time": "3:44:51", "throughput": 2346.22, "total_tokens": 7060608} {"current_steps": 12250, "total_steps": 67140, "loss": 0.6634, "lr": 4.897198791490762e-05, "epoch": 1.8245457253500148, "percentage": 18.25, "elapsed_time": "0:50:10", "remaining_time": "3:44:49", "throughput": 2346.38, "total_tokens": 7063872} {"current_steps": 12255, "total_steps": 67140, "loss": 0.7343, "lr": 4.897014264595629e-05, "epoch": 1.825290437890974, "percentage": 18.25, "elapsed_time": "0:50:11", "remaining_time": "3:44:47", "throughput": 2346.4, "total_tokens": 7066560} {"current_steps": 12260, "total_steps": 67140, "loss": 0.614, "lr": 4.896829575720018e-05, "epoch": 1.8260351504319332, "percentage": 18.26, "elapsed_time": "0:50:12", "remaining_time": "3:44:46", "throughput": 2346.47, "total_tokens": 7069408} {"current_steps": 12265, "total_steps": 67140, "loss": 0.7009, "lr": 4.8966447248764084e-05, "epoch": 1.8267798629728924, "percentage": 18.27, "elapsed_time": "0:50:13", "remaining_time": "3:44:44", "throughput": 2346.52, "total_tokens": 7072192} {"current_steps": 12270, "total_steps": 67140, "loss": 0.6721, "lr": 4.8964597120772926e-05, "epoch": 1.8275245755138516, "percentage": 18.28, "elapsed_time": "0:50:15", "remaining_time": "3:44:42", "throughput": 2346.62, "total_tokens": 7075200} {"current_steps": 12275, "total_steps": 67140, "loss": 0.6328, "lr": 4.8962745373351734e-05, "epoch": 1.8282692880548108, "percentage": 18.28, "elapsed_time": "0:50:16", "remaining_time": "3:44:41", "throughput": 2346.66, "total_tokens": 7077952} {"current_steps": 12280, "total_steps": 67140, "loss": 0.6663, "lr": 4.8960892006625626e-05, "epoch": 1.82901400059577, "percentage": 18.29, "elapsed_time": "0:50:17", "remaining_time": "3:44:39", "throughput": 2346.72, "total_tokens": 7080736} {"current_steps": 12285, "total_steps": 67140, "loss": 0.6256, "lr": 4.8959037020719854e-05, "epoch": 1.8297587131367292, "percentage": 18.3, "elapsed_time": "0:50:18", "remaining_time": "3:44:37", "throughput": 2346.81, "total_tokens": 7083680} {"current_steps": 12290, "total_steps": 67140, "loss": 0.7744, "lr": 4.895718041575978e-05, "epoch": 1.8305034256776884, "percentage": 18.31, "elapsed_time": "0:50:19", "remaining_time": "3:44:36", "throughput": 2346.87, "total_tokens": 7086464} {"current_steps": 12295, "total_steps": 67140, "loss": 0.6355, "lr": 4.895532219187085e-05, "epoch": 1.8312481382186476, "percentage": 18.31, "elapsed_time": "0:50:20", "remaining_time": "3:44:34", "throughput": 2346.99, "total_tokens": 7089568} {"current_steps": 12300, "total_steps": 67140, "loss": 0.7666, "lr": 4.895346234917865e-05, "epoch": 1.8319928507596068, "percentage": 18.32, "elapsed_time": "0:50:21", "remaining_time": "3:44:33", "throughput": 2347.1, "total_tokens": 7092640} {"current_steps": 12305, "total_steps": 67140, "loss": 0.5524, "lr": 4.8951600887808836e-05, "epoch": 1.832737563300566, "percentage": 18.33, "elapsed_time": "0:50:22", "remaining_time": "3:44:31", "throughput": 2347.14, "total_tokens": 7095392} {"current_steps": 12310, "total_steps": 67140, "loss": 0.6247, "lr": 4.894973780788722e-05, "epoch": 1.8334822758415252, "percentage": 18.33, "elapsed_time": "0:50:24", "remaining_time": "3:44:29", "throughput": 2347.22, "total_tokens": 7098304} {"current_steps": 12315, "total_steps": 67140, "loss": 0.7287, "lr": 4.89478731095397e-05, "epoch": 1.8342269883824844, "percentage": 18.34, "elapsed_time": "0:50:25", "remaining_time": "3:44:28", "throughput": 2347.26, "total_tokens": 7101056} {"current_steps": 12320, "total_steps": 67140, "loss": 0.6707, "lr": 4.894600679289228e-05, "epoch": 1.8349717009234436, "percentage": 18.35, "elapsed_time": "0:50:26", "remaining_time": "3:44:26", "throughput": 2347.36, "total_tokens": 7104064} {"current_steps": 12325, "total_steps": 67140, "loss": 0.5293, "lr": 4.8944138858071076e-05, "epoch": 1.8357164134644028, "percentage": 18.36, "elapsed_time": "0:50:27", "remaining_time": "3:44:25", "throughput": 2347.46, "total_tokens": 7107104} {"current_steps": 12330, "total_steps": 67140, "loss": 0.7067, "lr": 4.894226930520232e-05, "epoch": 1.836461126005362, "percentage": 18.36, "elapsed_time": "0:50:28", "remaining_time": "3:44:23", "throughput": 2347.55, "total_tokens": 7110080} {"current_steps": 12335, "total_steps": 67140, "loss": 0.495, "lr": 4.894039813441235e-05, "epoch": 1.8372058385463212, "percentage": 18.37, "elapsed_time": "0:50:29", "remaining_time": "3:44:21", "throughput": 2347.62, "total_tokens": 7112992} {"current_steps": 12340, "total_steps": 67140, "loss": 0.8325, "lr": 4.89385253458276e-05, "epoch": 1.8379505510872804, "percentage": 18.38, "elapsed_time": "0:50:31", "remaining_time": "3:44:20", "throughput": 2347.71, "total_tokens": 7115968} {"current_steps": 12345, "total_steps": 67140, "loss": 0.6274, "lr": 4.8936650939574636e-05, "epoch": 1.8386952636282397, "percentage": 18.39, "elapsed_time": "0:50:32", "remaining_time": "3:44:18", "throughput": 2347.82, "total_tokens": 7119040} {"current_steps": 12350, "total_steps": 67140, "loss": 0.6665, "lr": 4.893477491578013e-05, "epoch": 1.8394399761691989, "percentage": 18.39, "elapsed_time": "0:50:33", "remaining_time": "3:44:17", "throughput": 2347.91, "total_tokens": 7122016} {"current_steps": 12355, "total_steps": 67140, "loss": 0.6335, "lr": 4.893289727457083e-05, "epoch": 1.8401846887101578, "percentage": 18.4, "elapsed_time": "0:50:34", "remaining_time": "3:44:15", "throughput": 2347.97, "total_tokens": 7124832} {"current_steps": 12360, "total_steps": 67140, "loss": 0.6112, "lr": 4.893101801607365e-05, "epoch": 1.840929401251117, "percentage": 18.41, "elapsed_time": "0:50:35", "remaining_time": "3:44:13", "throughput": 2348.06, "total_tokens": 7127808} {"current_steps": 12365, "total_steps": 67140, "loss": 0.6994, "lr": 4.892913714041556e-05, "epoch": 1.8416741137920762, "percentage": 18.42, "elapsed_time": "0:50:36", "remaining_time": "3:44:12", "throughput": 2348.18, "total_tokens": 7130880} {"current_steps": 12370, "total_steps": 67140, "loss": 0.6891, "lr": 4.892725464772368e-05, "epoch": 1.8424188263330354, "percentage": 18.42, "elapsed_time": "0:50:37", "remaining_time": "3:44:10", "throughput": 2348.27, "total_tokens": 7133856} {"current_steps": 12375, "total_steps": 67140, "loss": 0.6619, "lr": 4.8925370538125204e-05, "epoch": 1.8431635388739946, "percentage": 18.43, "elapsed_time": "0:50:39", "remaining_time": "3:44:09", "throughput": 2348.34, "total_tokens": 7136768} {"current_steps": 12380, "total_steps": 67140, "loss": 0.6816, "lr": 4.892348481174747e-05, "epoch": 1.8439082514149538, "percentage": 18.44, "elapsed_time": "0:50:40", "remaining_time": "3:44:07", "throughput": 2348.41, "total_tokens": 7139680} {"current_steps": 12385, "total_steps": 67140, "loss": 0.6635, "lr": 4.8921597468717887e-05, "epoch": 1.844652963955913, "percentage": 18.45, "elapsed_time": "0:50:41", "remaining_time": "3:44:06", "throughput": 2348.48, "total_tokens": 7142560} {"current_steps": 12390, "total_steps": 67140, "loss": 0.5454, "lr": 4.891970850916401e-05, "epoch": 1.8453976764968723, "percentage": 18.45, "elapsed_time": "0:50:42", "remaining_time": "3:44:04", "throughput": 2348.51, "total_tokens": 7145248} {"current_steps": 12395, "total_steps": 67140, "loss": 0.7346, "lr": 4.891781793321348e-05, "epoch": 1.8461423890378312, "percentage": 18.46, "elapsed_time": "0:50:43", "remaining_time": "3:44:02", "throughput": 2348.57, "total_tokens": 7148064} {"current_steps": 12400, "total_steps": 67140, "loss": 0.6612, "lr": 4.8915925740994064e-05, "epoch": 1.8468871015787904, "percentage": 18.47, "elapsed_time": "0:50:44", "remaining_time": "3:44:01", "throughput": 2348.69, "total_tokens": 7151136} {"current_steps": 12405, "total_steps": 67140, "loss": 0.6098, "lr": 4.8914031932633613e-05, "epoch": 1.8476318141197496, "percentage": 18.48, "elapsed_time": "0:50:45", "remaining_time": "3:43:59", "throughput": 2348.76, "total_tokens": 7154016} {"current_steps": 12410, "total_steps": 67140, "loss": 0.5452, "lr": 4.891213650826012e-05, "epoch": 1.8483765266607088, "percentage": 18.48, "elapsed_time": "0:50:46", "remaining_time": "3:43:57", "throughput": 2348.86, "total_tokens": 7156960} {"current_steps": 12415, "total_steps": 67140, "loss": 0.6975, "lr": 4.891023946800165e-05, "epoch": 1.849121239201668, "percentage": 18.49, "elapsed_time": "0:50:48", "remaining_time": "3:43:56", "throughput": 2348.92, "total_tokens": 7159872} {"current_steps": 12420, "total_steps": 67140, "loss": 0.5253, "lr": 4.890834081198642e-05, "epoch": 1.8498659517426272, "percentage": 18.5, "elapsed_time": "0:50:49", "remaining_time": "3:43:54", "throughput": 2349.02, "total_tokens": 7162880} {"current_steps": 12425, "total_steps": 67140, "loss": 0.7161, "lr": 4.890644054034271e-05, "epoch": 1.8506106642835864, "percentage": 18.51, "elapsed_time": "0:50:50", "remaining_time": "3:43:53", "throughput": 2349.11, "total_tokens": 7165824} {"current_steps": 12430, "total_steps": 67140, "loss": 0.6534, "lr": 4.890453865319896e-05, "epoch": 1.8513553768245457, "percentage": 18.51, "elapsed_time": "0:50:51", "remaining_time": "3:43:51", "throughput": 2349.14, "total_tokens": 7168544} {"current_steps": 12435, "total_steps": 67140, "loss": 0.706, "lr": 4.890263515068367e-05, "epoch": 1.8521000893655049, "percentage": 18.52, "elapsed_time": "0:50:52", "remaining_time": "3:43:49", "throughput": 2349.16, "total_tokens": 7171200} {"current_steps": 12440, "total_steps": 67140, "loss": 0.6648, "lr": 4.890073003292547e-05, "epoch": 1.852844801906464, "percentage": 18.53, "elapsed_time": "0:50:53", "remaining_time": "3:43:47", "throughput": 2349.21, "total_tokens": 7173952} {"current_steps": 12445, "total_steps": 67140, "loss": 0.7896, "lr": 4.8898823300053124e-05, "epoch": 1.8535895144474233, "percentage": 18.54, "elapsed_time": "0:50:54", "remaining_time": "3:43:46", "throughput": 2349.25, "total_tokens": 7176704} {"current_steps": 12450, "total_steps": 67140, "loss": 0.6459, "lr": 4.889691495219545e-05, "epoch": 1.8543342269883825, "percentage": 18.54, "elapsed_time": "0:50:56", "remaining_time": "3:43:44", "throughput": 2349.31, "total_tokens": 7179552} {"current_steps": 12455, "total_steps": 67140, "loss": 0.6855, "lr": 4.889500498948143e-05, "epoch": 1.8550789395293417, "percentage": 18.55, "elapsed_time": "0:50:57", "remaining_time": "3:43:42", "throughput": 2349.34, "total_tokens": 7182240} {"current_steps": 12460, "total_steps": 67140, "loss": 0.7496, "lr": 4.8893093412040114e-05, "epoch": 1.8558236520703009, "percentage": 18.56, "elapsed_time": "0:50:58", "remaining_time": "3:43:40", "throughput": 2349.38, "total_tokens": 7184960} {"current_steps": 12465, "total_steps": 67140, "loss": 0.6549, "lr": 4.8891180220000696e-05, "epoch": 1.85656836461126, "percentage": 18.57, "elapsed_time": "0:50:59", "remaining_time": "3:43:39", "throughput": 2349.43, "total_tokens": 7187808} {"current_steps": 12470, "total_steps": 67140, "loss": 0.6359, "lr": 4.8889265413492446e-05, "epoch": 1.8573130771522193, "percentage": 18.57, "elapsed_time": "0:51:00", "remaining_time": "3:43:37", "throughput": 2349.48, "total_tokens": 7190592} {"current_steps": 12475, "total_steps": 67140, "loss": 0.7245, "lr": 4.888734899264477e-05, "epoch": 1.8580577896931785, "percentage": 18.58, "elapsed_time": "0:51:01", "remaining_time": "3:43:35", "throughput": 2349.53, "total_tokens": 7193408} {"current_steps": 12480, "total_steps": 67140, "loss": 0.9183, "lr": 4.888543095758717e-05, "epoch": 1.8588025022341377, "percentage": 18.59, "elapsed_time": "0:51:02", "remaining_time": "3:43:34", "throughput": 2349.61, "total_tokens": 7196384} {"current_steps": 12485, "total_steps": 67140, "loss": 0.6707, "lr": 4.888351130844926e-05, "epoch": 1.8595472147750969, "percentage": 18.6, "elapsed_time": "0:51:03", "remaining_time": "3:43:32", "throughput": 2349.65, "total_tokens": 7199168} {"current_steps": 12490, "total_steps": 67140, "loss": 0.7659, "lr": 4.8881590045360744e-05, "epoch": 1.860291927316056, "percentage": 18.6, "elapsed_time": "0:51:05", "remaining_time": "3:43:31", "throughput": 2349.75, "total_tokens": 7202208} {"current_steps": 12495, "total_steps": 67140, "loss": 0.665, "lr": 4.8879667168451484e-05, "epoch": 1.8610366398570153, "percentage": 18.61, "elapsed_time": "0:51:06", "remaining_time": "3:43:29", "throughput": 2349.78, "total_tokens": 7204864} {"current_steps": 12500, "total_steps": 67140, "loss": 0.5994, "lr": 4.88777426778514e-05, "epoch": 1.8617813523979745, "percentage": 18.62, "elapsed_time": "0:51:07", "remaining_time": "3:43:27", "throughput": 2349.82, "total_tokens": 7207616} {"current_steps": 12505, "total_steps": 67140, "loss": 0.6626, "lr": 4.8875816573690544e-05, "epoch": 1.8625260649389337, "percentage": 18.63, "elapsed_time": "0:51:08", "remaining_time": "3:43:26", "throughput": 2349.89, "total_tokens": 7210496} {"current_steps": 12510, "total_steps": 67140, "loss": 0.6587, "lr": 4.887388885609907e-05, "epoch": 1.863270777479893, "percentage": 18.63, "elapsed_time": "0:51:09", "remaining_time": "3:43:24", "throughput": 2349.94, "total_tokens": 7213280} {"current_steps": 12515, "total_steps": 67140, "loss": 0.752, "lr": 4.887195952520726e-05, "epoch": 1.864015490020852, "percentage": 18.64, "elapsed_time": "0:51:10", "remaining_time": "3:43:22", "throughput": 2350.03, "total_tokens": 7216256} {"current_steps": 12520, "total_steps": 67140, "loss": 0.6577, "lr": 4.887002858114548e-05, "epoch": 1.8647602025618113, "percentage": 18.65, "elapsed_time": "0:51:11", "remaining_time": "3:43:21", "throughput": 2350.08, "total_tokens": 7219040} {"current_steps": 12525, "total_steps": 67140, "loss": 0.7554, "lr": 4.886809602404422e-05, "epoch": 1.8655049151027703, "percentage": 18.66, "elapsed_time": "0:51:12", "remaining_time": "3:43:19", "throughput": 2350.13, "total_tokens": 7221824} {"current_steps": 12530, "total_steps": 67140, "loss": 0.7264, "lr": 4.8866161854034064e-05, "epoch": 1.8662496276437295, "percentage": 18.66, "elapsed_time": "0:51:14", "remaining_time": "3:43:18", "throughput": 2350.21, "total_tokens": 7224832} {"current_steps": 12535, "total_steps": 67140, "loss": 0.684, "lr": 4.886422607124572e-05, "epoch": 1.8669943401846887, "percentage": 18.67, "elapsed_time": "0:51:15", "remaining_time": "3:43:16", "throughput": 2350.31, "total_tokens": 7227840} {"current_steps": 12540, "total_steps": 67140, "loss": 0.6792, "lr": 4.886228867581002e-05, "epoch": 1.8677390527256479, "percentage": 18.68, "elapsed_time": "0:51:16", "remaining_time": "3:43:15", "throughput": 2350.45, "total_tokens": 7231040} {"current_steps": 12545, "total_steps": 67140, "loss": 0.9234, "lr": 4.886034966785785e-05, "epoch": 1.868483765266607, "percentage": 18.68, "elapsed_time": "0:51:17", "remaining_time": "3:43:13", "throughput": 2350.51, "total_tokens": 7233888} {"current_steps": 12550, "total_steps": 67140, "loss": 0.8704, "lr": 4.8858409047520274e-05, "epoch": 1.8692284778075663, "percentage": 18.69, "elapsed_time": "0:51:18", "remaining_time": "3:43:11", "throughput": 2350.51, "total_tokens": 7236480} {"current_steps": 12555, "total_steps": 67140, "loss": 0.6307, "lr": 4.88564668149284e-05, "epoch": 1.8699731903485255, "percentage": 18.7, "elapsed_time": "0:51:19", "remaining_time": "3:43:10", "throughput": 2350.6, "total_tokens": 7239456} {"current_steps": 12560, "total_steps": 67140, "loss": 0.578, "lr": 4.88545229702135e-05, "epoch": 1.8707179028894847, "percentage": 18.71, "elapsed_time": "0:51:21", "remaining_time": "3:43:08", "throughput": 2350.78, "total_tokens": 7242848} {"current_steps": 12565, "total_steps": 67140, "loss": 0.609, "lr": 4.8852577513506925e-05, "epoch": 1.871462615430444, "percentage": 18.71, "elapsed_time": "0:51:22", "remaining_time": "3:43:07", "throughput": 2350.84, "total_tokens": 7245664} {"current_steps": 12570, "total_steps": 67140, "loss": 0.4935, "lr": 4.885063044494014e-05, "epoch": 1.8722073279714029, "percentage": 18.72, "elapsed_time": "0:51:23", "remaining_time": "3:43:05", "throughput": 2350.84, "total_tokens": 7248224} {"current_steps": 12575, "total_steps": 67140, "loss": 0.6424, "lr": 4.884868176464471e-05, "epoch": 1.872952040512362, "percentage": 18.73, "elapsed_time": "0:51:24", "remaining_time": "3:43:03", "throughput": 2350.88, "total_tokens": 7251008} {"current_steps": 12580, "total_steps": 67140, "loss": 0.6687, "lr": 4.8846731472752336e-05, "epoch": 1.8736967530533213, "percentage": 18.74, "elapsed_time": "0:51:25", "remaining_time": "3:43:02", "throughput": 2350.98, "total_tokens": 7253984} {"current_steps": 12585, "total_steps": 67140, "loss": 0.7556, "lr": 4.8844779569394805e-05, "epoch": 1.8744414655942805, "percentage": 18.74, "elapsed_time": "0:51:26", "remaining_time": "3:43:00", "throughput": 2351.03, "total_tokens": 7256736} {"current_steps": 12590, "total_steps": 67140, "loss": 0.648, "lr": 4.884282605470401e-05, "epoch": 1.8751861781352397, "percentage": 18.75, "elapsed_time": "0:51:27", "remaining_time": "3:42:58", "throughput": 2351.06, "total_tokens": 7259424} {"current_steps": 12595, "total_steps": 67140, "loss": 0.7722, "lr": 4.8840870928811966e-05, "epoch": 1.875930890676199, "percentage": 18.76, "elapsed_time": "0:51:28", "remaining_time": "3:42:56", "throughput": 2351.11, "total_tokens": 7262240} {"current_steps": 12600, "total_steps": 67140, "loss": 0.5703, "lr": 4.8838914191850804e-05, "epoch": 1.876675603217158, "percentage": 18.77, "elapsed_time": "0:51:29", "remaining_time": "3:42:54", "throughput": 2351.1, "total_tokens": 7264736} {"current_steps": 12605, "total_steps": 67140, "loss": 0.627, "lr": 4.883695584395274e-05, "epoch": 1.8774203157581173, "percentage": 18.77, "elapsed_time": "0:51:31", "remaining_time": "3:42:53", "throughput": 2351.13, "total_tokens": 7267488} {"current_steps": 12610, "total_steps": 67140, "loss": 0.5572, "lr": 4.883499588525011e-05, "epoch": 1.8781650282990765, "percentage": 18.78, "elapsed_time": "0:51:32", "remaining_time": "3:42:51", "throughput": 2351.17, "total_tokens": 7270240} {"current_steps": 12615, "total_steps": 67140, "loss": 0.698, "lr": 4.883303431587536e-05, "epoch": 1.8789097408400357, "percentage": 18.79, "elapsed_time": "0:51:33", "remaining_time": "3:42:50", "throughput": 2351.26, "total_tokens": 7273216} {"current_steps": 12620, "total_steps": 67140, "loss": 0.6784, "lr": 4.883107113596106e-05, "epoch": 1.879654453380995, "percentage": 18.8, "elapsed_time": "0:51:34", "remaining_time": "3:42:48", "throughput": 2351.27, "total_tokens": 7275808} {"current_steps": 12625, "total_steps": 67140, "loss": 0.718, "lr": 4.882910634563985e-05, "epoch": 1.880399165921954, "percentage": 18.8, "elapsed_time": "0:51:35", "remaining_time": "3:42:46", "throughput": 2351.34, "total_tokens": 7278688} {"current_steps": 12630, "total_steps": 67140, "loss": 0.7048, "lr": 4.882713994504453e-05, "epoch": 1.8811438784629133, "percentage": 18.81, "elapsed_time": "0:51:36", "remaining_time": "3:42:45", "throughput": 2351.49, "total_tokens": 7281984} {"current_steps": 12635, "total_steps": 67140, "loss": 0.601, "lr": 4.882517193430796e-05, "epoch": 1.8818885910038725, "percentage": 18.82, "elapsed_time": "0:51:37", "remaining_time": "3:42:43", "throughput": 2351.58, "total_tokens": 7284992} {"current_steps": 12640, "total_steps": 67140, "loss": 0.6365, "lr": 4.882320231356313e-05, "epoch": 1.8826333035448317, "percentage": 18.83, "elapsed_time": "0:51:39", "remaining_time": "3:42:42", "throughput": 2351.65, "total_tokens": 7287872} {"current_steps": 12645, "total_steps": 67140, "loss": 0.7457, "lr": 4.882123108294316e-05, "epoch": 1.883378016085791, "percentage": 18.83, "elapsed_time": "0:51:40", "remaining_time": "3:42:40", "throughput": 2351.71, "total_tokens": 7290688} {"current_steps": 12650, "total_steps": 67140, "loss": 0.5593, "lr": 4.881925824258123e-05, "epoch": 1.8841227286267501, "percentage": 18.84, "elapsed_time": "0:51:41", "remaining_time": "3:42:38", "throughput": 2351.77, "total_tokens": 7293504} {"current_steps": 12655, "total_steps": 67140, "loss": 0.5778, "lr": 4.881728379261068e-05, "epoch": 1.8848674411677093, "percentage": 18.85, "elapsed_time": "0:51:42", "remaining_time": "3:42:37", "throughput": 2351.84, "total_tokens": 7296384} {"current_steps": 12660, "total_steps": 67140, "loss": 0.685, "lr": 4.881530773316492e-05, "epoch": 1.8856121537086685, "percentage": 18.86, "elapsed_time": "0:51:43", "remaining_time": "3:42:35", "throughput": 2351.96, "total_tokens": 7299520} {"current_steps": 12665, "total_steps": 67140, "loss": 0.6946, "lr": 4.881333006437749e-05, "epoch": 1.8863568662496277, "percentage": 18.86, "elapsed_time": "0:51:44", "remaining_time": "3:42:34", "throughput": 2351.98, "total_tokens": 7302240} {"current_steps": 12670, "total_steps": 67140, "loss": 0.6581, "lr": 4.881135078638203e-05, "epoch": 1.887101578790587, "percentage": 18.87, "elapsed_time": "0:51:45", "remaining_time": "3:42:32", "throughput": 2352.08, "total_tokens": 7305312} {"current_steps": 12675, "total_steps": 67140, "loss": 0.7379, "lr": 4.88093698993123e-05, "epoch": 1.8878462913315461, "percentage": 18.88, "elapsed_time": "0:51:47", "remaining_time": "3:42:31", "throughput": 2352.13, "total_tokens": 7308192} {"current_steps": 12680, "total_steps": 67140, "loss": 0.5132, "lr": 4.880738740330215e-05, "epoch": 1.8885910038725053, "percentage": 18.89, "elapsed_time": "0:51:48", "remaining_time": "3:42:29", "throughput": 2352.17, "total_tokens": 7310944} {"current_steps": 12685, "total_steps": 67140, "loss": 0.7966, "lr": 4.8805403298485554e-05, "epoch": 1.8893357164134645, "percentage": 18.89, "elapsed_time": "0:51:49", "remaining_time": "3:42:27", "throughput": 2352.25, "total_tokens": 7313856} {"current_steps": 12690, "total_steps": 67140, "loss": 0.7889, "lr": 4.8803417584996584e-05, "epoch": 1.8900804289544237, "percentage": 18.9, "elapsed_time": "0:51:50", "remaining_time": "3:42:26", "throughput": 2352.29, "total_tokens": 7316608} {"current_steps": 12695, "total_steps": 67140, "loss": 0.6655, "lr": 4.880143026296944e-05, "epoch": 1.890825141495383, "percentage": 18.91, "elapsed_time": "0:51:51", "remaining_time": "3:42:24", "throughput": 2352.38, "total_tokens": 7319648} {"current_steps": 12700, "total_steps": 67140, "loss": 0.7201, "lr": 4.87994413325384e-05, "epoch": 1.891569854036342, "percentage": 18.92, "elapsed_time": "0:51:52", "remaining_time": "3:42:22", "throughput": 2352.42, "total_tokens": 7322368} {"current_steps": 12705, "total_steps": 67140, "loss": 0.7234, "lr": 4.879745079383789e-05, "epoch": 1.8923145665773011, "percentage": 18.92, "elapsed_time": "0:51:53", "remaining_time": "3:42:21", "throughput": 2352.52, "total_tokens": 7325376} {"current_steps": 12710, "total_steps": 67140, "loss": 0.7197, "lr": 4.879545864700239e-05, "epoch": 1.8930592791182603, "percentage": 18.93, "elapsed_time": "0:51:54", "remaining_time": "3:42:19", "throughput": 2352.55, "total_tokens": 7328096} {"current_steps": 12715, "total_steps": 67140, "loss": 0.5726, "lr": 4.879346489216655e-05, "epoch": 1.8938039916592195, "percentage": 18.94, "elapsed_time": "0:51:56", "remaining_time": "3:42:17", "throughput": 2352.58, "total_tokens": 7330816} {"current_steps": 12720, "total_steps": 67140, "loss": 0.6222, "lr": 4.8791469529465087e-05, "epoch": 1.8945487042001787, "percentage": 18.95, "elapsed_time": "0:51:57", "remaining_time": "3:42:16", "throughput": 2352.61, "total_tokens": 7333504} {"current_steps": 12725, "total_steps": 67140, "loss": 0.7494, "lr": 4.878947255903284e-05, "epoch": 1.895293416741138, "percentage": 18.95, "elapsed_time": "0:51:58", "remaining_time": "3:42:14", "throughput": 2352.69, "total_tokens": 7336480} {"current_steps": 12730, "total_steps": 67140, "loss": 0.7391, "lr": 4.878747398100477e-05, "epoch": 1.8960381292820971, "percentage": 18.96, "elapsed_time": "0:51:59", "remaining_time": "3:42:13", "throughput": 2352.82, "total_tokens": 7339648} {"current_steps": 12735, "total_steps": 67140, "loss": 0.6228, "lr": 4.878547379551591e-05, "epoch": 1.8967828418230563, "percentage": 18.97, "elapsed_time": "0:52:00", "remaining_time": "3:42:11", "throughput": 2352.9, "total_tokens": 7342592} {"current_steps": 12740, "total_steps": 67140, "loss": 0.6298, "lr": 4.8783472002701434e-05, "epoch": 1.8975275543640155, "percentage": 18.98, "elapsed_time": "0:52:01", "remaining_time": "3:42:10", "throughput": 2352.97, "total_tokens": 7345536} {"current_steps": 12745, "total_steps": 67140, "loss": 0.6215, "lr": 4.8781468602696623e-05, "epoch": 1.8982722669049745, "percentage": 18.98, "elapsed_time": "0:52:02", "remaining_time": "3:42:08", "throughput": 2352.99, "total_tokens": 7348160} {"current_steps": 12750, "total_steps": 67140, "loss": 0.6134, "lr": 4.8779463595636857e-05, "epoch": 1.8990169794459337, "percentage": 18.99, "elapsed_time": "0:52:04", "remaining_time": "3:42:06", "throughput": 2353.08, "total_tokens": 7351136} {"current_steps": 12755, "total_steps": 67140, "loss": 0.7883, "lr": 4.877745698165761e-05, "epoch": 1.899761691986893, "percentage": 19.0, "elapsed_time": "0:52:05", "remaining_time": "3:42:05", "throughput": 2353.2, "total_tokens": 7354272} {"current_steps": 12760, "total_steps": 67140, "loss": 0.856, "lr": 4.87754487608945e-05, "epoch": 1.9005064045278521, "percentage": 19.01, "elapsed_time": "0:52:06", "remaining_time": "3:42:03", "throughput": 2353.25, "total_tokens": 7357056} {"current_steps": 12765, "total_steps": 67140, "loss": 0.7011, "lr": 4.8773438933483224e-05, "epoch": 1.9012511170688113, "percentage": 19.01, "elapsed_time": "0:52:07", "remaining_time": "3:42:02", "throughput": 2353.32, "total_tokens": 7359904} {"current_steps": 12770, "total_steps": 67140, "loss": 0.8142, "lr": 4.8771427499559594e-05, "epoch": 1.9019958296097705, "percentage": 19.02, "elapsed_time": "0:52:08", "remaining_time": "3:42:00", "throughput": 2353.37, "total_tokens": 7362720} {"current_steps": 12775, "total_steps": 67140, "loss": 0.7328, "lr": 4.8769414459259556e-05, "epoch": 1.9027405421507297, "percentage": 19.03, "elapsed_time": "0:52:09", "remaining_time": "3:41:58", "throughput": 2353.47, "total_tokens": 7365696} {"current_steps": 12780, "total_steps": 67140, "loss": 0.5328, "lr": 4.8767399812719115e-05, "epoch": 1.903485254691689, "percentage": 19.03, "elapsed_time": "0:52:10", "remaining_time": "3:41:57", "throughput": 2353.52, "total_tokens": 7368544} {"current_steps": 12785, "total_steps": 67140, "loss": 0.727, "lr": 4.876538356007443e-05, "epoch": 1.9042299672326481, "percentage": 19.04, "elapsed_time": "0:52:12", "remaining_time": "3:41:55", "throughput": 2353.61, "total_tokens": 7371520} {"current_steps": 12790, "total_steps": 67140, "loss": 0.6126, "lr": 4.876336570146175e-05, "epoch": 1.9049746797736073, "percentage": 19.05, "elapsed_time": "0:52:13", "remaining_time": "3:41:53", "throughput": 2353.66, "total_tokens": 7374304} {"current_steps": 12795, "total_steps": 67140, "loss": 0.8151, "lr": 4.876134623701743e-05, "epoch": 1.9057193923145666, "percentage": 19.06, "elapsed_time": "0:52:14", "remaining_time": "3:41:52", "throughput": 2353.75, "total_tokens": 7377280} {"current_steps": 12800, "total_steps": 67140, "loss": 0.5762, "lr": 4.875932516687793e-05, "epoch": 1.9064641048555258, "percentage": 19.06, "elapsed_time": "0:52:15", "remaining_time": "3:41:50", "throughput": 2353.82, "total_tokens": 7380192} {"current_steps": 12805, "total_steps": 67140, "loss": 0.7251, "lr": 4.8757302491179844e-05, "epoch": 1.907208817396485, "percentage": 19.07, "elapsed_time": "0:52:16", "remaining_time": "3:41:49", "throughput": 2353.86, "total_tokens": 7382976} {"current_steps": 12810, "total_steps": 67140, "loss": 0.5357, "lr": 4.8755278210059845e-05, "epoch": 1.9079535299374442, "percentage": 19.08, "elapsed_time": "0:52:17", "remaining_time": "3:41:47", "throughput": 2353.88, "total_tokens": 7385696} {"current_steps": 12815, "total_steps": 67140, "loss": 0.556, "lr": 4.8753252323654726e-05, "epoch": 1.9086982424784034, "percentage": 19.09, "elapsed_time": "0:52:18", "remaining_time": "3:41:45", "throughput": 2353.96, "total_tokens": 7388640} {"current_steps": 12820, "total_steps": 67140, "loss": 0.7846, "lr": 4.8751224832101383e-05, "epoch": 1.9094429550193626, "percentage": 19.09, "elapsed_time": "0:52:19", "remaining_time": "3:41:44", "throughput": 2354.02, "total_tokens": 7391488} {"current_steps": 12825, "total_steps": 67140, "loss": 0.6705, "lr": 4.874919573553683e-05, "epoch": 1.9101876675603218, "percentage": 19.1, "elapsed_time": "0:52:21", "remaining_time": "3:41:42", "throughput": 2354.02, "total_tokens": 7394080} {"current_steps": 12830, "total_steps": 67140, "loss": 0.7748, "lr": 4.8747165034098196e-05, "epoch": 1.910932380101281, "percentage": 19.11, "elapsed_time": "0:52:22", "remaining_time": "3:41:40", "throughput": 2354.02, "total_tokens": 7396672} {"current_steps": 12835, "total_steps": 67140, "loss": 0.7142, "lr": 4.8745132727922696e-05, "epoch": 1.9116770926422402, "percentage": 19.12, "elapsed_time": "0:52:23", "remaining_time": "3:41:39", "throughput": 2354.08, "total_tokens": 7399488} {"current_steps": 12840, "total_steps": 67140, "loss": 0.6368, "lr": 4.874309881714766e-05, "epoch": 1.9124218051831994, "percentage": 19.12, "elapsed_time": "0:52:24", "remaining_time": "3:41:37", "throughput": 2354.17, "total_tokens": 7402496} {"current_steps": 12845, "total_steps": 67140, "loss": 0.7365, "lr": 4.874106330191055e-05, "epoch": 1.9131665177241586, "percentage": 19.13, "elapsed_time": "0:52:25", "remaining_time": "3:41:36", "throughput": 2354.19, "total_tokens": 7405216} {"current_steps": 12850, "total_steps": 67140, "loss": 0.7696, "lr": 4.8739026182348894e-05, "epoch": 1.9139112302651178, "percentage": 19.14, "elapsed_time": "0:52:26", "remaining_time": "3:41:34", "throughput": 2354.29, "total_tokens": 7408288} {"current_steps": 12855, "total_steps": 67140, "loss": 0.5189, "lr": 4.873698745860037e-05, "epoch": 1.914655942806077, "percentage": 19.15, "elapsed_time": "0:52:27", "remaining_time": "3:41:33", "throughput": 2354.42, "total_tokens": 7411456} {"current_steps": 12860, "total_steps": 67140, "loss": 0.5725, "lr": 4.873494713080274e-05, "epoch": 1.9154006553470362, "percentage": 19.15, "elapsed_time": "0:52:29", "remaining_time": "3:41:31", "throughput": 2354.48, "total_tokens": 7414336} {"current_steps": 12865, "total_steps": 67140, "loss": 0.6353, "lr": 4.8732905199093884e-05, "epoch": 1.9161453678879954, "percentage": 19.16, "elapsed_time": "0:52:30", "remaining_time": "3:41:29", "throughput": 2354.54, "total_tokens": 7417152} {"current_steps": 12870, "total_steps": 67140, "loss": 0.5725, "lr": 4.873086166361178e-05, "epoch": 1.9168900804289544, "percentage": 19.17, "elapsed_time": "0:52:31", "remaining_time": "3:41:28", "throughput": 2354.61, "total_tokens": 7420096} {"current_steps": 12875, "total_steps": 67140, "loss": 0.6873, "lr": 4.872881652449453e-05, "epoch": 1.9176347929699136, "percentage": 19.18, "elapsed_time": "0:52:32", "remaining_time": "3:41:26", "throughput": 2354.68, "total_tokens": 7422976} {"current_steps": 12880, "total_steps": 67140, "loss": 0.7682, "lr": 4.872676978188033e-05, "epoch": 1.9183795055108728, "percentage": 19.18, "elapsed_time": "0:52:33", "remaining_time": "3:41:25", "throughput": 2354.8, "total_tokens": 7426112} {"current_steps": 12885, "total_steps": 67140, "loss": 0.5855, "lr": 4.8724721435907504e-05, "epoch": 1.919124218051832, "percentage": 19.19, "elapsed_time": "0:52:34", "remaining_time": "3:41:23", "throughput": 2354.86, "total_tokens": 7428960} {"current_steps": 12890, "total_steps": 67140, "loss": 0.6922, "lr": 4.8722671486714457e-05, "epoch": 1.9198689305927912, "percentage": 19.2, "elapsed_time": "0:52:35", "remaining_time": "3:41:21", "throughput": 2354.88, "total_tokens": 7431616} {"current_steps": 12895, "total_steps": 67140, "loss": 0.6286, "lr": 4.8720619934439715e-05, "epoch": 1.9206136431337504, "percentage": 19.21, "elapsed_time": "0:52:36", "remaining_time": "3:41:20", "throughput": 2354.91, "total_tokens": 7434304} {"current_steps": 12900, "total_steps": 67140, "loss": 0.5641, "lr": 4.871856677922193e-05, "epoch": 1.9213583556747096, "percentage": 19.21, "elapsed_time": "0:52:38", "remaining_time": "3:41:18", "throughput": 2354.97, "total_tokens": 7437120} {"current_steps": 12905, "total_steps": 67140, "loss": 0.8156, "lr": 4.8716512021199825e-05, "epoch": 1.9221030682156688, "percentage": 19.22, "elapsed_time": "0:52:39", "remaining_time": "3:41:17", "throughput": 2355.04, "total_tokens": 7440064} {"current_steps": 12910, "total_steps": 67140, "loss": 0.5724, "lr": 4.871445566051226e-05, "epoch": 1.922847780756628, "percentage": 19.23, "elapsed_time": "0:52:40", "remaining_time": "3:41:15", "throughput": 2355.09, "total_tokens": 7442880} {"current_steps": 12915, "total_steps": 67140, "loss": 0.5805, "lr": 4.8712397697298207e-05, "epoch": 1.923592493297587, "percentage": 19.24, "elapsed_time": "0:52:41", "remaining_time": "3:41:13", "throughput": 2355.16, "total_tokens": 7445792} {"current_steps": 12920, "total_steps": 67140, "loss": 0.6375, "lr": 4.871033813169672e-05, "epoch": 1.9243372058385462, "percentage": 19.24, "elapsed_time": "0:52:42", "remaining_time": "3:41:12", "throughput": 2355.29, "total_tokens": 7448960} {"current_steps": 12925, "total_steps": 67140, "loss": 0.7613, "lr": 4.870827696384698e-05, "epoch": 1.9250819183795054, "percentage": 19.25, "elapsed_time": "0:52:43", "remaining_time": "3:41:10", "throughput": 2355.37, "total_tokens": 7451840} {"current_steps": 12930, "total_steps": 67140, "loss": 0.7634, "lr": 4.870621419388828e-05, "epoch": 1.9258266309204646, "percentage": 19.26, "elapsed_time": "0:52:44", "remaining_time": "3:41:08", "throughput": 2355.4, "total_tokens": 7454560} {"current_steps": 12935, "total_steps": 67140, "loss": 0.9322, "lr": 4.870414982196e-05, "epoch": 1.9265713434614238, "percentage": 19.27, "elapsed_time": "0:52:45", "remaining_time": "3:41:07", "throughput": 2355.45, "total_tokens": 7457344} {"current_steps": 12940, "total_steps": 67140, "loss": 0.8243, "lr": 4.870208384820165e-05, "epoch": 1.927316056002383, "percentage": 19.27, "elapsed_time": "0:52:47", "remaining_time": "3:41:05", "throughput": 2355.5, "total_tokens": 7460128} {"current_steps": 12945, "total_steps": 67140, "loss": 0.5692, "lr": 4.8700016272752844e-05, "epoch": 1.9280607685433422, "percentage": 19.28, "elapsed_time": "0:52:48", "remaining_time": "3:41:04", "throughput": 2355.57, "total_tokens": 7463072} {"current_steps": 12950, "total_steps": 67140, "loss": 0.8275, "lr": 4.869794709575329e-05, "epoch": 1.9288054810843014, "percentage": 19.29, "elapsed_time": "0:52:49", "remaining_time": "3:41:02", "throughput": 2355.66, "total_tokens": 7466048} {"current_steps": 12955, "total_steps": 67140, "loss": 0.7504, "lr": 4.869587631734282e-05, "epoch": 1.9295501936252606, "percentage": 19.3, "elapsed_time": "0:52:50", "remaining_time": "3:41:01", "throughput": 2355.76, "total_tokens": 7469152} {"current_steps": 12960, "total_steps": 67140, "loss": 0.5435, "lr": 4.869380393766137e-05, "epoch": 1.9302949061662198, "percentage": 19.3, "elapsed_time": "0:52:51", "remaining_time": "3:40:59", "throughput": 2355.78, "total_tokens": 7471776} {"current_steps": 12965, "total_steps": 67140, "loss": 0.5739, "lr": 4.8691729956848986e-05, "epoch": 1.931039618707179, "percentage": 19.31, "elapsed_time": "0:52:52", "remaining_time": "3:40:57", "throughput": 2355.83, "total_tokens": 7474656} {"current_steps": 12970, "total_steps": 67140, "loss": 0.6463, "lr": 4.868965437504581e-05, "epoch": 1.9317843312481382, "percentage": 19.32, "elapsed_time": "0:52:53", "remaining_time": "3:40:56", "throughput": 2355.95, "total_tokens": 7477760} {"current_steps": 12975, "total_steps": 67140, "loss": 0.7572, "lr": 4.868757719239211e-05, "epoch": 1.9325290437890974, "percentage": 19.33, "elapsed_time": "0:52:55", "remaining_time": "3:40:54", "throughput": 2355.97, "total_tokens": 7480416} {"current_steps": 12980, "total_steps": 67140, "loss": 0.7319, "lr": 4.8685498409028254e-05, "epoch": 1.9332737563300566, "percentage": 19.33, "elapsed_time": "0:52:56", "remaining_time": "3:40:53", "throughput": 2356.0, "total_tokens": 7483168} {"current_steps": 12985, "total_steps": 67140, "loss": 0.7626, "lr": 4.8683418025094704e-05, "epoch": 1.9340184688710158, "percentage": 19.34, "elapsed_time": "0:52:57", "remaining_time": "3:40:51", "throughput": 2356.09, "total_tokens": 7486144} {"current_steps": 12990, "total_steps": 67140, "loss": 0.7374, "lr": 4.8681336040732055e-05, "epoch": 1.934763181411975, "percentage": 19.35, "elapsed_time": "0:52:58", "remaining_time": "3:40:49", "throughput": 2356.15, "total_tokens": 7489024} {"current_steps": 12995, "total_steps": 67140, "loss": 0.6741, "lr": 4.8679252456081e-05, "epoch": 1.9355078939529342, "percentage": 19.36, "elapsed_time": "0:52:59", "remaining_time": "3:40:48", "throughput": 2356.16, "total_tokens": 7491648} {"current_steps": 13000, "total_steps": 67140, "loss": 0.6416, "lr": 4.8677167271282344e-05, "epoch": 1.9362526064938934, "percentage": 19.36, "elapsed_time": "0:53:00", "remaining_time": "3:40:46", "throughput": 2356.23, "total_tokens": 7494560} {"current_steps": 13005, "total_steps": 67140, "loss": 0.6761, "lr": 4.867508048647698e-05, "epoch": 1.9369973190348526, "percentage": 19.37, "elapsed_time": "0:53:01", "remaining_time": "3:40:44", "throughput": 2356.26, "total_tokens": 7497312} {"current_steps": 13010, "total_steps": 67140, "loss": 0.6891, "lr": 4.867299210180593e-05, "epoch": 1.9377420315758118, "percentage": 19.38, "elapsed_time": "0:53:03", "remaining_time": "3:40:43", "throughput": 2356.36, "total_tokens": 7500352} {"current_steps": 13015, "total_steps": 67140, "loss": 0.7064, "lr": 4.867090211741033e-05, "epoch": 1.938486744116771, "percentage": 19.38, "elapsed_time": "0:53:04", "remaining_time": "3:40:42", "throughput": 2356.49, "total_tokens": 7503552} {"current_steps": 13020, "total_steps": 67140, "loss": 0.7506, "lr": 4.86688105334314e-05, "epoch": 1.9392314566577302, "percentage": 19.39, "elapsed_time": "0:53:05", "remaining_time": "3:40:40", "throughput": 2356.57, "total_tokens": 7506528} {"current_steps": 13025, "total_steps": 67140, "loss": 0.541, "lr": 4.866671735001048e-05, "epoch": 1.9399761691986894, "percentage": 19.4, "elapsed_time": "0:53:06", "remaining_time": "3:40:38", "throughput": 2356.58, "total_tokens": 7509120} {"current_steps": 13030, "total_steps": 67140, "loss": 0.5798, "lr": 4.866462256728902e-05, "epoch": 1.9407208817396486, "percentage": 19.41, "elapsed_time": "0:53:07", "remaining_time": "3:40:37", "throughput": 2356.69, "total_tokens": 7512224} {"current_steps": 13035, "total_steps": 67140, "loss": 0.7413, "lr": 4.8662526185408595e-05, "epoch": 1.9414655942806078, "percentage": 19.41, "elapsed_time": "0:53:08", "remaining_time": "3:40:35", "throughput": 2356.71, "total_tokens": 7514880} {"current_steps": 13040, "total_steps": 67140, "loss": 0.7985, "lr": 4.866042820451084e-05, "epoch": 1.942210306821567, "percentage": 19.42, "elapsed_time": "0:53:09", "remaining_time": "3:40:34", "throughput": 2356.84, "total_tokens": 7518080} {"current_steps": 13045, "total_steps": 67140, "loss": 0.6066, "lr": 4.865832862473756e-05, "epoch": 1.942955019362526, "percentage": 19.43, "elapsed_time": "0:53:11", "remaining_time": "3:40:32", "throughput": 2356.91, "total_tokens": 7520992} {"current_steps": 13050, "total_steps": 67140, "loss": 0.7592, "lr": 4.865622744623061e-05, "epoch": 1.9436997319034852, "percentage": 19.44, "elapsed_time": "0:53:12", "remaining_time": "3:40:30", "throughput": 2356.9, "total_tokens": 7523520} {"current_steps": 13055, "total_steps": 67140, "loss": 0.6844, "lr": 4.8654124669131984e-05, "epoch": 1.9444444444444444, "percentage": 19.44, "elapsed_time": "0:53:13", "remaining_time": "3:40:29", "throughput": 2356.91, "total_tokens": 7526112} {"current_steps": 13060, "total_steps": 67140, "loss": 0.5784, "lr": 4.865202029358379e-05, "epoch": 1.9451891569854036, "percentage": 19.45, "elapsed_time": "0:53:14", "remaining_time": "3:40:27", "throughput": 2357.0, "total_tokens": 7529120} {"current_steps": 13065, "total_steps": 67140, "loss": 0.5941, "lr": 4.864991431972822e-05, "epoch": 1.9459338695263628, "percentage": 19.46, "elapsed_time": "0:53:15", "remaining_time": "3:40:25", "throughput": 2357.04, "total_tokens": 7531904} {"current_steps": 13070, "total_steps": 67140, "loss": 0.7548, "lr": 4.86478067477076e-05, "epoch": 1.946678582067322, "percentage": 19.47, "elapsed_time": "0:53:16", "remaining_time": "3:40:24", "throughput": 2357.09, "total_tokens": 7534656} {"current_steps": 13075, "total_steps": 67140, "loss": 0.5488, "lr": 4.8645697577664347e-05, "epoch": 1.9474232946082812, "percentage": 19.47, "elapsed_time": "0:53:17", "remaining_time": "3:40:22", "throughput": 2357.07, "total_tokens": 7537088} {"current_steps": 13080, "total_steps": 67140, "loss": 0.7888, "lr": 4.8643586809740985e-05, "epoch": 1.9481680071492404, "percentage": 19.48, "elapsed_time": "0:53:18", "remaining_time": "3:40:20", "throughput": 2357.08, "total_tokens": 7539712} {"current_steps": 13085, "total_steps": 67140, "loss": 0.6333, "lr": 4.864147444408015e-05, "epoch": 1.9489127196901996, "percentage": 19.49, "elapsed_time": "0:53:19", "remaining_time": "3:40:18", "throughput": 2357.14, "total_tokens": 7542528} {"current_steps": 13090, "total_steps": 67140, "loss": 0.7536, "lr": 4.86393604808246e-05, "epoch": 1.9496574322311586, "percentage": 19.5, "elapsed_time": "0:53:21", "remaining_time": "3:40:17", "throughput": 2357.21, "total_tokens": 7545440} {"current_steps": 13095, "total_steps": 67140, "loss": 0.5311, "lr": 4.8637244920117175e-05, "epoch": 1.9504021447721178, "percentage": 19.5, "elapsed_time": "0:53:22", "remaining_time": "3:40:15", "throughput": 2357.26, "total_tokens": 7548192} {"current_steps": 13100, "total_steps": 67140, "loss": 0.7892, "lr": 4.863512776210084e-05, "epoch": 1.951146857313077, "percentage": 19.51, "elapsed_time": "0:53:23", "remaining_time": "3:40:13", "throughput": 2357.28, "total_tokens": 7550880} {"current_steps": 13105, "total_steps": 67140, "loss": 0.6539, "lr": 4.8633009006918665e-05, "epoch": 1.9518915698540362, "percentage": 19.52, "elapsed_time": "0:53:24", "remaining_time": "3:40:12", "throughput": 2357.38, "total_tokens": 7553888} {"current_steps": 13110, "total_steps": 67140, "loss": 0.5117, "lr": 4.863088865471382e-05, "epoch": 1.9526362823949954, "percentage": 19.53, "elapsed_time": "0:53:25", "remaining_time": "3:40:10", "throughput": 2357.47, "total_tokens": 7556896} {"current_steps": 13115, "total_steps": 67140, "loss": 0.699, "lr": 4.8628766705629604e-05, "epoch": 1.9533809949359546, "percentage": 19.53, "elapsed_time": "0:53:26", "remaining_time": "3:40:09", "throughput": 2357.51, "total_tokens": 7559648} {"current_steps": 13120, "total_steps": 67140, "loss": 0.6128, "lr": 4.862664315980939e-05, "epoch": 1.9541257074769138, "percentage": 19.54, "elapsed_time": "0:53:27", "remaining_time": "3:40:07", "throughput": 2357.58, "total_tokens": 7562560} {"current_steps": 13125, "total_steps": 67140, "loss": 0.7685, "lr": 4.8624518017396706e-05, "epoch": 1.954870420017873, "percentage": 19.55, "elapsed_time": "0:53:28", "remaining_time": "3:40:06", "throughput": 2357.78, "total_tokens": 7566080} {"current_steps": 13130, "total_steps": 67140, "loss": 0.8422, "lr": 4.862239127853514e-05, "epoch": 1.9556151325588322, "percentage": 19.56, "elapsed_time": "0:53:30", "remaining_time": "3:40:04", "throughput": 2357.82, "total_tokens": 7568800} {"current_steps": 13135, "total_steps": 67140, "loss": 0.6193, "lr": 4.8620262943368405e-05, "epoch": 1.9563598450997914, "percentage": 19.56, "elapsed_time": "0:53:31", "remaining_time": "3:40:03", "throughput": 2357.9, "total_tokens": 7571776} {"current_steps": 13140, "total_steps": 67140, "loss": 0.6243, "lr": 4.861813301204034e-05, "epoch": 1.9571045576407506, "percentage": 19.57, "elapsed_time": "0:53:32", "remaining_time": "3:40:01", "throughput": 2357.92, "total_tokens": 7574432} {"current_steps": 13145, "total_steps": 67140, "loss": 0.5555, "lr": 4.861600148469487e-05, "epoch": 1.9578492701817098, "percentage": 19.58, "elapsed_time": "0:53:33", "remaining_time": "3:39:59", "throughput": 2358.0, "total_tokens": 7577408} {"current_steps": 13150, "total_steps": 67140, "loss": 0.7203, "lr": 4.861386836147603e-05, "epoch": 1.958593982722669, "percentage": 19.59, "elapsed_time": "0:53:34", "remaining_time": "3:39:58", "throughput": 2358.06, "total_tokens": 7580256} {"current_steps": 13155, "total_steps": 67140, "loss": 0.5946, "lr": 4.861173364252798e-05, "epoch": 1.9593386952636282, "percentage": 19.59, "elapsed_time": "0:53:35", "remaining_time": "3:39:56", "throughput": 2358.14, "total_tokens": 7583200} {"current_steps": 13160, "total_steps": 67140, "loss": 0.7359, "lr": 4.860959732799497e-05, "epoch": 1.9600834078045875, "percentage": 19.6, "elapsed_time": "0:53:36", "remaining_time": "3:39:54", "throughput": 2358.14, "total_tokens": 7585792} {"current_steps": 13165, "total_steps": 67140, "loss": 0.6763, "lr": 4.860745941802136e-05, "epoch": 1.9608281203455467, "percentage": 19.61, "elapsed_time": "0:53:37", "remaining_time": "3:39:53", "throughput": 2358.16, "total_tokens": 7588416} {"current_steps": 13170, "total_steps": 67140, "loss": 0.4456, "lr": 4.860531991275162e-05, "epoch": 1.9615728328865059, "percentage": 19.62, "elapsed_time": "0:53:39", "remaining_time": "3:39:51", "throughput": 2358.24, "total_tokens": 7591392} {"current_steps": 13175, "total_steps": 67140, "loss": 0.6438, "lr": 4.860317881233033e-05, "epoch": 1.962317545427465, "percentage": 19.62, "elapsed_time": "0:53:40", "remaining_time": "3:39:50", "throughput": 2358.35, "total_tokens": 7594496} {"current_steps": 13180, "total_steps": 67140, "loss": 0.7361, "lr": 4.8601036116902184e-05, "epoch": 1.9630622579684243, "percentage": 19.63, "elapsed_time": "0:53:41", "remaining_time": "3:39:48", "throughput": 2358.38, "total_tokens": 7597184} {"current_steps": 13185, "total_steps": 67140, "loss": 0.5812, "lr": 4.8598891826611974e-05, "epoch": 1.9638069705093835, "percentage": 19.64, "elapsed_time": "0:53:42", "remaining_time": "3:39:46", "throughput": 2358.44, "total_tokens": 7600096} {"current_steps": 13190, "total_steps": 67140, "loss": 0.6925, "lr": 4.85967459416046e-05, "epoch": 1.9645516830503427, "percentage": 19.65, "elapsed_time": "0:53:43", "remaining_time": "3:39:45", "throughput": 2358.5, "total_tokens": 7602976} {"current_steps": 13195, "total_steps": 67140, "loss": 0.5757, "lr": 4.859459846202507e-05, "epoch": 1.9652963955913019, "percentage": 19.65, "elapsed_time": "0:53:44", "remaining_time": "3:39:43", "throughput": 2358.51, "total_tokens": 7605600} {"current_steps": 13200, "total_steps": 67140, "loss": 0.6069, "lr": 4.859244938801851e-05, "epoch": 1.966041108132261, "percentage": 19.66, "elapsed_time": "0:53:45", "remaining_time": "3:39:42", "throughput": 2358.57, "total_tokens": 7608448} {"current_steps": 13205, "total_steps": 67140, "loss": 0.6389, "lr": 4.859029871973013e-05, "epoch": 1.9667858206732203, "percentage": 19.67, "elapsed_time": "0:53:47", "remaining_time": "3:39:40", "throughput": 2358.59, "total_tokens": 7611168} {"current_steps": 13210, "total_steps": 67140, "loss": 0.6381, "lr": 4.8588146457305284e-05, "epoch": 1.9675305332141795, "percentage": 19.68, "elapsed_time": "0:53:48", "remaining_time": "3:39:38", "throughput": 2358.68, "total_tokens": 7614144} {"current_steps": 13215, "total_steps": 67140, "loss": 0.6786, "lr": 4.85859926008894e-05, "epoch": 1.9682752457551387, "percentage": 19.68, "elapsed_time": "0:53:49", "remaining_time": "3:39:37", "throughput": 2358.71, "total_tokens": 7616896} {"current_steps": 13220, "total_steps": 67140, "loss": 0.687, "lr": 4.858383715062803e-05, "epoch": 1.9690199582960977, "percentage": 19.69, "elapsed_time": "0:53:50", "remaining_time": "3:39:35", "throughput": 2358.79, "total_tokens": 7619904} {"current_steps": 13225, "total_steps": 67140, "loss": 0.6532, "lr": 4.8581680106666827e-05, "epoch": 1.9697646708370569, "percentage": 19.7, "elapsed_time": "0:53:51", "remaining_time": "3:39:34", "throughput": 2358.83, "total_tokens": 7622720} {"current_steps": 13230, "total_steps": 67140, "loss": 0.837, "lr": 4.8579521469151555e-05, "epoch": 1.970509383378016, "percentage": 19.71, "elapsed_time": "0:53:52", "remaining_time": "3:39:32", "throughput": 2358.93, "total_tokens": 7625792} {"current_steps": 13235, "total_steps": 67140, "loss": 0.7435, "lr": 4.85773612382281e-05, "epoch": 1.9712540959189753, "percentage": 19.71, "elapsed_time": "0:53:53", "remaining_time": "3:39:31", "throughput": 2359.04, "total_tokens": 7628896} {"current_steps": 13240, "total_steps": 67140, "loss": 0.7677, "lr": 4.857519941404242e-05, "epoch": 1.9719988084599345, "percentage": 19.72, "elapsed_time": "0:53:55", "remaining_time": "3:39:29", "throughput": 2359.11, "total_tokens": 7631776} {"current_steps": 13245, "total_steps": 67140, "loss": 0.6554, "lr": 4.8573035996740626e-05, "epoch": 1.9727435210008937, "percentage": 19.73, "elapsed_time": "0:53:56", "remaining_time": "3:39:28", "throughput": 2359.19, "total_tokens": 7634688} {"current_steps": 13250, "total_steps": 67140, "loss": 0.6617, "lr": 4.8570870986468886e-05, "epoch": 1.9734882335418529, "percentage": 19.73, "elapsed_time": "0:53:57", "remaining_time": "3:39:26", "throughput": 2359.28, "total_tokens": 7637696} {"current_steps": 13255, "total_steps": 67140, "loss": 0.6718, "lr": 4.856870438337353e-05, "epoch": 1.974232946082812, "percentage": 19.74, "elapsed_time": "0:53:58", "remaining_time": "3:39:24", "throughput": 2359.3, "total_tokens": 7640384} {"current_steps": 13260, "total_steps": 67140, "loss": 0.73, "lr": 4.856653618760094e-05, "epoch": 1.974977658623771, "percentage": 19.75, "elapsed_time": "0:53:59", "remaining_time": "3:39:23", "throughput": 2359.39, "total_tokens": 7643360} {"current_steps": 13265, "total_steps": 67140, "loss": 0.6434, "lr": 4.8564366399297666e-05, "epoch": 1.9757223711647303, "percentage": 19.76, "elapsed_time": "0:54:00", "remaining_time": "3:39:21", "throughput": 2359.45, "total_tokens": 7646208} {"current_steps": 13270, "total_steps": 67140, "loss": 0.655, "lr": 4.856219501861031e-05, "epoch": 1.9764670837056895, "percentage": 19.76, "elapsed_time": "0:54:01", "remaining_time": "3:39:20", "throughput": 2359.51, "total_tokens": 7649024} {"current_steps": 13275, "total_steps": 67140, "loss": 0.5658, "lr": 4.8560022045685606e-05, "epoch": 1.9772117962466487, "percentage": 19.77, "elapsed_time": "0:54:02", "remaining_time": "3:39:18", "throughput": 2359.61, "total_tokens": 7652160} {"current_steps": 13280, "total_steps": 67140, "loss": 0.7768, "lr": 4.85578474806704e-05, "epoch": 1.9779565087876079, "percentage": 19.78, "elapsed_time": "0:54:04", "remaining_time": "3:39:17", "throughput": 2359.67, "total_tokens": 7655040} {"current_steps": 13285, "total_steps": 67140, "loss": 0.6906, "lr": 4.8555671323711646e-05, "epoch": 1.978701221328567, "percentage": 19.79, "elapsed_time": "0:54:05", "remaining_time": "3:39:15", "throughput": 2359.71, "total_tokens": 7657792} {"current_steps": 13290, "total_steps": 67140, "loss": 0.5647, "lr": 4.85534935749564e-05, "epoch": 1.9794459338695263, "percentage": 19.79, "elapsed_time": "0:54:06", "remaining_time": "3:39:14", "throughput": 2359.84, "total_tokens": 7660960} {"current_steps": 13295, "total_steps": 67140, "loss": 0.6887, "lr": 4.8551314234551814e-05, "epoch": 1.9801906464104855, "percentage": 19.8, "elapsed_time": "0:54:07", "remaining_time": "3:39:12", "throughput": 2359.93, "total_tokens": 7664000} {"current_steps": 13300, "total_steps": 67140, "loss": 0.549, "lr": 4.854913330264516e-05, "epoch": 1.9809353589514447, "percentage": 19.81, "elapsed_time": "0:54:08", "remaining_time": "3:39:11", "throughput": 2360.01, "total_tokens": 7666912} {"current_steps": 13305, "total_steps": 67140, "loss": 0.7194, "lr": 4.8546950779383825e-05, "epoch": 1.9816800714924039, "percentage": 19.82, "elapsed_time": "0:54:09", "remaining_time": "3:39:09", "throughput": 2360.03, "total_tokens": 7669568} {"current_steps": 13310, "total_steps": 67140, "loss": 0.7399, "lr": 4.854476666491529e-05, "epoch": 1.982424784033363, "percentage": 19.82, "elapsed_time": "0:54:10", "remaining_time": "3:39:07", "throughput": 2360.13, "total_tokens": 7672608} {"current_steps": 13315, "total_steps": 67140, "loss": 0.6878, "lr": 4.854258095938715e-05, "epoch": 1.9831694965743223, "percentage": 19.83, "elapsed_time": "0:54:12", "remaining_time": "3:39:06", "throughput": 2360.14, "total_tokens": 7675232} {"current_steps": 13320, "total_steps": 67140, "loss": 0.7111, "lr": 4.854039366294711e-05, "epoch": 1.9839142091152815, "percentage": 19.84, "elapsed_time": "0:54:13", "remaining_time": "3:39:04", "throughput": 2360.21, "total_tokens": 7678112} {"current_steps": 13325, "total_steps": 67140, "loss": 0.742, "lr": 4.853820477574297e-05, "epoch": 1.9846589216562407, "percentage": 19.85, "elapsed_time": "0:54:14", "remaining_time": "3:39:03", "throughput": 2360.29, "total_tokens": 7681152} {"current_steps": 13330, "total_steps": 67140, "loss": 0.593, "lr": 4.853601429792265e-05, "epoch": 1.9854036341972, "percentage": 19.85, "elapsed_time": "0:54:15", "remaining_time": "3:39:01", "throughput": 2360.31, "total_tokens": 7683808} {"current_steps": 13335, "total_steps": 67140, "loss": 0.6469, "lr": 4.853382222963418e-05, "epoch": 1.986148346738159, "percentage": 19.86, "elapsed_time": "0:54:16", "remaining_time": "3:38:59", "throughput": 2360.4, "total_tokens": 7686880} {"current_steps": 13340, "total_steps": 67140, "loss": 0.5515, "lr": 4.853162857102568e-05, "epoch": 1.9868930592791183, "percentage": 19.87, "elapsed_time": "0:54:17", "remaining_time": "3:38:58", "throughput": 2360.43, "total_tokens": 7689568} {"current_steps": 13345, "total_steps": 67140, "loss": 0.7373, "lr": 4.85294333222454e-05, "epoch": 1.9876377718200775, "percentage": 19.88, "elapsed_time": "0:54:18", "remaining_time": "3:38:56", "throughput": 2360.51, "total_tokens": 7692544} {"current_steps": 13350, "total_steps": 67140, "loss": 0.5704, "lr": 4.852723648344167e-05, "epoch": 1.9883824843610367, "percentage": 19.88, "elapsed_time": "0:54:19", "remaining_time": "3:38:55", "throughput": 2360.57, "total_tokens": 7695392} {"current_steps": 13355, "total_steps": 67140, "loss": 0.6886, "lr": 4.852503805476296e-05, "epoch": 1.989127196901996, "percentage": 19.89, "elapsed_time": "0:54:21", "remaining_time": "3:38:53", "throughput": 2360.64, "total_tokens": 7698336} {"current_steps": 13360, "total_steps": 67140, "loss": 0.6807, "lr": 4.852283803635782e-05, "epoch": 1.9898719094429551, "percentage": 19.9, "elapsed_time": "0:54:22", "remaining_time": "3:38:52", "throughput": 2360.7, "total_tokens": 7701216} {"current_steps": 13365, "total_steps": 67140, "loss": 0.6729, "lr": 4.852063642837493e-05, "epoch": 1.9906166219839143, "percentage": 19.91, "elapsed_time": "0:54:23", "remaining_time": "3:38:50", "throughput": 2360.82, "total_tokens": 7704384} {"current_steps": 13370, "total_steps": 67140, "loss": 0.6027, "lr": 4.851843323096305e-05, "epoch": 1.9913613345248735, "percentage": 19.91, "elapsed_time": "0:54:24", "remaining_time": "3:38:49", "throughput": 2360.86, "total_tokens": 7707168} {"current_steps": 13375, "total_steps": 67140, "loss": 0.6437, "lr": 4.851622844427107e-05, "epoch": 1.9921060470658327, "percentage": 19.92, "elapsed_time": "0:54:25", "remaining_time": "3:38:47", "throughput": 2360.89, "total_tokens": 7709888} {"current_steps": 13380, "total_steps": 67140, "loss": 0.7616, "lr": 4.851402206844799e-05, "epoch": 1.992850759606792, "percentage": 19.93, "elapsed_time": "0:54:26", "remaining_time": "3:38:45", "throughput": 2360.96, "total_tokens": 7712768} {"current_steps": 13385, "total_steps": 67140, "loss": 0.8084, "lr": 4.8511814103642894e-05, "epoch": 1.9935954721477511, "percentage": 19.94, "elapsed_time": "0:54:27", "remaining_time": "3:38:44", "throughput": 2361.02, "total_tokens": 7715680} {"current_steps": 13390, "total_steps": 67140, "loss": 0.6609, "lr": 4.850960455000499e-05, "epoch": 1.99434018468871, "percentage": 19.94, "elapsed_time": "0:54:29", "remaining_time": "3:38:42", "throughput": 2361.08, "total_tokens": 7718496} {"current_steps": 13395, "total_steps": 67140, "loss": 0.7482, "lr": 4.85073934076836e-05, "epoch": 1.9950848972296693, "percentage": 19.95, "elapsed_time": "0:54:30", "remaining_time": "3:38:41", "throughput": 2361.21, "total_tokens": 7721792} {"current_steps": 13400, "total_steps": 67140, "loss": 0.6239, "lr": 4.8505180676828144e-05, "epoch": 1.9958296097706285, "percentage": 19.96, "elapsed_time": "0:54:31", "remaining_time": "3:38:39", "throughput": 2361.31, "total_tokens": 7724800} {"current_steps": 13405, "total_steps": 67140, "loss": 0.5615, "lr": 4.850296635758813e-05, "epoch": 1.9965743223115877, "percentage": 19.97, "elapsed_time": "0:54:32", "remaining_time": "3:38:38", "throughput": 2361.44, "total_tokens": 7728096} {"current_steps": 13410, "total_steps": 67140, "loss": 0.6605, "lr": 4.850075045011321e-05, "epoch": 1.997319034852547, "percentage": 19.97, "elapsed_time": "0:54:48", "remaining_time": "3:39:37", "throughput": 2350.63, "total_tokens": 7731072} {"current_steps": 13415, "total_steps": 67140, "loss": 0.679, "lr": 4.8498532954553125e-05, "epoch": 1.9980637473935061, "percentage": 19.98, "elapsed_time": "0:54:50", "remaining_time": "3:39:36", "throughput": 2350.7, "total_tokens": 7733952} {"current_steps": 13420, "total_steps": 67140, "loss": 0.7003, "lr": 4.8496313871057716e-05, "epoch": 1.9988084599344653, "percentage": 19.99, "elapsed_time": "0:54:51", "remaining_time": "3:39:34", "throughput": 2350.84, "total_tokens": 7737152} {"current_steps": 13425, "total_steps": 67140, "loss": 0.7187, "lr": 4.8494093199776944e-05, "epoch": 1.9995531724754245, "percentage": 20.0, "elapsed_time": "0:54:52", "remaining_time": "3:39:33", "throughput": 2350.93, "total_tokens": 7740128} {"current_steps": 13428, "total_steps": 67140, "eval_loss": 0.6616544127464294, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:56:07", "remaining_time": "3:44:28", "throughput": 2299.03, "total_tokens": 7741288} {"current_steps": 13430, "total_steps": 67140, "loss": 0.669, "lr": 4.849187094086088e-05, "epoch": 2.0002978850163835, "percentage": 20.0, "elapsed_time": "0:56:09", "remaining_time": "3:44:35", "throughput": 2297.86, "total_tokens": 7742568} {"current_steps": 13435, "total_steps": 67140, "loss": 0.7021, "lr": 4.848964709445969e-05, "epoch": 2.0010425975573427, "percentage": 20.01, "elapsed_time": "0:56:10", "remaining_time": "3:44:33", "throughput": 2297.94, "total_tokens": 7745416} {"current_steps": 13440, "total_steps": 67140, "loss": 0.6305, "lr": 4.848742166072364e-05, "epoch": 2.001787310098302, "percentage": 20.02, "elapsed_time": "0:56:11", "remaining_time": "3:44:31", "throughput": 2298.01, "total_tokens": 7748264} {"current_steps": 13445, "total_steps": 67140, "loss": 0.7045, "lr": 4.8485194639803136e-05, "epoch": 2.002532022639261, "percentage": 20.03, "elapsed_time": "0:56:12", "remaining_time": "3:44:30", "throughput": 2298.08, "total_tokens": 7751112} {"current_steps": 13450, "total_steps": 67140, "loss": 0.6557, "lr": 4.848296603184866e-05, "epoch": 2.0032767351802203, "percentage": 20.03, "elapsed_time": "0:56:13", "remaining_time": "3:44:28", "throughput": 2298.17, "total_tokens": 7754024} {"current_steps": 13455, "total_steps": 67140, "loss": 0.5899, "lr": 4.848073583701081e-05, "epoch": 2.0040214477211795, "percentage": 20.04, "elapsed_time": "0:56:15", "remaining_time": "3:44:26", "throughput": 2298.28, "total_tokens": 7757064} {"current_steps": 13460, "total_steps": 67140, "loss": 0.5772, "lr": 4.847850405544031e-05, "epoch": 2.0047661602621387, "percentage": 20.05, "elapsed_time": "0:56:16", "remaining_time": "3:44:24", "throughput": 2298.33, "total_tokens": 7759816} {"current_steps": 13465, "total_steps": 67140, "loss": 0.6716, "lr": 4.847627068728795e-05, "epoch": 2.005510872803098, "percentage": 20.06, "elapsed_time": "0:56:17", "remaining_time": "3:44:23", "throughput": 2298.47, "total_tokens": 7763016} {"current_steps": 13470, "total_steps": 67140, "loss": 0.6789, "lr": 4.847403573270467e-05, "epoch": 2.006255585344057, "percentage": 20.06, "elapsed_time": "0:56:18", "remaining_time": "3:44:21", "throughput": 2298.58, "total_tokens": 7766024} {"current_steps": 13475, "total_steps": 67140, "loss": 0.7531, "lr": 4.847179919184149e-05, "epoch": 2.0070002978850163, "percentage": 20.07, "elapsed_time": "0:56:19", "remaining_time": "3:44:19", "throughput": 2298.62, "total_tokens": 7768712} {"current_steps": 13480, "total_steps": 67140, "loss": 0.9731, "lr": 4.8469561064849555e-05, "epoch": 2.0077450104259755, "percentage": 20.08, "elapsed_time": "0:56:20", "remaining_time": "3:44:18", "throughput": 2298.64, "total_tokens": 7771304} {"current_steps": 13485, "total_steps": 67140, "loss": 0.7966, "lr": 4.84673213518801e-05, "epoch": 2.0084897229669347, "percentage": 20.08, "elapsed_time": "0:56:21", "remaining_time": "3:44:16", "throughput": 2298.7, "total_tokens": 7774024} {"current_steps": 13490, "total_steps": 67140, "loss": 0.6238, "lr": 4.846508005308448e-05, "epoch": 2.009234435507894, "percentage": 20.09, "elapsed_time": "0:56:23", "remaining_time": "3:44:14", "throughput": 2298.79, "total_tokens": 7776936} {"current_steps": 13495, "total_steps": 67140, "loss": 0.7302, "lr": 4.846283716861415e-05, "epoch": 2.009979148048853, "percentage": 20.1, "elapsed_time": "0:56:24", "remaining_time": "3:44:12", "throughput": 2298.91, "total_tokens": 7780040} {"current_steps": 13500, "total_steps": 67140, "loss": 0.5736, "lr": 4.8460592698620686e-05, "epoch": 2.0107238605898123, "percentage": 20.11, "elapsed_time": "0:56:25", "remaining_time": "3:44:11", "throughput": 2298.97, "total_tokens": 7782792} {"current_steps": 13505, "total_steps": 67140, "loss": 0.5442, "lr": 4.845834664325574e-05, "epoch": 2.0114685731307715, "percentage": 20.11, "elapsed_time": "0:56:26", "remaining_time": "3:44:09", "throughput": 2299.07, "total_tokens": 7785800} {"current_steps": 13510, "total_steps": 67140, "loss": 0.7986, "lr": 4.8456099002671104e-05, "epoch": 2.0122132856717307, "percentage": 20.12, "elapsed_time": "0:56:27", "remaining_time": "3:44:07", "throughput": 2299.09, "total_tokens": 7788392} {"current_steps": 13515, "total_steps": 67140, "loss": 0.6657, "lr": 4.8453849777018675e-05, "epoch": 2.01295799821269, "percentage": 20.13, "elapsed_time": "0:56:28", "remaining_time": "3:44:05", "throughput": 2299.2, "total_tokens": 7791432} {"current_steps": 13520, "total_steps": 67140, "loss": 0.5902, "lr": 4.845159896645042e-05, "epoch": 2.013702710753649, "percentage": 20.14, "elapsed_time": "0:56:29", "remaining_time": "3:44:04", "throughput": 2299.3, "total_tokens": 7794376} {"current_steps": 13525, "total_steps": 67140, "loss": 0.6935, "lr": 4.844934657111846e-05, "epoch": 2.0144474232946084, "percentage": 20.14, "elapsed_time": "0:56:31", "remaining_time": "3:44:02", "throughput": 2299.37, "total_tokens": 7797256} {"current_steps": 13530, "total_steps": 67140, "loss": 0.6023, "lr": 4.8447092591175e-05, "epoch": 2.0151921358355676, "percentage": 20.15, "elapsed_time": "0:56:32", "remaining_time": "3:44:00", "throughput": 2299.39, "total_tokens": 7799880} {"current_steps": 13535, "total_steps": 67140, "loss": 0.6085, "lr": 4.844483702677235e-05, "epoch": 2.0159368483765268, "percentage": 20.16, "elapsed_time": "0:56:33", "remaining_time": "3:43:58", "throughput": 2299.43, "total_tokens": 7802536} {"current_steps": 13540, "total_steps": 67140, "loss": 0.7277, "lr": 4.8442579878062934e-05, "epoch": 2.016681560917486, "percentage": 20.17, "elapsed_time": "0:56:34", "remaining_time": "3:43:56", "throughput": 2299.5, "total_tokens": 7805288} {"current_steps": 13545, "total_steps": 67140, "loss": 0.7463, "lr": 4.844032114519928e-05, "epoch": 2.017426273458445, "percentage": 20.17, "elapsed_time": "0:56:35", "remaining_time": "3:43:55", "throughput": 2299.57, "total_tokens": 7808200} {"current_steps": 13550, "total_steps": 67140, "loss": 0.6885, "lr": 4.8438060828334014e-05, "epoch": 2.0181709859994044, "percentage": 20.18, "elapsed_time": "0:56:36", "remaining_time": "3:43:53", "throughput": 2299.66, "total_tokens": 7811144} {"current_steps": 13555, "total_steps": 67140, "loss": 0.7304, "lr": 4.84357989276199e-05, "epoch": 2.0189156985403636, "percentage": 20.19, "elapsed_time": "0:56:37", "remaining_time": "3:43:52", "throughput": 2299.79, "total_tokens": 7814280} {"current_steps": 13560, "total_steps": 67140, "loss": 0.5297, "lr": 4.843353544320978e-05, "epoch": 2.0196604110813228, "percentage": 20.2, "elapsed_time": "0:56:38", "remaining_time": "3:43:50", "throughput": 2299.87, "total_tokens": 7817096} {"current_steps": 13565, "total_steps": 67140, "loss": 0.6521, "lr": 4.84312703752566e-05, "epoch": 2.020405123622282, "percentage": 20.2, "elapsed_time": "0:56:40", "remaining_time": "3:43:48", "throughput": 2299.96, "total_tokens": 7820008} {"current_steps": 13570, "total_steps": 67140, "loss": 0.5853, "lr": 4.842900372391344e-05, "epoch": 2.021149836163241, "percentage": 20.21, "elapsed_time": "0:56:41", "remaining_time": "3:43:46", "throughput": 2300.02, "total_tokens": 7822824} {"current_steps": 13575, "total_steps": 67140, "loss": 0.6365, "lr": 4.842673548933345e-05, "epoch": 2.0218945487042004, "percentage": 20.22, "elapsed_time": "0:56:42", "remaining_time": "3:43:45", "throughput": 2300.05, "total_tokens": 7825480} {"current_steps": 13580, "total_steps": 67140, "loss": 0.744, "lr": 4.8424465671669935e-05, "epoch": 2.0226392612451596, "percentage": 20.23, "elapsed_time": "0:56:43", "remaining_time": "3:43:43", "throughput": 2300.09, "total_tokens": 7828200} {"current_steps": 13585, "total_steps": 67140, "loss": 0.7299, "lr": 4.842219427107627e-05, "epoch": 2.0233839737861183, "percentage": 20.23, "elapsed_time": "0:56:44", "remaining_time": "3:43:41", "throughput": 2300.18, "total_tokens": 7831144} {"current_steps": 13590, "total_steps": 67140, "loss": 0.5679, "lr": 4.841992128770594e-05, "epoch": 2.0241286863270775, "percentage": 20.24, "elapsed_time": "0:56:45", "remaining_time": "3:43:39", "throughput": 2300.19, "total_tokens": 7833672} {"current_steps": 13595, "total_steps": 67140, "loss": 0.6039, "lr": 4.841764672171254e-05, "epoch": 2.0248733988680367, "percentage": 20.25, "elapsed_time": "0:56:46", "remaining_time": "3:43:37", "throughput": 2300.23, "total_tokens": 7836328} {"current_steps": 13600, "total_steps": 67140, "loss": 0.5435, "lr": 4.841537057324979e-05, "epoch": 2.025618111408996, "percentage": 20.26, "elapsed_time": "0:56:47", "remaining_time": "3:43:35", "throughput": 2300.29, "total_tokens": 7839080} {"current_steps": 13605, "total_steps": 67140, "loss": 0.5322, "lr": 4.8413092842471496e-05, "epoch": 2.026362823949955, "percentage": 20.26, "elapsed_time": "0:56:48", "remaining_time": "3:43:34", "throughput": 2300.33, "total_tokens": 7841768} {"current_steps": 13610, "total_steps": 67140, "loss": 0.649, "lr": 4.841081352953158e-05, "epoch": 2.0271075364909144, "percentage": 20.27, "elapsed_time": "0:56:50", "remaining_time": "3:43:32", "throughput": 2300.45, "total_tokens": 7844872} {"current_steps": 13615, "total_steps": 67140, "loss": 0.5403, "lr": 4.8408532634584063e-05, "epoch": 2.0278522490318736, "percentage": 20.28, "elapsed_time": "0:56:51", "remaining_time": "3:43:30", "throughput": 2300.51, "total_tokens": 7847624} {"current_steps": 13620, "total_steps": 67140, "loss": 0.7163, "lr": 4.840625015778308e-05, "epoch": 2.0285969615728328, "percentage": 20.29, "elapsed_time": "0:56:52", "remaining_time": "3:43:29", "throughput": 2300.61, "total_tokens": 7850600} {"current_steps": 13625, "total_steps": 67140, "loss": 0.702, "lr": 4.8403966099282886e-05, "epoch": 2.029341674113792, "percentage": 20.29, "elapsed_time": "0:56:53", "remaining_time": "3:43:27", "throughput": 2300.72, "total_tokens": 7853608} {"current_steps": 13630, "total_steps": 67140, "loss": 0.7827, "lr": 4.840168045923781e-05, "epoch": 2.030086386654751, "percentage": 20.3, "elapsed_time": "0:56:54", "remaining_time": "3:43:25", "throughput": 2300.87, "total_tokens": 7856872} {"current_steps": 13635, "total_steps": 67140, "loss": 0.6031, "lr": 4.8399393237802315e-05, "epoch": 2.0308310991957104, "percentage": 20.31, "elapsed_time": "0:56:55", "remaining_time": "3:43:24", "throughput": 2301.01, "total_tokens": 7860104} {"current_steps": 13640, "total_steps": 67140, "loss": 0.6036, "lr": 4.839710443513096e-05, "epoch": 2.0315758117366696, "percentage": 20.32, "elapsed_time": "0:56:57", "remaining_time": "3:43:22", "throughput": 2301.11, "total_tokens": 7863144} {"current_steps": 13645, "total_steps": 67140, "loss": 0.616, "lr": 4.8394814051378414e-05, "epoch": 2.0323205242776288, "percentage": 20.32, "elapsed_time": "0:56:58", "remaining_time": "3:43:21", "throughput": 2301.22, "total_tokens": 7866120} {"current_steps": 13650, "total_steps": 67140, "loss": 0.6903, "lr": 4.839252208669944e-05, "epoch": 2.033065236818588, "percentage": 20.33, "elapsed_time": "0:56:59", "remaining_time": "3:43:19", "throughput": 2301.33, "total_tokens": 7869160} {"current_steps": 13655, "total_steps": 67140, "loss": 0.5739, "lr": 4.839022854124894e-05, "epoch": 2.033809949359547, "percentage": 20.34, "elapsed_time": "0:57:00", "remaining_time": "3:43:17", "throughput": 2301.42, "total_tokens": 7872136} {"current_steps": 13660, "total_steps": 67140, "loss": 0.4866, "lr": 4.838793341518189e-05, "epoch": 2.0345546619005064, "percentage": 20.35, "elapsed_time": "0:57:01", "remaining_time": "3:43:16", "throughput": 2301.48, "total_tokens": 7874888} {"current_steps": 13665, "total_steps": 67140, "loss": 0.7034, "lr": 4.838563670865339e-05, "epoch": 2.0352993744414656, "percentage": 20.35, "elapsed_time": "0:57:02", "remaining_time": "3:43:14", "throughput": 2301.59, "total_tokens": 7877896} {"current_steps": 13670, "total_steps": 67140, "loss": 0.7636, "lr": 4.838333842181864e-05, "epoch": 2.036044086982425, "percentage": 20.36, "elapsed_time": "0:57:03", "remaining_time": "3:43:12", "throughput": 2301.65, "total_tokens": 7880648} {"current_steps": 13675, "total_steps": 67140, "loss": 0.6321, "lr": 4.838103855483295e-05, "epoch": 2.036788799523384, "percentage": 20.37, "elapsed_time": "0:57:05", "remaining_time": "3:43:10", "throughput": 2301.71, "total_tokens": 7883432} {"current_steps": 13680, "total_steps": 67140, "loss": 0.5437, "lr": 4.8378737107851736e-05, "epoch": 2.037533512064343, "percentage": 20.38, "elapsed_time": "0:57:06", "remaining_time": "3:43:09", "throughput": 2301.78, "total_tokens": 7886280} {"current_steps": 13685, "total_steps": 67140, "loss": 0.6726, "lr": 4.837643408103051e-05, "epoch": 2.0382782246053024, "percentage": 20.38, "elapsed_time": "0:57:07", "remaining_time": "3:43:07", "throughput": 2301.86, "total_tokens": 7889128} {"current_steps": 13690, "total_steps": 67140, "loss": 0.5919, "lr": 4.837412947452492e-05, "epoch": 2.0390229371462616, "percentage": 20.39, "elapsed_time": "0:57:08", "remaining_time": "3:43:05", "throughput": 2301.96, "total_tokens": 7892200} {"current_steps": 13695, "total_steps": 67140, "loss": 0.6373, "lr": 4.8371823288490694e-05, "epoch": 2.039767649687221, "percentage": 20.4, "elapsed_time": "0:57:09", "remaining_time": "3:43:04", "throughput": 2302.06, "total_tokens": 7895112} {"current_steps": 13700, "total_steps": 67140, "loss": 0.6507, "lr": 4.8369515523083664e-05, "epoch": 2.04051236222818, "percentage": 20.41, "elapsed_time": "0:57:10", "remaining_time": "3:43:02", "throughput": 2302.15, "total_tokens": 7898056} {"current_steps": 13705, "total_steps": 67140, "loss": 0.8578, "lr": 4.83672061784598e-05, "epoch": 2.041257074769139, "percentage": 20.41, "elapsed_time": "0:57:11", "remaining_time": "3:43:00", "throughput": 2302.2, "total_tokens": 7900840} {"current_steps": 13710, "total_steps": 67140, "loss": 0.671, "lr": 4.836489525477513e-05, "epoch": 2.0420017873100984, "percentage": 20.42, "elapsed_time": "0:57:12", "remaining_time": "3:42:58", "throughput": 2302.28, "total_tokens": 7903720} {"current_steps": 13715, "total_steps": 67140, "loss": 0.7579, "lr": 4.8362582752185844e-05, "epoch": 2.0427464998510576, "percentage": 20.43, "elapsed_time": "0:57:14", "remaining_time": "3:42:57", "throughput": 2302.43, "total_tokens": 7906984} {"current_steps": 13720, "total_steps": 67140, "loss": 0.634, "lr": 4.836026867084821e-05, "epoch": 2.043491212392017, "percentage": 20.43, "elapsed_time": "0:57:15", "remaining_time": "3:42:55", "throughput": 2302.51, "total_tokens": 7909928} {"current_steps": 13725, "total_steps": 67140, "loss": 0.7197, "lr": 4.8357953010918585e-05, "epoch": 2.044235924932976, "percentage": 20.44, "elapsed_time": "0:57:16", "remaining_time": "3:42:54", "throughput": 2302.64, "total_tokens": 7913064} {"current_steps": 13730, "total_steps": 67140, "loss": 0.7411, "lr": 4.835563577255346e-05, "epoch": 2.044980637473935, "percentage": 20.45, "elapsed_time": "0:57:17", "remaining_time": "3:42:52", "throughput": 2302.69, "total_tokens": 7915784} {"current_steps": 13735, "total_steps": 67140, "loss": 0.7609, "lr": 4.835331695590943e-05, "epoch": 2.0457253500148944, "percentage": 20.46, "elapsed_time": "0:57:18", "remaining_time": "3:42:50", "throughput": 2302.77, "total_tokens": 7918664} {"current_steps": 13740, "total_steps": 67140, "loss": 0.6546, "lr": 4.835099656114319e-05, "epoch": 2.0464700625558536, "percentage": 20.46, "elapsed_time": "0:57:19", "remaining_time": "3:42:49", "throughput": 2302.87, "total_tokens": 7921704} {"current_steps": 13745, "total_steps": 67140, "loss": 0.5647, "lr": 4.834867458841154e-05, "epoch": 2.047214775096813, "percentage": 20.47, "elapsed_time": "0:57:20", "remaining_time": "3:42:47", "throughput": 2302.87, "total_tokens": 7924136} {"current_steps": 13750, "total_steps": 67140, "loss": 0.686, "lr": 4.8346351037871386e-05, "epoch": 2.047959487637772, "percentage": 20.48, "elapsed_time": "0:57:22", "remaining_time": "3:42:45", "throughput": 2302.96, "total_tokens": 7927080} {"current_steps": 13755, "total_steps": 67140, "loss": 0.8306, "lr": 4.8344025909679746e-05, "epoch": 2.0487042001787312, "percentage": 20.49, "elapsed_time": "0:57:23", "remaining_time": "3:42:43", "throughput": 2303.07, "total_tokens": 7930120} {"current_steps": 13760, "total_steps": 67140, "loss": 0.6857, "lr": 4.834169920399375e-05, "epoch": 2.04944891271969, "percentage": 20.49, "elapsed_time": "0:57:24", "remaining_time": "3:42:42", "throughput": 2303.14, "total_tokens": 7932936} {"current_steps": 13765, "total_steps": 67140, "loss": 0.6353, "lr": 4.8339370920970614e-05, "epoch": 2.050193625260649, "percentage": 20.5, "elapsed_time": "0:57:25", "remaining_time": "3:42:40", "throughput": 2303.2, "total_tokens": 7935720} {"current_steps": 13770, "total_steps": 67140, "loss": 0.6805, "lr": 4.8337041060767696e-05, "epoch": 2.0509383378016084, "percentage": 20.51, "elapsed_time": "0:57:26", "remaining_time": "3:42:38", "throughput": 2303.31, "total_tokens": 7938760} {"current_steps": 13775, "total_steps": 67140, "loss": 0.6031, "lr": 4.833470962354242e-05, "epoch": 2.0516830503425676, "percentage": 20.52, "elapsed_time": "0:57:27", "remaining_time": "3:42:36", "throughput": 2303.35, "total_tokens": 7941416} {"current_steps": 13780, "total_steps": 67140, "loss": 0.4957, "lr": 4.8332376609452334e-05, "epoch": 2.052427762883527, "percentage": 20.52, "elapsed_time": "0:57:29", "remaining_time": "3:42:36", "throughput": 2303.62, "total_tokens": 7945608} {"current_steps": 13785, "total_steps": 67140, "loss": 0.809, "lr": 4.83300420186551e-05, "epoch": 2.053172475424486, "percentage": 20.53, "elapsed_time": "0:57:30", "remaining_time": "3:42:34", "throughput": 2303.69, "total_tokens": 7948360} {"current_steps": 13790, "total_steps": 67140, "loss": 0.6273, "lr": 4.832770585130849e-05, "epoch": 2.053917187965445, "percentage": 20.54, "elapsed_time": "0:57:31", "remaining_time": "3:42:32", "throughput": 2303.76, "total_tokens": 7951240} {"current_steps": 13795, "total_steps": 67140, "loss": 0.6207, "lr": 4.8325368107570354e-05, "epoch": 2.0546619005064044, "percentage": 20.55, "elapsed_time": "0:57:32", "remaining_time": "3:42:30", "throughput": 2303.83, "total_tokens": 7954088} {"current_steps": 13800, "total_steps": 67140, "loss": 0.6808, "lr": 4.8323028787598666e-05, "epoch": 2.0554066130473636, "percentage": 20.55, "elapsed_time": "0:57:33", "remaining_time": "3:42:29", "throughput": 2303.91, "total_tokens": 7956968} {"current_steps": 13805, "total_steps": 67140, "loss": 0.5172, "lr": 4.832068789155153e-05, "epoch": 2.056151325588323, "percentage": 20.56, "elapsed_time": "0:57:34", "remaining_time": "3:42:27", "throughput": 2303.98, "total_tokens": 7959816} {"current_steps": 13810, "total_steps": 67140, "loss": 0.5372, "lr": 4.831834541958712e-05, "epoch": 2.056896038129282, "percentage": 20.57, "elapsed_time": "0:57:35", "remaining_time": "3:42:25", "throughput": 2304.09, "total_tokens": 7962792} {"current_steps": 13815, "total_steps": 67140, "loss": 0.4529, "lr": 4.8316001371863726e-05, "epoch": 2.057640750670241, "percentage": 20.58, "elapsed_time": "0:57:37", "remaining_time": "3:42:24", "throughput": 2304.16, "total_tokens": 7965608} {"current_steps": 13820, "total_steps": 67140, "loss": 0.7717, "lr": 4.831365574853977e-05, "epoch": 2.0583854632112004, "percentage": 20.58, "elapsed_time": "0:57:38", "remaining_time": "3:42:22", "throughput": 2304.22, "total_tokens": 7968424} {"current_steps": 13825, "total_steps": 67140, "loss": 0.5897, "lr": 4.831130854977373e-05, "epoch": 2.0591301757521596, "percentage": 20.59, "elapsed_time": "0:57:39", "remaining_time": "3:42:20", "throughput": 2304.34, "total_tokens": 7971496} {"current_steps": 13830, "total_steps": 67140, "loss": 0.7273, "lr": 4.830895977572424e-05, "epoch": 2.059874888293119, "percentage": 20.6, "elapsed_time": "0:57:40", "remaining_time": "3:42:18", "throughput": 2304.37, "total_tokens": 7974152} {"current_steps": 13835, "total_steps": 67140, "loss": 0.6449, "lr": 4.830660942655001e-05, "epoch": 2.060619600834078, "percentage": 20.61, "elapsed_time": "0:57:41", "remaining_time": "3:42:17", "throughput": 2304.5, "total_tokens": 7977352} {"current_steps": 13840, "total_steps": 67140, "loss": 0.7719, "lr": 4.8304257502409875e-05, "epoch": 2.0613643133750372, "percentage": 20.61, "elapsed_time": "0:57:42", "remaining_time": "3:42:15", "throughput": 2304.53, "total_tokens": 7979976} {"current_steps": 13845, "total_steps": 67140, "loss": 0.5858, "lr": 4.830190400346277e-05, "epoch": 2.0621090259159964, "percentage": 20.62, "elapsed_time": "0:57:43", "remaining_time": "3:42:13", "throughput": 2304.61, "total_tokens": 7982920} {"current_steps": 13850, "total_steps": 67140, "loss": 0.7791, "lr": 4.829954892986773e-05, "epoch": 2.0628537384569556, "percentage": 20.63, "elapsed_time": "0:57:44", "remaining_time": "3:42:12", "throughput": 2304.64, "total_tokens": 7985544} {"current_steps": 13855, "total_steps": 67140, "loss": 0.74, "lr": 4.829719228178391e-05, "epoch": 2.063598450997915, "percentage": 20.64, "elapsed_time": "0:57:46", "remaining_time": "3:42:10", "throughput": 2304.74, "total_tokens": 7988488} {"current_steps": 13860, "total_steps": 67140, "loss": 0.6432, "lr": 4.829483405937054e-05, "epoch": 2.064343163538874, "percentage": 20.64, "elapsed_time": "0:57:47", "remaining_time": "3:42:08", "throughput": 2304.79, "total_tokens": 7991240} {"current_steps": 13865, "total_steps": 67140, "loss": 0.4415, "lr": 4.8292474262787e-05, "epoch": 2.0650878760798332, "percentage": 20.65, "elapsed_time": "0:57:48", "remaining_time": "3:42:06", "throughput": 2304.9, "total_tokens": 7994280} {"current_steps": 13870, "total_steps": 67140, "loss": 0.7079, "lr": 4.829011289219276e-05, "epoch": 2.0658325886207924, "percentage": 20.66, "elapsed_time": "0:57:49", "remaining_time": "3:42:05", "throughput": 2304.99, "total_tokens": 7997192} {"current_steps": 13875, "total_steps": 67140, "loss": 0.5728, "lr": 4.828774994774737e-05, "epoch": 2.0665773011617516, "percentage": 20.67, "elapsed_time": "0:57:50", "remaining_time": "3:42:03", "throughput": 2305.07, "total_tokens": 8000072} {"current_steps": 13880, "total_steps": 67140, "loss": 0.7005, "lr": 4.828538542961052e-05, "epoch": 2.067322013702711, "percentage": 20.67, "elapsed_time": "0:57:51", "remaining_time": "3:42:01", "throughput": 2305.15, "total_tokens": 8003048} {"current_steps": 13885, "total_steps": 67140, "loss": 0.6041, "lr": 4.8283019337942e-05, "epoch": 2.06806672624367, "percentage": 20.68, "elapsed_time": "0:57:52", "remaining_time": "3:42:00", "throughput": 2305.2, "total_tokens": 8005768} {"current_steps": 13890, "total_steps": 67140, "loss": 0.7176, "lr": 4.828065167290169e-05, "epoch": 2.0688114387846293, "percentage": 20.69, "elapsed_time": "0:57:54", "remaining_time": "3:41:58", "throughput": 2305.28, "total_tokens": 8008648} {"current_steps": 13895, "total_steps": 67140, "loss": 0.5816, "lr": 4.827828243464959e-05, "epoch": 2.0695561513255885, "percentage": 20.7, "elapsed_time": "0:57:55", "remaining_time": "3:41:56", "throughput": 2305.33, "total_tokens": 8011432} {"current_steps": 13900, "total_steps": 67140, "loss": 0.7717, "lr": 4.8275911623345816e-05, "epoch": 2.0703008638665477, "percentage": 20.7, "elapsed_time": "0:57:56", "remaining_time": "3:41:55", "throughput": 2305.49, "total_tokens": 8014696} {"current_steps": 13905, "total_steps": 67140, "loss": 0.5138, "lr": 4.8273539239150555e-05, "epoch": 2.071045576407507, "percentage": 20.71, "elapsed_time": "0:57:57", "remaining_time": "3:41:53", "throughput": 2305.56, "total_tokens": 8017576} {"current_steps": 13910, "total_steps": 67140, "loss": 0.6736, "lr": 4.827116528222414e-05, "epoch": 2.071790288948466, "percentage": 20.72, "elapsed_time": "0:57:58", "remaining_time": "3:41:51", "throughput": 2305.71, "total_tokens": 8020808} {"current_steps": 13915, "total_steps": 67140, "loss": 0.6095, "lr": 4.8268789752726993e-05, "epoch": 2.0725350014894253, "percentage": 20.73, "elapsed_time": "0:57:59", "remaining_time": "3:41:50", "throughput": 2305.75, "total_tokens": 8023528} {"current_steps": 13920, "total_steps": 67140, "loss": 0.5528, "lr": 4.826641265081964e-05, "epoch": 2.0732797140303845, "percentage": 20.73, "elapsed_time": "0:58:00", "remaining_time": "3:41:48", "throughput": 2305.86, "total_tokens": 8026632} {"current_steps": 13925, "total_steps": 67140, "loss": 0.6113, "lr": 4.82640339766627e-05, "epoch": 2.0740244265713437, "percentage": 20.74, "elapsed_time": "0:58:02", "remaining_time": "3:41:46", "throughput": 2305.91, "total_tokens": 8029352} {"current_steps": 13930, "total_steps": 67140, "loss": 0.6441, "lr": 4.8261653730416945e-05, "epoch": 2.074769139112303, "percentage": 20.75, "elapsed_time": "0:58:03", "remaining_time": "3:41:45", "throughput": 2306.01, "total_tokens": 8032424} {"current_steps": 13935, "total_steps": 67140, "loss": 0.747, "lr": 4.8259271912243196e-05, "epoch": 2.0755138516532616, "percentage": 20.76, "elapsed_time": "0:58:04", "remaining_time": "3:41:43", "throughput": 2306.05, "total_tokens": 8035080} {"current_steps": 13940, "total_steps": 67140, "loss": 0.6894, "lr": 4.8256888522302426e-05, "epoch": 2.076258564194221, "percentage": 20.76, "elapsed_time": "0:58:05", "remaining_time": "3:41:41", "throughput": 2306.15, "total_tokens": 8038120} {"current_steps": 13945, "total_steps": 67140, "loss": 0.7425, "lr": 4.825450356075568e-05, "epoch": 2.07700327673518, "percentage": 20.77, "elapsed_time": "0:58:06", "remaining_time": "3:41:40", "throughput": 2306.25, "total_tokens": 8041160} {"current_steps": 13950, "total_steps": 67140, "loss": 0.5183, "lr": 4.825211702776412e-05, "epoch": 2.0777479892761392, "percentage": 20.78, "elapsed_time": "0:58:07", "remaining_time": "3:41:38", "throughput": 2306.34, "total_tokens": 8044104} {"current_steps": 13955, "total_steps": 67140, "loss": 0.5504, "lr": 4.824972892348904e-05, "epoch": 2.0784927018170984, "percentage": 20.78, "elapsed_time": "0:58:08", "remaining_time": "3:41:36", "throughput": 2306.37, "total_tokens": 8046728} {"current_steps": 13960, "total_steps": 67140, "loss": 0.6852, "lr": 4.8247339248091805e-05, "epoch": 2.0792374143580576, "percentage": 20.79, "elapsed_time": "0:58:10", "remaining_time": "3:41:35", "throughput": 2306.47, "total_tokens": 8049704} {"current_steps": 13965, "total_steps": 67140, "loss": 0.7166, "lr": 4.824494800173389e-05, "epoch": 2.079982126899017, "percentage": 20.8, "elapsed_time": "0:58:11", "remaining_time": "3:41:33", "throughput": 2306.54, "total_tokens": 8052584} {"current_steps": 13970, "total_steps": 67140, "loss": 0.7116, "lr": 4.824255518457691e-05, "epoch": 2.080726839439976, "percentage": 20.81, "elapsed_time": "0:58:12", "remaining_time": "3:41:31", "throughput": 2306.58, "total_tokens": 8055304} {"current_steps": 13975, "total_steps": 67140, "loss": 0.695, "lr": 4.824016079678254e-05, "epoch": 2.0814715519809353, "percentage": 20.81, "elapsed_time": "0:58:13", "remaining_time": "3:41:30", "throughput": 2306.64, "total_tokens": 8058120} {"current_steps": 13980, "total_steps": 67140, "loss": 0.6675, "lr": 4.823776483851259e-05, "epoch": 2.0822162645218945, "percentage": 20.82, "elapsed_time": "0:58:14", "remaining_time": "3:41:28", "throughput": 2306.75, "total_tokens": 8061224} {"current_steps": 13985, "total_steps": 67140, "loss": 0.6969, "lr": 4.8235367309928975e-05, "epoch": 2.0829609770628537, "percentage": 20.83, "elapsed_time": "0:58:15", "remaining_time": "3:41:26", "throughput": 2306.83, "total_tokens": 8064136} {"current_steps": 13990, "total_steps": 67140, "loss": 0.7218, "lr": 4.82329682111937e-05, "epoch": 2.083705689603813, "percentage": 20.84, "elapsed_time": "0:58:16", "remaining_time": "3:41:25", "throughput": 2306.87, "total_tokens": 8066792} {"current_steps": 13995, "total_steps": 67140, "loss": 0.6222, "lr": 4.82305675424689e-05, "epoch": 2.084450402144772, "percentage": 20.84, "elapsed_time": "0:58:18", "remaining_time": "3:41:23", "throughput": 2307.01, "total_tokens": 8070024} {"current_steps": 14000, "total_steps": 67140, "loss": 0.7028, "lr": 4.822816530391678e-05, "epoch": 2.0851951146857313, "percentage": 20.85, "elapsed_time": "0:58:19", "remaining_time": "3:41:21", "throughput": 2307.04, "total_tokens": 8072680} {"current_steps": 14005, "total_steps": 67140, "loss": 0.6089, "lr": 4.82257614956997e-05, "epoch": 2.0859398272266905, "percentage": 20.86, "elapsed_time": "0:58:20", "remaining_time": "3:41:20", "throughput": 2307.16, "total_tokens": 8075848} {"current_steps": 14010, "total_steps": 67140, "loss": 0.7352, "lr": 4.8223356117980085e-05, "epoch": 2.0866845397676497, "percentage": 20.87, "elapsed_time": "0:58:21", "remaining_time": "3:41:18", "throughput": 2307.3, "total_tokens": 8079048} {"current_steps": 14015, "total_steps": 67140, "loss": 0.6431, "lr": 4.822094917092048e-05, "epoch": 2.087429252308609, "percentage": 20.87, "elapsed_time": "0:58:22", "remaining_time": "3:41:17", "throughput": 2307.35, "total_tokens": 8081832} {"current_steps": 14020, "total_steps": 67140, "loss": 0.837, "lr": 4.8218540654683544e-05, "epoch": 2.088173964849568, "percentage": 20.88, "elapsed_time": "0:58:23", "remaining_time": "3:41:15", "throughput": 2307.4, "total_tokens": 8084584} {"current_steps": 14025, "total_steps": 67140, "loss": 0.7519, "lr": 4.821613056943203e-05, "epoch": 2.0889186773905273, "percentage": 20.89, "elapsed_time": "0:58:24", "remaining_time": "3:41:13", "throughput": 2307.48, "total_tokens": 8087464} {"current_steps": 14030, "total_steps": 67140, "loss": 0.6432, "lr": 4.821371891532879e-05, "epoch": 2.0896633899314865, "percentage": 20.9, "elapsed_time": "0:58:26", "remaining_time": "3:41:11", "throughput": 2307.56, "total_tokens": 8090376} {"current_steps": 14035, "total_steps": 67140, "loss": 0.6422, "lr": 4.821130569253682e-05, "epoch": 2.0904081024724457, "percentage": 20.9, "elapsed_time": "0:58:27", "remaining_time": "3:41:10", "throughput": 2307.62, "total_tokens": 8093192} {"current_steps": 14040, "total_steps": 67140, "loss": 0.7596, "lr": 4.8208890901219174e-05, "epoch": 2.091152815013405, "percentage": 20.91, "elapsed_time": "0:58:28", "remaining_time": "3:41:08", "throughput": 2307.73, "total_tokens": 8096296} {"current_steps": 14045, "total_steps": 67140, "loss": 0.7203, "lr": 4.820647454153905e-05, "epoch": 2.091897527554364, "percentage": 20.92, "elapsed_time": "0:58:29", "remaining_time": "3:41:07", "throughput": 2307.8, "total_tokens": 8099144} {"current_steps": 14050, "total_steps": 67140, "loss": 0.6328, "lr": 4.820405661365972e-05, "epoch": 2.0926422400953233, "percentage": 20.93, "elapsed_time": "0:58:30", "remaining_time": "3:41:05", "throughput": 2307.86, "total_tokens": 8101960} {"current_steps": 14055, "total_steps": 67140, "loss": 0.5378, "lr": 4.8201637117744584e-05, "epoch": 2.0933869526362825, "percentage": 20.93, "elapsed_time": "0:58:31", "remaining_time": "3:41:03", "throughput": 2307.91, "total_tokens": 8104712} {"current_steps": 14060, "total_steps": 67140, "loss": 0.5961, "lr": 4.819921605395714e-05, "epoch": 2.0941316651772417, "percentage": 20.94, "elapsed_time": "0:58:32", "remaining_time": "3:41:01", "throughput": 2307.95, "total_tokens": 8107368} {"current_steps": 14065, "total_steps": 67140, "loss": 0.7377, "lr": 4.819679342246101e-05, "epoch": 2.094876377718201, "percentage": 20.95, "elapsed_time": "0:58:33", "remaining_time": "3:41:00", "throughput": 2308.04, "total_tokens": 8110440} {"current_steps": 14070, "total_steps": 67140, "loss": 0.7102, "lr": 4.819436922341988e-05, "epoch": 2.09562109025916, "percentage": 20.96, "elapsed_time": "0:58:35", "remaining_time": "3:40:58", "throughput": 2308.14, "total_tokens": 8113448} {"current_steps": 14075, "total_steps": 67140, "loss": 0.4925, "lr": 4.819194345699758e-05, "epoch": 2.0963658028001193, "percentage": 20.96, "elapsed_time": "0:58:36", "remaining_time": "3:40:56", "throughput": 2308.17, "total_tokens": 8116104} {"current_steps": 14080, "total_steps": 67140, "loss": 0.6815, "lr": 4.818951612335803e-05, "epoch": 2.0971105153410785, "percentage": 20.97, "elapsed_time": "0:58:37", "remaining_time": "3:40:55", "throughput": 2308.23, "total_tokens": 8118920} {"current_steps": 14085, "total_steps": 67140, "loss": 0.5829, "lr": 4.8187087222665266e-05, "epoch": 2.0978552278820377, "percentage": 20.98, "elapsed_time": "0:58:38", "remaining_time": "3:40:53", "throughput": 2308.3, "total_tokens": 8121768} {"current_steps": 14090, "total_steps": 67140, "loss": 0.6726, "lr": 4.818465675508342e-05, "epoch": 2.098599940422997, "percentage": 20.99, "elapsed_time": "0:58:39", "remaining_time": "3:40:51", "throughput": 2308.44, "total_tokens": 8124968} {"current_steps": 14095, "total_steps": 67140, "loss": 0.7304, "lr": 4.818222472077674e-05, "epoch": 2.099344652963956, "percentage": 20.99, "elapsed_time": "0:58:40", "remaining_time": "3:40:50", "throughput": 2308.45, "total_tokens": 8127592} {"current_steps": 14100, "total_steps": 67140, "loss": 0.7225, "lr": 4.817979111990955e-05, "epoch": 2.1000893655049153, "percentage": 21.0, "elapsed_time": "0:58:41", "remaining_time": "3:40:48", "throughput": 2308.47, "total_tokens": 8130152} {"current_steps": 14105, "total_steps": 67140, "loss": 0.7979, "lr": 4.817735595264633e-05, "epoch": 2.1008340780458745, "percentage": 21.01, "elapsed_time": "0:58:43", "remaining_time": "3:40:46", "throughput": 2308.53, "total_tokens": 8132968} {"current_steps": 14110, "total_steps": 67140, "loss": 0.6171, "lr": 4.817491921915162e-05, "epoch": 2.1015787905868333, "percentage": 21.02, "elapsed_time": "0:58:44", "remaining_time": "3:40:44", "throughput": 2308.63, "total_tokens": 8135944} {"current_steps": 14115, "total_steps": 67140, "loss": 0.6959, "lr": 4.817248091959009e-05, "epoch": 2.1023235031277925, "percentage": 21.02, "elapsed_time": "0:58:45", "remaining_time": "3:40:43", "throughput": 2308.63, "total_tokens": 8138952} {"current_steps": 14120, "total_steps": 67140, "loss": 0.7163, "lr": 4.817004105412652e-05, "epoch": 2.1030682156687517, "percentage": 21.03, "elapsed_time": "0:58:46", "remaining_time": "3:40:42", "throughput": 2308.71, "total_tokens": 8141800} {"current_steps": 14125, "total_steps": 67140, "loss": 0.7559, "lr": 4.8167599622925776e-05, "epoch": 2.103812928209711, "percentage": 21.04, "elapsed_time": "0:58:47", "remaining_time": "3:40:40", "throughput": 2308.76, "total_tokens": 8144552} {"current_steps": 14130, "total_steps": 67140, "loss": 0.6786, "lr": 4.816515662615284e-05, "epoch": 2.10455764075067, "percentage": 21.05, "elapsed_time": "0:58:48", "remaining_time": "3:40:38", "throughput": 2308.81, "total_tokens": 8147336} {"current_steps": 14135, "total_steps": 67140, "loss": 0.5532, "lr": 4.8162712063972805e-05, "epoch": 2.1053023532916293, "percentage": 21.05, "elapsed_time": "0:58:49", "remaining_time": "3:40:36", "throughput": 2308.87, "total_tokens": 8150152} {"current_steps": 14140, "total_steps": 67140, "loss": 0.7331, "lr": 4.816026593655085e-05, "epoch": 2.1060470658325885, "percentage": 21.06, "elapsed_time": "0:58:51", "remaining_time": "3:40:35", "throughput": 2308.96, "total_tokens": 8153128} {"current_steps": 14145, "total_steps": 67140, "loss": 0.6278, "lr": 4.81578182440523e-05, "epoch": 2.1067917783735477, "percentage": 21.07, "elapsed_time": "0:58:52", "remaining_time": "3:40:33", "throughput": 2309.01, "total_tokens": 8155848} {"current_steps": 14150, "total_steps": 67140, "loss": 0.6466, "lr": 4.815536898664254e-05, "epoch": 2.107536490914507, "percentage": 21.08, "elapsed_time": "0:58:53", "remaining_time": "3:40:31", "throughput": 2309.07, "total_tokens": 8158632} {"current_steps": 14155, "total_steps": 67140, "loss": 0.5196, "lr": 4.815291816448709e-05, "epoch": 2.108281203455466, "percentage": 21.08, "elapsed_time": "0:58:54", "remaining_time": "3:40:30", "throughput": 2309.14, "total_tokens": 8161480} {"current_steps": 14160, "total_steps": 67140, "loss": 0.6745, "lr": 4.815046577775156e-05, "epoch": 2.1090259159964253, "percentage": 21.09, "elapsed_time": "0:58:55", "remaining_time": "3:40:28", "throughput": 2309.22, "total_tokens": 8164424} {"current_steps": 14165, "total_steps": 67140, "loss": 0.7423, "lr": 4.8148011826601676e-05, "epoch": 2.1097706285373845, "percentage": 21.1, "elapsed_time": "0:58:56", "remaining_time": "3:40:26", "throughput": 2309.32, "total_tokens": 8167464} {"current_steps": 14170, "total_steps": 67140, "loss": 0.7339, "lr": 4.814555631120327e-05, "epoch": 2.1105153410783437, "percentage": 21.11, "elapsed_time": "0:58:57", "remaining_time": "3:40:25", "throughput": 2309.42, "total_tokens": 8170472} {"current_steps": 14175, "total_steps": 67140, "loss": 0.7571, "lr": 4.814309923172227e-05, "epoch": 2.111260053619303, "percentage": 21.11, "elapsed_time": "0:58:59", "remaining_time": "3:40:23", "throughput": 2309.51, "total_tokens": 8173480} {"current_steps": 14180, "total_steps": 67140, "loss": 0.6249, "lr": 4.8140640588324705e-05, "epoch": 2.112004766160262, "percentage": 21.12, "elapsed_time": "0:59:00", "remaining_time": "3:40:21", "throughput": 2309.56, "total_tokens": 8176232} {"current_steps": 14185, "total_steps": 67140, "loss": 0.7146, "lr": 4.8138180381176744e-05, "epoch": 2.1127494787012213, "percentage": 21.13, "elapsed_time": "0:59:01", "remaining_time": "3:40:20", "throughput": 2309.64, "total_tokens": 8179144} {"current_steps": 14190, "total_steps": 67140, "loss": 0.6909, "lr": 4.813571861044463e-05, "epoch": 2.1134941912421805, "percentage": 21.13, "elapsed_time": "0:59:02", "remaining_time": "3:40:18", "throughput": 2309.72, "total_tokens": 8182056} {"current_steps": 14195, "total_steps": 67140, "loss": 0.6871, "lr": 4.81332552762947e-05, "epoch": 2.1142389037831397, "percentage": 21.14, "elapsed_time": "0:59:03", "remaining_time": "3:40:17", "throughput": 2309.83, "total_tokens": 8185128} {"current_steps": 14200, "total_steps": 67140, "loss": 0.5476, "lr": 4.813079037889344e-05, "epoch": 2.114983616324099, "percentage": 21.15, "elapsed_time": "0:59:04", "remaining_time": "3:40:15", "throughput": 2309.92, "total_tokens": 8188168} {"current_steps": 14205, "total_steps": 67140, "loss": 0.648, "lr": 4.812832391840741e-05, "epoch": 2.115728328865058, "percentage": 21.16, "elapsed_time": "0:59:05", "remaining_time": "3:40:13", "throughput": 2310.01, "total_tokens": 8191112} {"current_steps": 14210, "total_steps": 67140, "loss": 0.7565, "lr": 4.812585589500328e-05, "epoch": 2.1164730414060173, "percentage": 21.16, "elapsed_time": "0:59:07", "remaining_time": "3:40:12", "throughput": 2310.07, "total_tokens": 8193960} {"current_steps": 14215, "total_steps": 67140, "loss": 0.6508, "lr": 4.812338630884783e-05, "epoch": 2.1172177539469765, "percentage": 21.17, "elapsed_time": "0:59:08", "remaining_time": "3:40:10", "throughput": 2310.16, "total_tokens": 8196904} {"current_steps": 14220, "total_steps": 67140, "loss": 0.7306, "lr": 4.812091516010795e-05, "epoch": 2.1179624664879357, "percentage": 21.18, "elapsed_time": "0:59:09", "remaining_time": "3:40:08", "throughput": 2310.21, "total_tokens": 8199656} {"current_steps": 14225, "total_steps": 67140, "loss": 0.6663, "lr": 4.811844244895063e-05, "epoch": 2.118707179028895, "percentage": 21.19, "elapsed_time": "0:59:10", "remaining_time": "3:40:07", "throughput": 2310.29, "total_tokens": 8202568} {"current_steps": 14230, "total_steps": 67140, "loss": 0.695, "lr": 4.811596817554296e-05, "epoch": 2.119451891569854, "percentage": 21.19, "elapsed_time": "0:59:11", "remaining_time": "3:40:05", "throughput": 2310.35, "total_tokens": 8205416} {"current_steps": 14235, "total_steps": 67140, "loss": 0.6991, "lr": 4.8113492340052135e-05, "epoch": 2.1201966041108133, "percentage": 21.2, "elapsed_time": "0:59:12", "remaining_time": "3:40:03", "throughput": 2310.39, "total_tokens": 8208168} {"current_steps": 14240, "total_steps": 67140, "loss": 0.6463, "lr": 4.8111014942645476e-05, "epoch": 2.1209413166517725, "percentage": 21.21, "elapsed_time": "0:59:13", "remaining_time": "3:40:02", "throughput": 2310.45, "total_tokens": 8210984} {"current_steps": 14245, "total_steps": 67140, "loss": 0.6822, "lr": 4.8108535983490386e-05, "epoch": 2.1216860291927317, "percentage": 21.22, "elapsed_time": "0:59:14", "remaining_time": "3:40:00", "throughput": 2310.55, "total_tokens": 8213992} {"current_steps": 14250, "total_steps": 67140, "loss": 0.681, "lr": 4.8106055462754394e-05, "epoch": 2.122430741733691, "percentage": 21.22, "elapsed_time": "0:59:16", "remaining_time": "3:39:58", "throughput": 2310.66, "total_tokens": 8217096} {"current_steps": 14255, "total_steps": 67140, "loss": 0.621, "lr": 4.810357338060512e-05, "epoch": 2.12317545427465, "percentage": 21.23, "elapsed_time": "0:59:17", "remaining_time": "3:39:57", "throughput": 2310.75, "total_tokens": 8220040} {"current_steps": 14260, "total_steps": 67140, "loss": 0.616, "lr": 4.810108973721028e-05, "epoch": 2.1239201668156094, "percentage": 21.24, "elapsed_time": "0:59:18", "remaining_time": "3:39:55", "throughput": 2310.84, "total_tokens": 8222984} {"current_steps": 14265, "total_steps": 67140, "loss": 0.6007, "lr": 4.809860453273772e-05, "epoch": 2.1246648793565686, "percentage": 21.25, "elapsed_time": "0:59:19", "remaining_time": "3:39:54", "throughput": 2310.91, "total_tokens": 8225864} {"current_steps": 14270, "total_steps": 67140, "loss": 0.6976, "lr": 4.809611776735538e-05, "epoch": 2.1254095918975278, "percentage": 21.25, "elapsed_time": "0:59:20", "remaining_time": "3:39:52", "throughput": 2311.01, "total_tokens": 8228936} {"current_steps": 14275, "total_steps": 67140, "loss": 0.831, "lr": 4.809362944123129e-05, "epoch": 2.1261543044384865, "percentage": 21.26, "elapsed_time": "0:59:21", "remaining_time": "3:39:50", "throughput": 2311.04, "total_tokens": 8231592} {"current_steps": 14280, "total_steps": 67140, "loss": 0.8254, "lr": 4.809113955453363e-05, "epoch": 2.126899016979446, "percentage": 21.27, "elapsed_time": "0:59:22", "remaining_time": "3:39:49", "throughput": 2311.08, "total_tokens": 8234312} {"current_steps": 14285, "total_steps": 67140, "loss": 0.6256, "lr": 4.8088648107430636e-05, "epoch": 2.127643729520405, "percentage": 21.28, "elapsed_time": "0:59:24", "remaining_time": "3:39:47", "throughput": 2311.13, "total_tokens": 8237096} {"current_steps": 14290, "total_steps": 67140, "loss": 0.6849, "lr": 4.8086155100090676e-05, "epoch": 2.128388442061364, "percentage": 21.28, "elapsed_time": "0:59:25", "remaining_time": "3:39:45", "throughput": 2311.18, "total_tokens": 8239848} {"current_steps": 14295, "total_steps": 67140, "loss": 0.6017, "lr": 4.8083660532682214e-05, "epoch": 2.1291331546023233, "percentage": 21.29, "elapsed_time": "0:59:26", "remaining_time": "3:39:43", "throughput": 2311.24, "total_tokens": 8242664} {"current_steps": 14300, "total_steps": 67140, "loss": 0.6126, "lr": 4.8081164405373825e-05, "epoch": 2.1298778671432825, "percentage": 21.3, "elapsed_time": "0:59:27", "remaining_time": "3:39:42", "throughput": 2311.35, "total_tokens": 8245704} {"current_steps": 14305, "total_steps": 67140, "loss": 0.6868, "lr": 4.807866671833418e-05, "epoch": 2.1306225796842417, "percentage": 21.31, "elapsed_time": "0:59:28", "remaining_time": "3:39:40", "throughput": 2311.39, "total_tokens": 8248424} {"current_steps": 14310, "total_steps": 67140, "loss": 0.6748, "lr": 4.807616747173208e-05, "epoch": 2.131367292225201, "percentage": 21.31, "elapsed_time": "0:59:29", "remaining_time": "3:39:38", "throughput": 2311.47, "total_tokens": 8251400} {"current_steps": 14315, "total_steps": 67140, "loss": 0.7786, "lr": 4.8073666665736394e-05, "epoch": 2.13211200476616, "percentage": 21.32, "elapsed_time": "0:59:30", "remaining_time": "3:39:37", "throughput": 2311.57, "total_tokens": 8254472} {"current_steps": 14320, "total_steps": 67140, "loss": 0.7551, "lr": 4.807116430051614e-05, "epoch": 2.1328567173071193, "percentage": 21.33, "elapsed_time": "0:59:32", "remaining_time": "3:39:35", "throughput": 2311.62, "total_tokens": 8257256} {"current_steps": 14325, "total_steps": 67140, "loss": 0.7543, "lr": 4.806866037624039e-05, "epoch": 2.1336014298480785, "percentage": 21.34, "elapsed_time": "0:59:33", "remaining_time": "3:39:34", "throughput": 2311.74, "total_tokens": 8260392} {"current_steps": 14330, "total_steps": 67140, "loss": 0.6907, "lr": 4.806615489307836e-05, "epoch": 2.1343461423890377, "percentage": 21.34, "elapsed_time": "0:59:34", "remaining_time": "3:39:32", "throughput": 2311.8, "total_tokens": 8263208} {"current_steps": 14335, "total_steps": 67140, "loss": 0.6786, "lr": 4.806364785119937e-05, "epoch": 2.135090854929997, "percentage": 21.35, "elapsed_time": "0:59:35", "remaining_time": "3:39:30", "throughput": 2311.85, "total_tokens": 8265960} {"current_steps": 14340, "total_steps": 67140, "loss": 0.6021, "lr": 4.8061139250772825e-05, "epoch": 2.135835567470956, "percentage": 21.36, "elapsed_time": "0:59:36", "remaining_time": "3:39:29", "throughput": 2311.93, "total_tokens": 8268872} {"current_steps": 14345, "total_steps": 67140, "loss": 0.5387, "lr": 4.805862909196825e-05, "epoch": 2.1365802800119154, "percentage": 21.37, "elapsed_time": "0:59:37", "remaining_time": "3:39:27", "throughput": 2311.98, "total_tokens": 8271624} {"current_steps": 14350, "total_steps": 67140, "loss": 0.6795, "lr": 4.805611737495527e-05, "epoch": 2.1373249925528746, "percentage": 21.37, "elapsed_time": "0:59:38", "remaining_time": "3:39:25", "throughput": 2312.05, "total_tokens": 8274536} {"current_steps": 14355, "total_steps": 67140, "loss": 0.7663, "lr": 4.8053604099903614e-05, "epoch": 2.1380697050938338, "percentage": 21.38, "elapsed_time": "0:59:40", "remaining_time": "3:39:24", "throughput": 2312.15, "total_tokens": 8277544} {"current_steps": 14360, "total_steps": 67140, "loss": 0.6736, "lr": 4.8051089266983126e-05, "epoch": 2.138814417634793, "percentage": 21.39, "elapsed_time": "0:59:41", "remaining_time": "3:39:22", "throughput": 2312.26, "total_tokens": 8280712} {"current_steps": 14365, "total_steps": 67140, "loss": 0.6301, "lr": 4.804857287636375e-05, "epoch": 2.139559130175752, "percentage": 21.4, "elapsed_time": "0:59:42", "remaining_time": "3:39:21", "throughput": 2312.37, "total_tokens": 8283752} {"current_steps": 14370, "total_steps": 67140, "loss": 0.771, "lr": 4.804605492821552e-05, "epoch": 2.1403038427167114, "percentage": 21.4, "elapsed_time": "0:59:43", "remaining_time": "3:39:19", "throughput": 2312.43, "total_tokens": 8286536} {"current_steps": 14375, "total_steps": 67140, "loss": 0.6524, "lr": 4.80435354227086e-05, "epoch": 2.1410485552576706, "percentage": 21.41, "elapsed_time": "0:59:44", "remaining_time": "3:39:17", "throughput": 2312.52, "total_tokens": 8289512} {"current_steps": 14380, "total_steps": 67140, "loss": 0.7673, "lr": 4.8041014360013236e-05, "epoch": 2.1417932677986298, "percentage": 21.42, "elapsed_time": "0:59:45", "remaining_time": "3:39:16", "throughput": 2312.59, "total_tokens": 8292360} {"current_steps": 14385, "total_steps": 67140, "loss": 0.5483, "lr": 4.803849174029981e-05, "epoch": 2.142537980339589, "percentage": 21.43, "elapsed_time": "0:59:46", "remaining_time": "3:39:14", "throughput": 2312.63, "total_tokens": 8295048} {"current_steps": 14390, "total_steps": 67140, "loss": 0.7286, "lr": 4.803596756373877e-05, "epoch": 2.143282692880548, "percentage": 21.43, "elapsed_time": "0:59:47", "remaining_time": "3:39:12", "throughput": 2312.73, "total_tokens": 8298088} {"current_steps": 14395, "total_steps": 67140, "loss": 0.6504, "lr": 4.8033441830500706e-05, "epoch": 2.1440274054215074, "percentage": 21.44, "elapsed_time": "0:59:49", "remaining_time": "3:39:11", "throughput": 2312.83, "total_tokens": 8301128} {"current_steps": 14400, "total_steps": 67140, "loss": 0.6306, "lr": 4.803091454075629e-05, "epoch": 2.1447721179624666, "percentage": 21.45, "elapsed_time": "0:59:50", "remaining_time": "3:39:09", "throughput": 2312.9, "total_tokens": 8304072} {"current_steps": 14405, "total_steps": 67140, "loss": 0.703, "lr": 4.8028385694676306e-05, "epoch": 2.145516830503426, "percentage": 21.46, "elapsed_time": "0:59:51", "remaining_time": "3:39:07", "throughput": 2312.99, "total_tokens": 8307016} {"current_steps": 14410, "total_steps": 67140, "loss": 0.5142, "lr": 4.802585529243164e-05, "epoch": 2.146261543044385, "percentage": 21.46, "elapsed_time": "0:59:52", "remaining_time": "3:39:05", "throughput": 2312.98, "total_tokens": 8309416} {"current_steps": 14415, "total_steps": 67140, "loss": 0.7509, "lr": 4.80233233341933e-05, "epoch": 2.147006255585344, "percentage": 21.47, "elapsed_time": "0:59:53", "remaining_time": "3:39:04", "throughput": 2313.09, "total_tokens": 8312552} {"current_steps": 14420, "total_steps": 67140, "loss": 0.5542, "lr": 4.802078982013236e-05, "epoch": 2.1477509681263034, "percentage": 21.48, "elapsed_time": "0:59:54", "remaining_time": "3:39:02", "throughput": 2313.12, "total_tokens": 8315176} {"current_steps": 14425, "total_steps": 67140, "loss": 0.6721, "lr": 4.801825475042005e-05, "epoch": 2.1484956806672626, "percentage": 21.48, "elapsed_time": "0:59:55", "remaining_time": "3:39:00", "throughput": 2313.2, "total_tokens": 8318056} {"current_steps": 14430, "total_steps": 67140, "loss": 0.6372, "lr": 4.801571812522767e-05, "epoch": 2.149240393208222, "percentage": 21.49, "elapsed_time": "0:59:57", "remaining_time": "3:38:59", "throughput": 2313.25, "total_tokens": 8320840} {"current_steps": 14435, "total_steps": 67140, "loss": 0.5022, "lr": 4.801317994472663e-05, "epoch": 2.149985105749181, "percentage": 21.5, "elapsed_time": "0:59:58", "remaining_time": "3:38:57", "throughput": 2313.31, "total_tokens": 8323688} {"current_steps": 14440, "total_steps": 67140, "loss": 0.5966, "lr": 4.801064020908845e-05, "epoch": 2.15072981829014, "percentage": 21.51, "elapsed_time": "0:59:59", "remaining_time": "3:38:56", "throughput": 2313.39, "total_tokens": 8326664} {"current_steps": 14445, "total_steps": 67140, "loss": 0.492, "lr": 4.800809891848477e-05, "epoch": 2.1514745308310994, "percentage": 21.51, "elapsed_time": "1:00:00", "remaining_time": "3:38:54", "throughput": 2313.43, "total_tokens": 8329384} {"current_steps": 14450, "total_steps": 67140, "loss": 0.6373, "lr": 4.80055560730873e-05, "epoch": 2.152219243372058, "percentage": 21.52, "elapsed_time": "1:00:01", "remaining_time": "3:38:52", "throughput": 2313.5, "total_tokens": 8332296} {"current_steps": 14455, "total_steps": 67140, "loss": 0.6405, "lr": 4.800301167306789e-05, "epoch": 2.1529639559130174, "percentage": 21.53, "elapsed_time": "1:00:02", "remaining_time": "3:38:51", "throughput": 2313.58, "total_tokens": 8335272} {"current_steps": 14460, "total_steps": 67140, "loss": 0.6507, "lr": 4.800046571859847e-05, "epoch": 2.1537086684539766, "percentage": 21.54, "elapsed_time": "1:00:03", "remaining_time": "3:38:49", "throughput": 2313.68, "total_tokens": 8338344} {"current_steps": 14465, "total_steps": 67140, "loss": 0.5883, "lr": 4.79979182098511e-05, "epoch": 2.1544533809949358, "percentage": 21.54, "elapsed_time": "1:00:05", "remaining_time": "3:38:47", "throughput": 2313.75, "total_tokens": 8341192} {"current_steps": 14470, "total_steps": 67140, "loss": 0.798, "lr": 4.7995369146997906e-05, "epoch": 2.155198093535895, "percentage": 21.55, "elapsed_time": "1:00:06", "remaining_time": "3:38:46", "throughput": 2313.84, "total_tokens": 8344200} {"current_steps": 14475, "total_steps": 67140, "loss": 0.7771, "lr": 4.7992818530211164e-05, "epoch": 2.155942806076854, "percentage": 21.56, "elapsed_time": "1:00:07", "remaining_time": "3:38:44", "throughput": 2313.93, "total_tokens": 8347176} {"current_steps": 14480, "total_steps": 67140, "loss": 0.7311, "lr": 4.799026635966323e-05, "epoch": 2.1566875186178134, "percentage": 21.57, "elapsed_time": "1:00:08", "remaining_time": "3:38:43", "throughput": 2314.01, "total_tokens": 8350120} {"current_steps": 14485, "total_steps": 67140, "loss": 0.5666, "lr": 4.798771263552656e-05, "epoch": 2.1574322311587726, "percentage": 21.57, "elapsed_time": "1:00:09", "remaining_time": "3:38:41", "throughput": 2314.09, "total_tokens": 8353032} {"current_steps": 14490, "total_steps": 67140, "loss": 0.7009, "lr": 4.798515735797374e-05, "epoch": 2.158176943699732, "percentage": 21.58, "elapsed_time": "1:00:10", "remaining_time": "3:38:40", "throughput": 2314.29, "total_tokens": 8356776} {"current_steps": 14495, "total_steps": 67140, "loss": 0.5773, "lr": 4.7982600527177427e-05, "epoch": 2.158921656240691, "percentage": 21.59, "elapsed_time": "1:00:12", "remaining_time": "3:38:38", "throughput": 2314.4, "total_tokens": 8359848} {"current_steps": 14500, "total_steps": 67140, "loss": 0.5745, "lr": 4.798004214331042e-05, "epoch": 2.15966636878165, "percentage": 21.6, "elapsed_time": "1:00:13", "remaining_time": "3:38:37", "throughput": 2314.43, "total_tokens": 8362536} {"current_steps": 14505, "total_steps": 67140, "loss": 0.5126, "lr": 4.7977482206545586e-05, "epoch": 2.1604110813226094, "percentage": 21.6, "elapsed_time": "1:00:14", "remaining_time": "3:38:35", "throughput": 2314.46, "total_tokens": 8365160} {"current_steps": 14510, "total_steps": 67140, "loss": 0.7992, "lr": 4.797492071705593e-05, "epoch": 2.1611557938635686, "percentage": 21.61, "elapsed_time": "1:00:15", "remaining_time": "3:38:33", "throughput": 2314.56, "total_tokens": 8368168} {"current_steps": 14515, "total_steps": 67140, "loss": 0.576, "lr": 4.7972357675014546e-05, "epoch": 2.161900506404528, "percentage": 21.62, "elapsed_time": "1:00:16", "remaining_time": "3:38:32", "throughput": 2314.6, "total_tokens": 8370888} {"current_steps": 14520, "total_steps": 67140, "loss": 0.742, "lr": 4.796979308059462e-05, "epoch": 2.162645218945487, "percentage": 21.63, "elapsed_time": "1:00:17", "remaining_time": "3:38:30", "throughput": 2314.63, "total_tokens": 8373480} {"current_steps": 14525, "total_steps": 67140, "loss": 0.6841, "lr": 4.796722693396947e-05, "epoch": 2.163389931486446, "percentage": 21.63, "elapsed_time": "1:00:18", "remaining_time": "3:38:28", "throughput": 2314.74, "total_tokens": 8376552} {"current_steps": 14530, "total_steps": 67140, "loss": 0.6513, "lr": 4.79646592353125e-05, "epoch": 2.1641346440274054, "percentage": 21.64, "elapsed_time": "1:00:19", "remaining_time": "3:38:27", "throughput": 2314.81, "total_tokens": 8379464} {"current_steps": 14535, "total_steps": 67140, "loss": 0.5741, "lr": 4.7962089984797235e-05, "epoch": 2.1648793565683646, "percentage": 21.65, "elapsed_time": "1:00:21", "remaining_time": "3:38:25", "throughput": 2314.89, "total_tokens": 8382440} {"current_steps": 14540, "total_steps": 67140, "loss": 0.5065, "lr": 4.795951918259727e-05, "epoch": 2.165624069109324, "percentage": 21.66, "elapsed_time": "1:00:22", "remaining_time": "3:38:23", "throughput": 2314.93, "total_tokens": 8385160} {"current_steps": 14545, "total_steps": 67140, "loss": 0.8411, "lr": 4.795694682888635e-05, "epoch": 2.166368781650283, "percentage": 21.66, "elapsed_time": "1:00:23", "remaining_time": "3:38:21", "throughput": 2314.98, "total_tokens": 8387848} {"current_steps": 14550, "total_steps": 67140, "loss": 0.7387, "lr": 4.795437292383831e-05, "epoch": 2.167113494191242, "percentage": 21.67, "elapsed_time": "1:00:24", "remaining_time": "3:38:20", "throughput": 2315.02, "total_tokens": 8390600} {"current_steps": 14555, "total_steps": 67140, "loss": 0.5314, "lr": 4.7951797467627065e-05, "epoch": 2.1678582067322014, "percentage": 21.68, "elapsed_time": "1:00:25", "remaining_time": "3:38:18", "throughput": 2315.1, "total_tokens": 8393480} {"current_steps": 14560, "total_steps": 67140, "loss": 0.6399, "lr": 4.7949220460426666e-05, "epoch": 2.1686029192731606, "percentage": 21.69, "elapsed_time": "1:00:26", "remaining_time": "3:38:16", "throughput": 2315.14, "total_tokens": 8396200} {"current_steps": 14565, "total_steps": 67140, "loss": 0.5939, "lr": 4.794664190241125e-05, "epoch": 2.16934763181412, "percentage": 21.69, "elapsed_time": "1:00:27", "remaining_time": "3:38:15", "throughput": 2315.23, "total_tokens": 8399208} {"current_steps": 14570, "total_steps": 67140, "loss": 0.5199, "lr": 4.794406179375507e-05, "epoch": 2.170092344355079, "percentage": 21.7, "elapsed_time": "1:00:28", "remaining_time": "3:38:13", "throughput": 2315.25, "total_tokens": 8401800} {"current_steps": 14575, "total_steps": 67140, "loss": 0.5517, "lr": 4.794148013463248e-05, "epoch": 2.1708370568960382, "percentage": 21.71, "elapsed_time": "1:00:30", "remaining_time": "3:38:11", "throughput": 2315.32, "total_tokens": 8404712} {"current_steps": 14580, "total_steps": 67140, "loss": 0.7342, "lr": 4.793889692521792e-05, "epoch": 2.1715817694369974, "percentage": 21.72, "elapsed_time": "1:00:31", "remaining_time": "3:38:10", "throughput": 2315.37, "total_tokens": 8407432} {"current_steps": 14585, "total_steps": 67140, "loss": 0.6637, "lr": 4.793631216568599e-05, "epoch": 2.1723264819779566, "percentage": 21.72, "elapsed_time": "1:00:32", "remaining_time": "3:38:08", "throughput": 2315.44, "total_tokens": 8410312} {"current_steps": 14590, "total_steps": 67140, "loss": 0.712, "lr": 4.793372585621133e-05, "epoch": 2.173071194518916, "percentage": 21.73, "elapsed_time": "1:00:33", "remaining_time": "3:38:06", "throughput": 2315.52, "total_tokens": 8413320} {"current_steps": 14595, "total_steps": 67140, "loss": 0.5606, "lr": 4.793113799696871e-05, "epoch": 2.173815907059875, "percentage": 21.74, "elapsed_time": "1:00:34", "remaining_time": "3:38:05", "throughput": 2315.58, "total_tokens": 8416168} {"current_steps": 14600, "total_steps": 67140, "loss": 0.7773, "lr": 4.792854858813303e-05, "epoch": 2.1745606196008342, "percentage": 21.75, "elapsed_time": "1:00:35", "remaining_time": "3:38:03", "throughput": 2315.69, "total_tokens": 8419240} {"current_steps": 14605, "total_steps": 67140, "loss": 0.7389, "lr": 4.792595762987924e-05, "epoch": 2.1753053321417934, "percentage": 21.75, "elapsed_time": "1:00:36", "remaining_time": "3:38:02", "throughput": 2315.82, "total_tokens": 8422440} {"current_steps": 14610, "total_steps": 67140, "loss": 0.9258, "lr": 4.792336512238246e-05, "epoch": 2.1760500446827526, "percentage": 21.76, "elapsed_time": "1:00:38", "remaining_time": "3:38:00", "throughput": 2315.84, "total_tokens": 8425032} {"current_steps": 14615, "total_steps": 67140, "loss": 0.7243, "lr": 4.7920771065817846e-05, "epoch": 2.176794757223712, "percentage": 21.77, "elapsed_time": "1:00:39", "remaining_time": "3:37:58", "throughput": 2315.89, "total_tokens": 8427816} {"current_steps": 14620, "total_steps": 67140, "loss": 0.7244, "lr": 4.791817546036072e-05, "epoch": 2.177539469764671, "percentage": 21.78, "elapsed_time": "1:00:40", "remaining_time": "3:37:57", "throughput": 2315.94, "total_tokens": 8430632} {"current_steps": 14625, "total_steps": 67140, "loss": 0.7683, "lr": 4.7915578306186485e-05, "epoch": 2.17828418230563, "percentage": 21.78, "elapsed_time": "1:00:41", "remaining_time": "3:37:55", "throughput": 2315.98, "total_tokens": 8433384} {"current_steps": 14630, "total_steps": 67140, "loss": 0.6438, "lr": 4.791297960347063e-05, "epoch": 2.179028894846589, "percentage": 21.79, "elapsed_time": "1:00:42", "remaining_time": "3:37:53", "throughput": 2316.0, "total_tokens": 8435976} {"current_steps": 14635, "total_steps": 67140, "loss": 0.704, "lr": 4.791037935238877e-05, "epoch": 2.179773607387548, "percentage": 21.8, "elapsed_time": "1:00:43", "remaining_time": "3:37:52", "throughput": 2316.07, "total_tokens": 8438920} {"current_steps": 14640, "total_steps": 67140, "loss": 0.721, "lr": 4.790777755311662e-05, "epoch": 2.1805183199285074, "percentage": 21.81, "elapsed_time": "1:00:44", "remaining_time": "3:37:50", "throughput": 2316.11, "total_tokens": 8441640} {"current_steps": 14645, "total_steps": 67140, "loss": 0.7425, "lr": 4.790517420583e-05, "epoch": 2.1812630324694666, "percentage": 21.81, "elapsed_time": "1:00:45", "remaining_time": "3:37:48", "throughput": 2316.18, "total_tokens": 8444488} {"current_steps": 14650, "total_steps": 67140, "loss": 0.6379, "lr": 4.790256931070483e-05, "epoch": 2.182007745010426, "percentage": 21.82, "elapsed_time": "1:00:46", "remaining_time": "3:37:46", "throughput": 2316.23, "total_tokens": 8447240} {"current_steps": 14655, "total_steps": 67140, "loss": 0.5947, "lr": 4.789996286791715e-05, "epoch": 2.182752457551385, "percentage": 21.83, "elapsed_time": "1:00:48", "remaining_time": "3:37:45", "throughput": 2316.29, "total_tokens": 8450088} {"current_steps": 14660, "total_steps": 67140, "loss": 0.7735, "lr": 4.789735487764307e-05, "epoch": 2.1834971700923442, "percentage": 21.83, "elapsed_time": "1:00:49", "remaining_time": "3:37:43", "throughput": 2316.33, "total_tokens": 8452776} {"current_steps": 14665, "total_steps": 67140, "loss": 0.6484, "lr": 4.789474534005885e-05, "epoch": 2.1842418826333034, "percentage": 21.84, "elapsed_time": "1:00:50", "remaining_time": "3:37:41", "throughput": 2316.39, "total_tokens": 8455656} {"current_steps": 14670, "total_steps": 67140, "loss": 0.5069, "lr": 4.789213425534082e-05, "epoch": 2.1849865951742626, "percentage": 21.85, "elapsed_time": "1:00:51", "remaining_time": "3:37:40", "throughput": 2316.42, "total_tokens": 8458312} {"current_steps": 14675, "total_steps": 67140, "loss": 0.7101, "lr": 4.788952162366543e-05, "epoch": 2.185731307715222, "percentage": 21.86, "elapsed_time": "1:00:52", "remaining_time": "3:37:38", "throughput": 2316.57, "total_tokens": 8461672} {"current_steps": 14680, "total_steps": 67140, "loss": 0.6543, "lr": 4.7886907445209234e-05, "epoch": 2.186476020256181, "percentage": 21.86, "elapsed_time": "1:00:53", "remaining_time": "3:37:37", "throughput": 2316.64, "total_tokens": 8464584} {"current_steps": 14685, "total_steps": 67140, "loss": 0.7726, "lr": 4.7884291720148876e-05, "epoch": 2.1872207327971402, "percentage": 21.87, "elapsed_time": "1:00:54", "remaining_time": "3:37:35", "throughput": 2316.68, "total_tokens": 8467336} {"current_steps": 14690, "total_steps": 67140, "loss": 0.6818, "lr": 4.7881674448661136e-05, "epoch": 2.1879654453380994, "percentage": 21.88, "elapsed_time": "1:00:56", "remaining_time": "3:37:33", "throughput": 2316.76, "total_tokens": 8470280} {"current_steps": 14695, "total_steps": 67140, "loss": 0.639, "lr": 4.7879055630922856e-05, "epoch": 2.1887101578790586, "percentage": 21.89, "elapsed_time": "1:00:57", "remaining_time": "3:37:32", "throughput": 2316.86, "total_tokens": 8473384} {"current_steps": 14700, "total_steps": 67140, "loss": 0.8402, "lr": 4.7876435267111024e-05, "epoch": 2.189454870420018, "percentage": 21.89, "elapsed_time": "1:00:58", "remaining_time": "3:37:30", "throughput": 2316.96, "total_tokens": 8476424} {"current_steps": 14705, "total_steps": 67140, "loss": 0.6352, "lr": 4.7873813357402704e-05, "epoch": 2.190199582960977, "percentage": 21.9, "elapsed_time": "1:00:59", "remaining_time": "3:37:29", "throughput": 2317.01, "total_tokens": 8479176} {"current_steps": 14710, "total_steps": 67140, "loss": 0.6683, "lr": 4.7871189901975075e-05, "epoch": 2.1909442955019363, "percentage": 21.91, "elapsed_time": "1:01:00", "remaining_time": "3:37:27", "throughput": 2317.1, "total_tokens": 8482184} {"current_steps": 14715, "total_steps": 67140, "loss": 0.5051, "lr": 4.786856490100542e-05, "epoch": 2.1916890080428955, "percentage": 21.92, "elapsed_time": "1:01:01", "remaining_time": "3:37:26", "throughput": 2317.21, "total_tokens": 8485256} {"current_steps": 14720, "total_steps": 67140, "loss": 0.5552, "lr": 4.786593835467112e-05, "epoch": 2.1924337205838547, "percentage": 21.92, "elapsed_time": "1:01:03", "remaining_time": "3:37:24", "throughput": 2317.29, "total_tokens": 8488264} {"current_steps": 14725, "total_steps": 67140, "loss": 0.5125, "lr": 4.786331026314968e-05, "epoch": 2.193178433124814, "percentage": 21.93, "elapsed_time": "1:01:04", "remaining_time": "3:37:22", "throughput": 2317.36, "total_tokens": 8491144} {"current_steps": 14730, "total_steps": 67140, "loss": 0.7842, "lr": 4.7860680626618684e-05, "epoch": 2.193923145665773, "percentage": 21.94, "elapsed_time": "1:01:05", "remaining_time": "3:37:21", "throughput": 2317.42, "total_tokens": 8493960} {"current_steps": 14735, "total_steps": 67140, "loss": 0.6259, "lr": 4.7858049445255834e-05, "epoch": 2.1946678582067323, "percentage": 21.95, "elapsed_time": "1:01:06", "remaining_time": "3:37:19", "throughput": 2317.48, "total_tokens": 8496840} {"current_steps": 14740, "total_steps": 67140, "loss": 0.715, "lr": 4.7855416719238945e-05, "epoch": 2.1954125707476915, "percentage": 21.95, "elapsed_time": "1:01:07", "remaining_time": "3:37:17", "throughput": 2317.53, "total_tokens": 8499592} {"current_steps": 14745, "total_steps": 67140, "loss": 0.621, "lr": 4.78527824487459e-05, "epoch": 2.1961572832886507, "percentage": 21.96, "elapsed_time": "1:01:08", "remaining_time": "3:37:16", "throughput": 2317.62, "total_tokens": 8502632} {"current_steps": 14750, "total_steps": 67140, "loss": 0.6383, "lr": 4.785014663395475e-05, "epoch": 2.19690199582961, "percentage": 21.97, "elapsed_time": "1:01:09", "remaining_time": "3:37:14", "throughput": 2317.74, "total_tokens": 8505800} {"current_steps": 14755, "total_steps": 67140, "loss": 0.5961, "lr": 4.784750927504358e-05, "epoch": 2.197646708370569, "percentage": 21.98, "elapsed_time": "1:01:10", "remaining_time": "3:37:13", "throughput": 2317.78, "total_tokens": 8508552} {"current_steps": 14760, "total_steps": 67140, "loss": 0.6374, "lr": 4.784487037219063e-05, "epoch": 2.1983914209115283, "percentage": 21.98, "elapsed_time": "1:01:12", "remaining_time": "3:37:11", "throughput": 2317.86, "total_tokens": 8511464} {"current_steps": 14765, "total_steps": 67140, "loss": 0.6996, "lr": 4.784222992557422e-05, "epoch": 2.1991361334524875, "percentage": 21.99, "elapsed_time": "1:01:13", "remaining_time": "3:37:09", "throughput": 2317.86, "total_tokens": 8513992} {"current_steps": 14770, "total_steps": 67140, "loss": 0.7027, "lr": 4.783958793537278e-05, "epoch": 2.1998808459934467, "percentage": 22.0, "elapsed_time": "1:01:14", "remaining_time": "3:37:08", "throughput": 2317.9, "total_tokens": 8516680} {"current_steps": 14775, "total_steps": 67140, "loss": 0.5339, "lr": 4.783694440176485e-05, "epoch": 2.200625558534406, "percentage": 22.01, "elapsed_time": "1:01:15", "remaining_time": "3:37:06", "throughput": 2317.97, "total_tokens": 8519624} {"current_steps": 14780, "total_steps": 67140, "loss": 0.7701, "lr": 4.7834299324929056e-05, "epoch": 2.201370271075365, "percentage": 22.01, "elapsed_time": "1:01:16", "remaining_time": "3:37:04", "throughput": 2318.04, "total_tokens": 8522536} {"current_steps": 14785, "total_steps": 67140, "loss": 0.7502, "lr": 4.7831652705044164e-05, "epoch": 2.2021149836163243, "percentage": 22.02, "elapsed_time": "1:01:17", "remaining_time": "3:37:03", "throughput": 2318.13, "total_tokens": 8525512} {"current_steps": 14790, "total_steps": 67140, "loss": 0.5278, "lr": 4.7829004542289e-05, "epoch": 2.202859696157283, "percentage": 22.03, "elapsed_time": "1:01:18", "remaining_time": "3:37:01", "throughput": 2318.2, "total_tokens": 8528392} {"current_steps": 14795, "total_steps": 67140, "loss": 0.751, "lr": 4.7826354836842525e-05, "epoch": 2.2036044086982427, "percentage": 22.04, "elapsed_time": "1:01:20", "remaining_time": "3:37:00", "throughput": 2318.3, "total_tokens": 8531432} {"current_steps": 14800, "total_steps": 67140, "loss": 0.7227, "lr": 4.7823703588883796e-05, "epoch": 2.2043491212392015, "percentage": 22.04, "elapsed_time": "1:01:21", "remaining_time": "3:36:58", "throughput": 2318.39, "total_tokens": 8534440} {"current_steps": 14805, "total_steps": 67140, "loss": 0.679, "lr": 4.782105079859198e-05, "epoch": 2.2050938337801607, "percentage": 22.05, "elapsed_time": "1:01:22", "remaining_time": "3:36:56", "throughput": 2318.47, "total_tokens": 8537384} {"current_steps": 14810, "total_steps": 67140, "loss": 0.6437, "lr": 4.7818396466146326e-05, "epoch": 2.20583854632112, "percentage": 22.06, "elapsed_time": "1:01:23", "remaining_time": "3:36:55", "throughput": 2318.52, "total_tokens": 8540200} {"current_steps": 14815, "total_steps": 67140, "loss": 0.6691, "lr": 4.781574059172621e-05, "epoch": 2.206583258862079, "percentage": 22.07, "elapsed_time": "1:01:24", "remaining_time": "3:36:53", "throughput": 2318.56, "total_tokens": 8542888} {"current_steps": 14820, "total_steps": 67140, "loss": 0.5414, "lr": 4.781308317551112e-05, "epoch": 2.2073279714030383, "percentage": 22.07, "elapsed_time": "1:01:25", "remaining_time": "3:36:51", "throughput": 2318.63, "total_tokens": 8545768} {"current_steps": 14825, "total_steps": 67140, "loss": 0.5539, "lr": 4.781042421768061e-05, "epoch": 2.2080726839439975, "percentage": 22.08, "elapsed_time": "1:01:26", "remaining_time": "3:36:50", "throughput": 2318.68, "total_tokens": 8548552} {"current_steps": 14830, "total_steps": 67140, "loss": 0.6698, "lr": 4.7807763718414374e-05, "epoch": 2.2088173964849567, "percentage": 22.09, "elapsed_time": "1:01:27", "remaining_time": "3:36:48", "throughput": 2318.74, "total_tokens": 8551432} {"current_steps": 14835, "total_steps": 67140, "loss": 0.6687, "lr": 4.7805101677892194e-05, "epoch": 2.209562109025916, "percentage": 22.1, "elapsed_time": "1:01:29", "remaining_time": "3:36:47", "throughput": 2318.83, "total_tokens": 8554408} {"current_steps": 14840, "total_steps": 67140, "loss": 0.6831, "lr": 4.7802438096293964e-05, "epoch": 2.210306821566875, "percentage": 22.1, "elapsed_time": "1:01:30", "remaining_time": "3:36:45", "throughput": 2318.87, "total_tokens": 8557128} {"current_steps": 14845, "total_steps": 67140, "loss": 0.6204, "lr": 4.7799772973799674e-05, "epoch": 2.2110515341078343, "percentage": 22.11, "elapsed_time": "1:01:31", "remaining_time": "3:36:43", "throughput": 2318.95, "total_tokens": 8560040} {"current_steps": 14850, "total_steps": 67140, "loss": 0.621, "lr": 4.7797106310589424e-05, "epoch": 2.2117962466487935, "percentage": 22.12, "elapsed_time": "1:01:32", "remaining_time": "3:36:41", "throughput": 2319.0, "total_tokens": 8562824} {"current_steps": 14855, "total_steps": 67140, "loss": 0.8546, "lr": 4.779443810684341e-05, "epoch": 2.2125409591897527, "percentage": 22.13, "elapsed_time": "1:01:33", "remaining_time": "3:36:40", "throughput": 2319.11, "total_tokens": 8565960} {"current_steps": 14860, "total_steps": 67140, "loss": 0.7142, "lr": 4.779176836274195e-05, "epoch": 2.213285671730712, "percentage": 22.13, "elapsed_time": "1:01:34", "remaining_time": "3:36:38", "throughput": 2319.16, "total_tokens": 8568808} {"current_steps": 14865, "total_steps": 67140, "loss": 0.6979, "lr": 4.778909707846545e-05, "epoch": 2.214030384271671, "percentage": 22.14, "elapsed_time": "1:01:35", "remaining_time": "3:36:37", "throughput": 2319.2, "total_tokens": 8571496} {"current_steps": 14870, "total_steps": 67140, "loss": 0.6798, "lr": 4.778642425419442e-05, "epoch": 2.2147750968126303, "percentage": 22.15, "elapsed_time": "1:01:37", "remaining_time": "3:36:35", "throughput": 2319.28, "total_tokens": 8574504} {"current_steps": 14875, "total_steps": 67140, "loss": 0.7507, "lr": 4.778374989010949e-05, "epoch": 2.2155198093535895, "percentage": 22.16, "elapsed_time": "1:01:38", "remaining_time": "3:36:33", "throughput": 2319.32, "total_tokens": 8577256} {"current_steps": 14880, "total_steps": 67140, "loss": 0.7099, "lr": 4.778107398639136e-05, "epoch": 2.2162645218945487, "percentage": 22.16, "elapsed_time": "1:01:39", "remaining_time": "3:36:32", "throughput": 2319.41, "total_tokens": 8580200} {"current_steps": 14885, "total_steps": 67140, "loss": 0.6948, "lr": 4.777839654322088e-05, "epoch": 2.217009234435508, "percentage": 22.17, "elapsed_time": "1:01:40", "remaining_time": "3:36:30", "throughput": 2319.51, "total_tokens": 8583304} {"current_steps": 14890, "total_steps": 67140, "loss": 0.7786, "lr": 4.777571756077897e-05, "epoch": 2.217753946976467, "percentage": 22.18, "elapsed_time": "1:01:41", "remaining_time": "3:36:29", "throughput": 2319.59, "total_tokens": 8586248} {"current_steps": 14895, "total_steps": 67140, "loss": 0.6687, "lr": 4.777303703924667e-05, "epoch": 2.2184986595174263, "percentage": 22.18, "elapsed_time": "1:01:42", "remaining_time": "3:36:27", "throughput": 2319.63, "total_tokens": 8588968} {"current_steps": 14900, "total_steps": 67140, "loss": 0.6461, "lr": 4.777035497880511e-05, "epoch": 2.2192433720583855, "percentage": 22.19, "elapsed_time": "1:01:43", "remaining_time": "3:36:25", "throughput": 2319.73, "total_tokens": 8592008} {"current_steps": 14905, "total_steps": 67140, "loss": 0.6697, "lr": 4.776767137963554e-05, "epoch": 2.2199880845993447, "percentage": 22.2, "elapsed_time": "1:01:45", "remaining_time": "3:36:24", "throughput": 2319.84, "total_tokens": 8595144} {"current_steps": 14910, "total_steps": 67140, "loss": 0.6659, "lr": 4.776498624191931e-05, "epoch": 2.220732797140304, "percentage": 22.21, "elapsed_time": "1:01:46", "remaining_time": "3:36:23", "throughput": 2319.97, "total_tokens": 8598408} {"current_steps": 14915, "total_steps": 67140, "loss": 0.7664, "lr": 4.7762299565837855e-05, "epoch": 2.221477509681263, "percentage": 22.21, "elapsed_time": "1:01:47", "remaining_time": "3:36:21", "throughput": 2320.05, "total_tokens": 8601352} {"current_steps": 14920, "total_steps": 67140, "loss": 0.7017, "lr": 4.775961135157275e-05, "epoch": 2.2222222222222223, "percentage": 22.22, "elapsed_time": "1:01:48", "remaining_time": "3:36:19", "throughput": 2320.16, "total_tokens": 8604456} {"current_steps": 14925, "total_steps": 67140, "loss": 0.6124, "lr": 4.775692159930564e-05, "epoch": 2.2229669347631815, "percentage": 22.23, "elapsed_time": "1:01:49", "remaining_time": "3:36:18", "throughput": 2320.27, "total_tokens": 8607560} {"current_steps": 14930, "total_steps": 67140, "loss": 0.6304, "lr": 4.775423030921828e-05, "epoch": 2.2237116473041407, "percentage": 22.24, "elapsed_time": "1:01:50", "remaining_time": "3:36:16", "throughput": 2320.34, "total_tokens": 8610440} {"current_steps": 14935, "total_steps": 67140, "loss": 0.7242, "lr": 4.7751537481492565e-05, "epoch": 2.2244563598451, "percentage": 22.24, "elapsed_time": "1:01:52", "remaining_time": "3:36:15", "throughput": 2320.41, "total_tokens": 8613384} {"current_steps": 14940, "total_steps": 67140, "loss": 0.5488, "lr": 4.7748843116310434e-05, "epoch": 2.225201072386059, "percentage": 22.25, "elapsed_time": "1:01:53", "remaining_time": "3:36:13", "throughput": 2320.49, "total_tokens": 8616296} {"current_steps": 14945, "total_steps": 67140, "loss": 0.6717, "lr": 4.774614721385399e-05, "epoch": 2.2259457849270183, "percentage": 22.26, "elapsed_time": "1:01:54", "remaining_time": "3:36:12", "throughput": 2320.58, "total_tokens": 8619368} {"current_steps": 14950, "total_steps": 67140, "loss": 0.5777, "lr": 4.7743449774305386e-05, "epoch": 2.2266904974679775, "percentage": 22.27, "elapsed_time": "1:01:55", "remaining_time": "3:36:10", "throughput": 2320.65, "total_tokens": 8622248} {"current_steps": 14955, "total_steps": 67140, "loss": 0.7055, "lr": 4.774075079784692e-05, "epoch": 2.2274352100089367, "percentage": 22.27, "elapsed_time": "1:01:56", "remaining_time": "3:36:08", "throughput": 2320.71, "total_tokens": 8625128} {"current_steps": 14960, "total_steps": 67140, "loss": 0.566, "lr": 4.7738050284660966e-05, "epoch": 2.228179922549896, "percentage": 22.28, "elapsed_time": "1:01:57", "remaining_time": "3:36:07", "throughput": 2320.81, "total_tokens": 8628168} {"current_steps": 14965, "total_steps": 67140, "loss": 0.6546, "lr": 4.7735348234930024e-05, "epoch": 2.2289246350908547, "percentage": 22.29, "elapsed_time": "1:01:58", "remaining_time": "3:36:05", "throughput": 2320.91, "total_tokens": 8631208} {"current_steps": 14970, "total_steps": 67140, "loss": 0.6518, "lr": 4.773264464883669e-05, "epoch": 2.2296693476318143, "percentage": 22.3, "elapsed_time": "1:02:00", "remaining_time": "3:36:04", "throughput": 2321.0, "total_tokens": 8634152} {"current_steps": 14975, "total_steps": 67140, "loss": 0.6133, "lr": 4.772993952656364e-05, "epoch": 2.230414060172773, "percentage": 22.3, "elapsed_time": "1:02:01", "remaining_time": "3:36:02", "throughput": 2321.13, "total_tokens": 8637384} {"current_steps": 14980, "total_steps": 67140, "loss": 0.7801, "lr": 4.7727232868293705e-05, "epoch": 2.2311587727137323, "percentage": 22.31, "elapsed_time": "1:02:02", "remaining_time": "3:36:01", "throughput": 2321.21, "total_tokens": 8640424} {"current_steps": 14985, "total_steps": 67140, "loss": 0.6701, "lr": 4.7724524674209765e-05, "epoch": 2.2319034852546915, "percentage": 22.32, "elapsed_time": "1:02:03", "remaining_time": "3:35:59", "throughput": 2321.27, "total_tokens": 8643240} {"current_steps": 14990, "total_steps": 67140, "loss": 0.5551, "lr": 4.7721814944494834e-05, "epoch": 2.2326481977956507, "percentage": 22.33, "elapsed_time": "1:02:04", "remaining_time": "3:35:57", "throughput": 2321.32, "total_tokens": 8646024} {"current_steps": 14995, "total_steps": 67140, "loss": 0.7924, "lr": 4.771910367933204e-05, "epoch": 2.23339291033661, "percentage": 22.33, "elapsed_time": "1:02:05", "remaining_time": "3:35:56", "throughput": 2321.38, "total_tokens": 8648840} {"current_steps": 15000, "total_steps": 67140, "loss": 0.8663, "lr": 4.771639087890459e-05, "epoch": 2.234137622877569, "percentage": 22.34, "elapsed_time": "1:02:06", "remaining_time": "3:35:54", "throughput": 2321.44, "total_tokens": 8651688} {"current_steps": 15005, "total_steps": 67140, "loss": 0.6963, "lr": 4.771367654339579e-05, "epoch": 2.2348823354185283, "percentage": 22.35, "elapsed_time": "1:02:07", "remaining_time": "3:35:52", "throughput": 2321.46, "total_tokens": 8654344} {"current_steps": 15010, "total_steps": 67140, "loss": 0.574, "lr": 4.771096067298909e-05, "epoch": 2.2356270479594875, "percentage": 22.36, "elapsed_time": "1:02:09", "remaining_time": "3:35:51", "throughput": 2321.51, "total_tokens": 8657128} {"current_steps": 15015, "total_steps": 67140, "loss": 0.6121, "lr": 4.7708243267868e-05, "epoch": 2.2363717605004467, "percentage": 22.36, "elapsed_time": "1:02:10", "remaining_time": "3:35:49", "throughput": 2321.56, "total_tokens": 8659912} {"current_steps": 15020, "total_steps": 67140, "loss": 0.8117, "lr": 4.770552432821615e-05, "epoch": 2.237116473041406, "percentage": 22.37, "elapsed_time": "1:02:11", "remaining_time": "3:35:48", "throughput": 2321.67, "total_tokens": 8663016} {"current_steps": 15025, "total_steps": 67140, "loss": 0.6482, "lr": 4.770280385421728e-05, "epoch": 2.237861185582365, "percentage": 22.38, "elapsed_time": "1:02:12", "remaining_time": "3:35:46", "throughput": 2321.8, "total_tokens": 8666280} {"current_steps": 15030, "total_steps": 67140, "loss": 0.6719, "lr": 4.7700081846055236e-05, "epoch": 2.2386058981233243, "percentage": 22.39, "elapsed_time": "1:02:13", "remaining_time": "3:35:44", "throughput": 2321.88, "total_tokens": 8669224} {"current_steps": 15035, "total_steps": 67140, "loss": 0.6822, "lr": 4.7697358303913944e-05, "epoch": 2.2393506106642835, "percentage": 22.39, "elapsed_time": "1:02:14", "remaining_time": "3:35:43", "throughput": 2321.92, "total_tokens": 8671912} {"current_steps": 15040, "total_steps": 67140, "loss": 0.7778, "lr": 4.769463322797746e-05, "epoch": 2.2400953232052427, "percentage": 22.4, "elapsed_time": "1:02:15", "remaining_time": "3:35:41", "throughput": 2322.02, "total_tokens": 8674984} {"current_steps": 15045, "total_steps": 67140, "loss": 0.7074, "lr": 4.7691906618429935e-05, "epoch": 2.240840035746202, "percentage": 22.41, "elapsed_time": "1:02:17", "remaining_time": "3:35:40", "throughput": 2322.09, "total_tokens": 8677896} {"current_steps": 15050, "total_steps": 67140, "loss": 0.5987, "lr": 4.768917847545562e-05, "epoch": 2.241584748287161, "percentage": 22.42, "elapsed_time": "1:02:18", "remaining_time": "3:35:38", "throughput": 2322.17, "total_tokens": 8680872} {"current_steps": 15055, "total_steps": 67140, "loss": 0.7142, "lr": 4.768644879923887e-05, "epoch": 2.2423294608281203, "percentage": 22.42, "elapsed_time": "1:02:19", "remaining_time": "3:35:36", "throughput": 2322.2, "total_tokens": 8683560} {"current_steps": 15060, "total_steps": 67140, "loss": 0.7553, "lr": 4.768371758996415e-05, "epoch": 2.2430741733690795, "percentage": 22.43, "elapsed_time": "1:02:20", "remaining_time": "3:35:35", "throughput": 2322.26, "total_tokens": 8686408} {"current_steps": 15065, "total_steps": 67140, "loss": 0.6491, "lr": 4.7680984847816015e-05, "epoch": 2.2438188859100388, "percentage": 22.44, "elapsed_time": "1:02:21", "remaining_time": "3:35:33", "throughput": 2322.33, "total_tokens": 8689320} {"current_steps": 15070, "total_steps": 67140, "loss": 0.7574, "lr": 4.767825057297914e-05, "epoch": 2.244563598450998, "percentage": 22.45, "elapsed_time": "1:02:22", "remaining_time": "3:35:32", "throughput": 2322.45, "total_tokens": 8692584} {"current_steps": 15075, "total_steps": 67140, "loss": 0.6686, "lr": 4.767551476563829e-05, "epoch": 2.245308310991957, "percentage": 22.45, "elapsed_time": "1:02:23", "remaining_time": "3:35:30", "throughput": 2322.51, "total_tokens": 8695432} {"current_steps": 15080, "total_steps": 67140, "loss": 0.6816, "lr": 4.767277742597835e-05, "epoch": 2.2460530235329164, "percentage": 22.46, "elapsed_time": "1:02:25", "remaining_time": "3:35:28", "throughput": 2322.55, "total_tokens": 8698152} {"current_steps": 15085, "total_steps": 67140, "loss": 0.6998, "lr": 4.7670038554184296e-05, "epoch": 2.2467977360738756, "percentage": 22.47, "elapsed_time": "1:02:26", "remaining_time": "3:35:27", "throughput": 2322.58, "total_tokens": 8700840} {"current_steps": 15090, "total_steps": 67140, "loss": 0.7293, "lr": 4.7667298150441194e-05, "epoch": 2.2475424486148348, "percentage": 22.48, "elapsed_time": "1:02:27", "remaining_time": "3:35:25", "throughput": 2322.68, "total_tokens": 8703912} {"current_steps": 15095, "total_steps": 67140, "loss": 0.6448, "lr": 4.7664556214934255e-05, "epoch": 2.248287161155794, "percentage": 22.48, "elapsed_time": "1:02:28", "remaining_time": "3:35:24", "throughput": 2322.76, "total_tokens": 8706888} {"current_steps": 15100, "total_steps": 67140, "loss": 0.6386, "lr": 4.766181274784874e-05, "epoch": 2.249031873696753, "percentage": 22.49, "elapsed_time": "1:02:29", "remaining_time": "3:35:22", "throughput": 2322.82, "total_tokens": 8709800} {"current_steps": 15105, "total_steps": 67140, "loss": 0.6544, "lr": 4.765906774937007e-05, "epoch": 2.2497765862377124, "percentage": 22.5, "elapsed_time": "1:02:30", "remaining_time": "3:35:21", "throughput": 2322.88, "total_tokens": 8712616} {"current_steps": 15110, "total_steps": 67140, "loss": 0.8153, "lr": 4.765632121968371e-05, "epoch": 2.2505212987786716, "percentage": 22.51, "elapsed_time": "1:02:31", "remaining_time": "3:35:19", "throughput": 2322.94, "total_tokens": 8715464} {"current_steps": 15115, "total_steps": 67140, "loss": 0.7552, "lr": 4.765357315897529e-05, "epoch": 2.2512660113196308, "percentage": 22.51, "elapsed_time": "1:02:33", "remaining_time": "3:35:18", "throughput": 2323.11, "total_tokens": 8718888} {"current_steps": 15120, "total_steps": 67140, "loss": 0.6915, "lr": 4.765082356743049e-05, "epoch": 2.25201072386059, "percentage": 22.52, "elapsed_time": "1:02:34", "remaining_time": "3:35:16", "throughput": 2323.13, "total_tokens": 8721512} {"current_steps": 15125, "total_steps": 67140, "loss": 0.6775, "lr": 4.7648072445235136e-05, "epoch": 2.252755436401549, "percentage": 22.53, "elapsed_time": "1:02:35", "remaining_time": "3:35:14", "throughput": 2323.23, "total_tokens": 8724584} {"current_steps": 15130, "total_steps": 67140, "loss": 0.6681, "lr": 4.764531979257511e-05, "epoch": 2.2535001489425084, "percentage": 22.54, "elapsed_time": "1:02:36", "remaining_time": "3:35:13", "throughput": 2323.36, "total_tokens": 8727880} {"current_steps": 15135, "total_steps": 67140, "loss": 0.711, "lr": 4.764256560963646e-05, "epoch": 2.2542448614834676, "percentage": 22.54, "elapsed_time": "1:02:37", "remaining_time": "3:35:11", "throughput": 2323.46, "total_tokens": 8731016} {"current_steps": 15140, "total_steps": 67140, "loss": 0.6889, "lr": 4.7639809896605275e-05, "epoch": 2.2549895740244263, "percentage": 22.55, "elapsed_time": "1:02:38", "remaining_time": "3:35:10", "throughput": 2323.53, "total_tokens": 8733896} {"current_steps": 15145, "total_steps": 67140, "loss": 0.6489, "lr": 4.763705265366779e-05, "epoch": 2.255734286565386, "percentage": 22.56, "elapsed_time": "1:02:40", "remaining_time": "3:35:08", "throughput": 2323.59, "total_tokens": 8736776} {"current_steps": 15150, "total_steps": 67140, "loss": 0.5727, "lr": 4.763429388101031e-05, "epoch": 2.2564789991063448, "percentage": 22.56, "elapsed_time": "1:02:41", "remaining_time": "3:35:07", "throughput": 2323.68, "total_tokens": 8739816} {"current_steps": 15155, "total_steps": 67140, "loss": 0.5255, "lr": 4.763153357881928e-05, "epoch": 2.257223711647304, "percentage": 22.57, "elapsed_time": "1:02:42", "remaining_time": "3:35:05", "throughput": 2323.79, "total_tokens": 8742984} {"current_steps": 15160, "total_steps": 67140, "loss": 0.6091, "lr": 4.7628771747281226e-05, "epoch": 2.257968424188263, "percentage": 22.58, "elapsed_time": "1:02:43", "remaining_time": "3:35:04", "throughput": 2323.89, "total_tokens": 8746088} {"current_steps": 15165, "total_steps": 67140, "loss": 0.6688, "lr": 4.762600838658278e-05, "epoch": 2.2587131367292224, "percentage": 22.59, "elapsed_time": "1:02:44", "remaining_time": "3:35:02", "throughput": 2323.96, "total_tokens": 8748968} {"current_steps": 15170, "total_steps": 67140, "loss": 0.6101, "lr": 4.762324349691067e-05, "epoch": 2.2594578492701816, "percentage": 22.59, "elapsed_time": "1:02:45", "remaining_time": "3:35:01", "throughput": 2324.03, "total_tokens": 8751848} {"current_steps": 15175, "total_steps": 67140, "loss": 0.7256, "lr": 4.762047707845175e-05, "epoch": 2.2602025618111408, "percentage": 22.6, "elapsed_time": "1:02:46", "remaining_time": "3:34:59", "throughput": 2324.06, "total_tokens": 8754536} {"current_steps": 15180, "total_steps": 67140, "loss": 0.6371, "lr": 4.761770913139296e-05, "epoch": 2.2609472743521, "percentage": 22.61, "elapsed_time": "1:02:48", "remaining_time": "3:34:57", "throughput": 2324.09, "total_tokens": 8757256} {"current_steps": 15185, "total_steps": 67140, "loss": 0.7007, "lr": 4.761493965592134e-05, "epoch": 2.261691986893059, "percentage": 22.62, "elapsed_time": "1:02:49", "remaining_time": "3:34:56", "throughput": 2324.15, "total_tokens": 8760104} {"current_steps": 15190, "total_steps": 67140, "loss": 0.485, "lr": 4.761216865222404e-05, "epoch": 2.2624366994340184, "percentage": 22.62, "elapsed_time": "1:02:50", "remaining_time": "3:34:54", "throughput": 2324.23, "total_tokens": 8763112} {"current_steps": 15195, "total_steps": 67140, "loss": 0.6758, "lr": 4.7609396120488324e-05, "epoch": 2.2631814119749776, "percentage": 22.63, "elapsed_time": "1:02:51", "remaining_time": "3:34:53", "throughput": 2324.34, "total_tokens": 8766248} {"current_steps": 15200, "total_steps": 67140, "loss": 0.7831, "lr": 4.760662206090154e-05, "epoch": 2.2639261245159368, "percentage": 22.64, "elapsed_time": "1:02:52", "remaining_time": "3:34:51", "throughput": 2324.37, "total_tokens": 8768936} {"current_steps": 15205, "total_steps": 67140, "loss": 0.7172, "lr": 4.7603846473651147e-05, "epoch": 2.264670837056896, "percentage": 22.65, "elapsed_time": "1:02:53", "remaining_time": "3:34:49", "throughput": 2324.41, "total_tokens": 8771656} {"current_steps": 15210, "total_steps": 67140, "loss": 0.6847, "lr": 4.760106935892471e-05, "epoch": 2.265415549597855, "percentage": 22.65, "elapsed_time": "1:02:54", "remaining_time": "3:34:48", "throughput": 2324.46, "total_tokens": 8774472} {"current_steps": 15215, "total_steps": 67140, "loss": 0.7723, "lr": 4.7598290716909897e-05, "epoch": 2.2661602621388144, "percentage": 22.66, "elapsed_time": "1:02:55", "remaining_time": "3:34:46", "throughput": 2324.51, "total_tokens": 8777224} {"current_steps": 15220, "total_steps": 67140, "loss": 0.7763, "lr": 4.7595510547794465e-05, "epoch": 2.2669049746797736, "percentage": 22.67, "elapsed_time": "1:02:57", "remaining_time": "3:34:44", "throughput": 2324.6, "total_tokens": 8780296} {"current_steps": 15225, "total_steps": 67140, "loss": 0.6973, "lr": 4.759272885176631e-05, "epoch": 2.267649687220733, "percentage": 22.68, "elapsed_time": "1:02:58", "remaining_time": "3:34:43", "throughput": 2324.69, "total_tokens": 8783240} {"current_steps": 15230, "total_steps": 67140, "loss": 0.5805, "lr": 4.758994562901339e-05, "epoch": 2.268394399761692, "percentage": 22.68, "elapsed_time": "1:02:59", "remaining_time": "3:34:41", "throughput": 2324.76, "total_tokens": 8786216} {"current_steps": 15235, "total_steps": 67140, "loss": 0.7277, "lr": 4.7587160879723785e-05, "epoch": 2.269139112302651, "percentage": 22.69, "elapsed_time": "1:03:00", "remaining_time": "3:34:40", "throughput": 2324.84, "total_tokens": 8789192} {"current_steps": 15240, "total_steps": 67140, "loss": 0.7926, "lr": 4.7584374604085684e-05, "epoch": 2.2698838248436104, "percentage": 22.7, "elapsed_time": "1:03:01", "remaining_time": "3:34:38", "throughput": 2324.9, "total_tokens": 8792040} {"current_steps": 15245, "total_steps": 67140, "loss": 0.7377, "lr": 4.758158680228737e-05, "epoch": 2.2706285373845696, "percentage": 22.71, "elapsed_time": "1:03:02", "remaining_time": "3:34:36", "throughput": 2324.92, "total_tokens": 8794664} {"current_steps": 15250, "total_steps": 67140, "loss": 0.6357, "lr": 4.757879747451722e-05, "epoch": 2.271373249925529, "percentage": 22.71, "elapsed_time": "1:03:03", "remaining_time": "3:34:35", "throughput": 2325.01, "total_tokens": 8797704} {"current_steps": 15255, "total_steps": 67140, "loss": 0.6729, "lr": 4.757600662096375e-05, "epoch": 2.272117962466488, "percentage": 22.72, "elapsed_time": "1:03:05", "remaining_time": "3:34:33", "throughput": 2325.12, "total_tokens": 8800872} {"current_steps": 15260, "total_steps": 67140, "loss": 0.6757, "lr": 4.757321424181553e-05, "epoch": 2.272862675007447, "percentage": 22.73, "elapsed_time": "1:03:06", "remaining_time": "3:34:32", "throughput": 2325.18, "total_tokens": 8803688} {"current_steps": 15265, "total_steps": 67140, "loss": 0.7185, "lr": 4.7570420337261275e-05, "epoch": 2.2736073875484064, "percentage": 22.74, "elapsed_time": "1:03:07", "remaining_time": "3:34:30", "throughput": 2325.23, "total_tokens": 8806504} {"current_steps": 15270, "total_steps": 67140, "loss": 0.6931, "lr": 4.756762490748977e-05, "epoch": 2.2743521000893656, "percentage": 22.74, "elapsed_time": "1:03:08", "remaining_time": "3:34:29", "throughput": 2325.32, "total_tokens": 8809544} {"current_steps": 15275, "total_steps": 67140, "loss": 0.5786, "lr": 4.7564827952689936e-05, "epoch": 2.275096812630325, "percentage": 22.75, "elapsed_time": "1:03:09", "remaining_time": "3:34:27", "throughput": 2325.4, "total_tokens": 8812520} {"current_steps": 15280, "total_steps": 67140, "loss": 0.5897, "lr": 4.756202947305076e-05, "epoch": 2.275841525171284, "percentage": 22.76, "elapsed_time": "1:03:10", "remaining_time": "3:34:25", "throughput": 2325.45, "total_tokens": 8815304} {"current_steps": 15285, "total_steps": 67140, "loss": 0.5542, "lr": 4.755922946876137e-05, "epoch": 2.276586237712243, "percentage": 22.77, "elapsed_time": "1:03:11", "remaining_time": "3:34:24", "throughput": 2325.52, "total_tokens": 8818280} {"current_steps": 15290, "total_steps": 67140, "loss": 0.7092, "lr": 4.755642794001097e-05, "epoch": 2.2773309502532024, "percentage": 22.77, "elapsed_time": "1:03:13", "remaining_time": "3:34:22", "throughput": 2325.56, "total_tokens": 8820968} {"current_steps": 15295, "total_steps": 67140, "loss": 0.7046, "lr": 4.755362488698888e-05, "epoch": 2.2780756627941616, "percentage": 22.78, "elapsed_time": "1:03:14", "remaining_time": "3:34:21", "throughput": 2325.64, "total_tokens": 8823976} {"current_steps": 15300, "total_steps": 67140, "loss": 0.7374, "lr": 4.755082030988452e-05, "epoch": 2.278820375335121, "percentage": 22.79, "elapsed_time": "1:03:15", "remaining_time": "3:34:19", "throughput": 2325.66, "total_tokens": 8826664} {"current_steps": 15305, "total_steps": 67140, "loss": 0.6783, "lr": 4.7548014208887396e-05, "epoch": 2.2795650878760796, "percentage": 22.8, "elapsed_time": "1:03:16", "remaining_time": "3:34:18", "throughput": 2325.79, "total_tokens": 8829928} {"current_steps": 15310, "total_steps": 67140, "loss": 0.5632, "lr": 4.7545206584187155e-05, "epoch": 2.2803098004170392, "percentage": 22.8, "elapsed_time": "1:03:17", "remaining_time": "3:34:16", "throughput": 2325.84, "total_tokens": 8832712} {"current_steps": 15315, "total_steps": 67140, "loss": 0.7296, "lr": 4.7542397435973515e-05, "epoch": 2.281054512957998, "percentage": 22.81, "elapsed_time": "1:03:18", "remaining_time": "3:34:15", "throughput": 2326.01, "total_tokens": 8836200} {"current_steps": 15320, "total_steps": 67140, "loss": 0.6344, "lr": 4.75395867644363e-05, "epoch": 2.2817992254989576, "percentage": 22.82, "elapsed_time": "1:03:19", "remaining_time": "3:34:13", "throughput": 2326.08, "total_tokens": 8839080} {"current_steps": 15325, "total_steps": 67140, "loss": 0.7775, "lr": 4.753677456976546e-05, "epoch": 2.2825439380399164, "percentage": 22.83, "elapsed_time": "1:03:21", "remaining_time": "3:34:11", "throughput": 2326.14, "total_tokens": 8841960} {"current_steps": 15330, "total_steps": 67140, "loss": 0.7516, "lr": 4.753396085215102e-05, "epoch": 2.2832886505808756, "percentage": 22.83, "elapsed_time": "1:03:22", "remaining_time": "3:34:10", "throughput": 2326.16, "total_tokens": 8844584} {"current_steps": 15335, "total_steps": 67140, "loss": 0.5422, "lr": 4.753114561178311e-05, "epoch": 2.284033363121835, "percentage": 22.84, "elapsed_time": "1:03:23", "remaining_time": "3:34:08", "throughput": 2326.2, "total_tokens": 8847400} {"current_steps": 15340, "total_steps": 67140, "loss": 0.7901, "lr": 4.7528328848852e-05, "epoch": 2.284778075662794, "percentage": 22.85, "elapsed_time": "1:03:24", "remaining_time": "3:34:06", "throughput": 2326.24, "total_tokens": 8850120} {"current_steps": 15345, "total_steps": 67140, "loss": 0.7316, "lr": 4.752551056354801e-05, "epoch": 2.285522788203753, "percentage": 22.86, "elapsed_time": "1:03:25", "remaining_time": "3:34:05", "throughput": 2326.29, "total_tokens": 8852936} {"current_steps": 15350, "total_steps": 67140, "loss": 0.6637, "lr": 4.7522690756061606e-05, "epoch": 2.2862675007447124, "percentage": 22.86, "elapsed_time": "1:03:26", "remaining_time": "3:34:03", "throughput": 2326.39, "total_tokens": 8856104} {"current_steps": 15355, "total_steps": 67140, "loss": 0.7048, "lr": 4.751986942658332e-05, "epoch": 2.2870122132856716, "percentage": 22.87, "elapsed_time": "1:03:27", "remaining_time": "3:34:02", "throughput": 2326.52, "total_tokens": 8859368} {"current_steps": 15360, "total_steps": 67140, "loss": 0.6923, "lr": 4.751704657530383e-05, "epoch": 2.287756925826631, "percentage": 22.88, "elapsed_time": "1:03:29", "remaining_time": "3:34:00", "throughput": 2326.54, "total_tokens": 8862024} {"current_steps": 15365, "total_steps": 67140, "loss": 0.6569, "lr": 4.751422220241387e-05, "epoch": 2.28850163836759, "percentage": 22.89, "elapsed_time": "1:03:30", "remaining_time": "3:33:59", "throughput": 2326.6, "total_tokens": 8864872} {"current_steps": 15370, "total_steps": 67140, "loss": 0.6611, "lr": 4.7511396308104314e-05, "epoch": 2.289246350908549, "percentage": 22.89, "elapsed_time": "1:03:31", "remaining_time": "3:33:57", "throughput": 2326.67, "total_tokens": 8867752} {"current_steps": 15375, "total_steps": 67140, "loss": 0.676, "lr": 4.750856889256613e-05, "epoch": 2.2899910634495084, "percentage": 22.9, "elapsed_time": "1:03:32", "remaining_time": "3:33:55", "throughput": 2326.69, "total_tokens": 8870440} {"current_steps": 15380, "total_steps": 67140, "loss": 0.6477, "lr": 4.750573995599036e-05, "epoch": 2.2907357759904676, "percentage": 22.91, "elapsed_time": "1:03:33", "remaining_time": "3:33:54", "throughput": 2326.73, "total_tokens": 8873160} {"current_steps": 15385, "total_steps": 67140, "loss": 0.7901, "lr": 4.7502909498568194e-05, "epoch": 2.291480488531427, "percentage": 22.91, "elapsed_time": "1:03:34", "remaining_time": "3:33:52", "throughput": 2326.79, "total_tokens": 8876040} {"current_steps": 15390, "total_steps": 67140, "loss": 0.5789, "lr": 4.7500077520490884e-05, "epoch": 2.292225201072386, "percentage": 22.92, "elapsed_time": "1:03:35", "remaining_time": "3:33:51", "throughput": 2326.81, "total_tokens": 8878728} {"current_steps": 15395, "total_steps": 67140, "loss": 0.586, "lr": 4.749724402194982e-05, "epoch": 2.2929699136133452, "percentage": 22.93, "elapsed_time": "1:03:36", "remaining_time": "3:33:49", "throughput": 2326.86, "total_tokens": 8881544} {"current_steps": 15400, "total_steps": 67140, "loss": 0.5501, "lr": 4.749440900313648e-05, "epoch": 2.2937146261543044, "percentage": 22.94, "elapsed_time": "1:03:38", "remaining_time": "3:33:47", "throughput": 2326.87, "total_tokens": 8884104} {"current_steps": 15405, "total_steps": 67140, "loss": 0.5865, "lr": 4.7491572464242415e-05, "epoch": 2.2944593386952636, "percentage": 22.94, "elapsed_time": "1:03:39", "remaining_time": "3:33:45", "throughput": 2326.92, "total_tokens": 8886888} {"current_steps": 15410, "total_steps": 67140, "loss": 0.7181, "lr": 4.748873440545935e-05, "epoch": 2.295204051236223, "percentage": 22.95, "elapsed_time": "1:03:40", "remaining_time": "3:33:44", "throughput": 2327.01, "total_tokens": 8889928} {"current_steps": 15415, "total_steps": 67140, "loss": 0.6507, "lr": 4.7485894826979025e-05, "epoch": 2.295948763777182, "percentage": 22.96, "elapsed_time": "1:03:41", "remaining_time": "3:33:43", "throughput": 2327.12, "total_tokens": 8893096} {"current_steps": 15420, "total_steps": 67140, "loss": 0.7366, "lr": 4.748305372899337e-05, "epoch": 2.2966934763181412, "percentage": 22.97, "elapsed_time": "1:03:42", "remaining_time": "3:33:41", "throughput": 2327.13, "total_tokens": 8895624} {"current_steps": 15425, "total_steps": 67140, "loss": 0.5477, "lr": 4.7480211111694335e-05, "epoch": 2.2974381888591004, "percentage": 22.97, "elapsed_time": "1:03:43", "remaining_time": "3:33:39", "throughput": 2327.18, "total_tokens": 8898408} {"current_steps": 15430, "total_steps": 67140, "loss": 0.6682, "lr": 4.747736697527404e-05, "epoch": 2.2981829014000597, "percentage": 22.98, "elapsed_time": "1:03:44", "remaining_time": "3:33:38", "throughput": 2327.25, "total_tokens": 8901352} {"current_steps": 15435, "total_steps": 67140, "loss": 0.6878, "lr": 4.747452131992467e-05, "epoch": 2.298927613941019, "percentage": 22.99, "elapsed_time": "1:03:45", "remaining_time": "3:33:36", "throughput": 2327.28, "total_tokens": 8904008} {"current_steps": 15440, "total_steps": 67140, "loss": 0.5352, "lr": 4.747167414583852e-05, "epoch": 2.299672326481978, "percentage": 23.0, "elapsed_time": "1:03:47", "remaining_time": "3:33:34", "throughput": 2327.35, "total_tokens": 8906920} {"current_steps": 15445, "total_steps": 67140, "loss": 0.7449, "lr": 4.7468825453208e-05, "epoch": 2.3004170390229373, "percentage": 23.0, "elapsed_time": "1:03:48", "remaining_time": "3:33:33", "throughput": 2327.42, "total_tokens": 8909832} {"current_steps": 15450, "total_steps": 67140, "loss": 0.705, "lr": 4.74659752422256e-05, "epoch": 2.3011617515638965, "percentage": 23.01, "elapsed_time": "1:03:49", "remaining_time": "3:33:31", "throughput": 2327.47, "total_tokens": 8912680} {"current_steps": 15455, "total_steps": 67140, "loss": 0.6524, "lr": 4.746312351308394e-05, "epoch": 2.3019064641048557, "percentage": 23.02, "elapsed_time": "1:03:50", "remaining_time": "3:33:29", "throughput": 2327.48, "total_tokens": 8915272} {"current_steps": 15460, "total_steps": 67140, "loss": 0.6612, "lr": 4.746027026597572e-05, "epoch": 2.302651176645815, "percentage": 23.03, "elapsed_time": "1:03:51", "remaining_time": "3:33:28", "throughput": 2327.56, "total_tokens": 8918248} {"current_steps": 15465, "total_steps": 67140, "loss": 0.6718, "lr": 4.7457415501093746e-05, "epoch": 2.303395889186774, "percentage": 23.03, "elapsed_time": "1:03:52", "remaining_time": "3:33:26", "throughput": 2327.61, "total_tokens": 8921064} {"current_steps": 15470, "total_steps": 67140, "loss": 0.6836, "lr": 4.745455921863095e-05, "epoch": 2.3041406017277333, "percentage": 23.04, "elapsed_time": "1:03:53", "remaining_time": "3:33:25", "throughput": 2327.71, "total_tokens": 8924136} {"current_steps": 15475, "total_steps": 67140, "loss": 0.7934, "lr": 4.7451701418780334e-05, "epoch": 2.3048853142686925, "percentage": 23.05, "elapsed_time": "1:03:55", "remaining_time": "3:33:23", "throughput": 2327.79, "total_tokens": 8927080} {"current_steps": 15480, "total_steps": 67140, "loss": 0.6868, "lr": 4.744884210173501e-05, "epoch": 2.3056300268096512, "percentage": 23.06, "elapsed_time": "1:03:56", "remaining_time": "3:33:21", "throughput": 2327.82, "total_tokens": 8929768} {"current_steps": 15485, "total_steps": 67140, "loss": 0.6709, "lr": 4.744598126768821e-05, "epoch": 2.306374739350611, "percentage": 23.06, "elapsed_time": "1:03:57", "remaining_time": "3:33:20", "throughput": 2327.97, "total_tokens": 8933224} {"current_steps": 15490, "total_steps": 67140, "loss": 0.6034, "lr": 4.744311891683325e-05, "epoch": 2.3071194518915696, "percentage": 23.07, "elapsed_time": "1:03:58", "remaining_time": "3:33:18", "throughput": 2327.96, "total_tokens": 8935656} {"current_steps": 15495, "total_steps": 67140, "loss": 0.5988, "lr": 4.7440255049363566e-05, "epoch": 2.3078641644325293, "percentage": 23.08, "elapsed_time": "1:03:59", "remaining_time": "3:33:17", "throughput": 2328.0, "total_tokens": 8938440} {"current_steps": 15500, "total_steps": 67140, "loss": 0.536, "lr": 4.7437389665472686e-05, "epoch": 2.308608876973488, "percentage": 23.09, "elapsed_time": "1:04:00", "remaining_time": "3:33:15", "throughput": 2328.06, "total_tokens": 8941288} {"current_steps": 15505, "total_steps": 67140, "loss": 0.6909, "lr": 4.7434522765354226e-05, "epoch": 2.3093535895144472, "percentage": 23.09, "elapsed_time": "1:04:01", "remaining_time": "3:33:14", "throughput": 2328.13, "total_tokens": 8944200} {"current_steps": 15510, "total_steps": 67140, "loss": 0.4623, "lr": 4.743165434920194e-05, "epoch": 2.3100983020554064, "percentage": 23.1, "elapsed_time": "1:04:02", "remaining_time": "3:33:12", "throughput": 2328.19, "total_tokens": 8947016} {"current_steps": 15515, "total_steps": 67140, "loss": 0.7148, "lr": 4.742878441720965e-05, "epoch": 2.3108430145963657, "percentage": 23.11, "elapsed_time": "1:04:04", "remaining_time": "3:33:10", "throughput": 2328.25, "total_tokens": 8949896} {"current_steps": 15520, "total_steps": 67140, "loss": 0.7236, "lr": 4.7425912969571295e-05, "epoch": 2.311587727137325, "percentage": 23.12, "elapsed_time": "1:04:05", "remaining_time": "3:33:09", "throughput": 2328.33, "total_tokens": 8952872} {"current_steps": 15525, "total_steps": 67140, "loss": 0.5895, "lr": 4.742304000648092e-05, "epoch": 2.312332439678284, "percentage": 23.12, "elapsed_time": "1:04:06", "remaining_time": "3:33:07", "throughput": 2328.37, "total_tokens": 8955656} {"current_steps": 15530, "total_steps": 67140, "loss": 0.5843, "lr": 4.742016552813267e-05, "epoch": 2.3130771522192433, "percentage": 23.13, "elapsed_time": "1:04:07", "remaining_time": "3:33:05", "throughput": 2328.42, "total_tokens": 8958440} {"current_steps": 15535, "total_steps": 67140, "loss": 0.6039, "lr": 4.7417289534720774e-05, "epoch": 2.3138218647602025, "percentage": 23.14, "elapsed_time": "1:04:08", "remaining_time": "3:33:04", "throughput": 2328.46, "total_tokens": 8961192} {"current_steps": 15540, "total_steps": 67140, "loss": 0.6144, "lr": 4.74144120264396e-05, "epoch": 2.3145665773011617, "percentage": 23.15, "elapsed_time": "1:04:09", "remaining_time": "3:33:02", "throughput": 2328.55, "total_tokens": 8964232} {"current_steps": 15545, "total_steps": 67140, "loss": 0.6628, "lr": 4.74115330034836e-05, "epoch": 2.315311289842121, "percentage": 23.15, "elapsed_time": "1:04:10", "remaining_time": "3:33:01", "throughput": 2328.59, "total_tokens": 8967016} {"current_steps": 15550, "total_steps": 67140, "loss": 0.497, "lr": 4.7408652466047313e-05, "epoch": 2.31605600238308, "percentage": 23.16, "elapsed_time": "1:04:11", "remaining_time": "3:32:59", "throughput": 2328.66, "total_tokens": 8969896} {"current_steps": 15555, "total_steps": 67140, "loss": 0.6314, "lr": 4.7405770414325404e-05, "epoch": 2.3168007149240393, "percentage": 23.17, "elapsed_time": "1:04:13", "remaining_time": "3:32:58", "throughput": 2328.78, "total_tokens": 8973160} {"current_steps": 15560, "total_steps": 67140, "loss": 0.716, "lr": 4.740288684851262e-05, "epoch": 2.3175454274649985, "percentage": 23.18, "elapsed_time": "1:04:14", "remaining_time": "3:32:56", "throughput": 2328.82, "total_tokens": 8975976} {"current_steps": 15565, "total_steps": 67140, "loss": 0.5295, "lr": 4.7400001768803826e-05, "epoch": 2.3182901400059577, "percentage": 23.18, "elapsed_time": "1:04:15", "remaining_time": "3:32:55", "throughput": 2328.89, "total_tokens": 8978920} {"current_steps": 15570, "total_steps": 67140, "loss": 0.6388, "lr": 4.739711517539398e-05, "epoch": 2.319034852546917, "percentage": 23.19, "elapsed_time": "1:04:16", "remaining_time": "3:32:53", "throughput": 2328.94, "total_tokens": 8981736} {"current_steps": 15575, "total_steps": 67140, "loss": 0.4647, "lr": 4.7394227068478157e-05, "epoch": 2.319779565087876, "percentage": 23.2, "elapsed_time": "1:04:17", "remaining_time": "3:32:51", "throughput": 2328.99, "total_tokens": 8984488} {"current_steps": 15580, "total_steps": 67140, "loss": 0.7889, "lr": 4.739133744825152e-05, "epoch": 2.3205242776288353, "percentage": 23.21, "elapsed_time": "1:04:18", "remaining_time": "3:32:50", "throughput": 2329.05, "total_tokens": 8987336} {"current_steps": 15585, "total_steps": 67140, "loss": 0.6856, "lr": 4.738844631490933e-05, "epoch": 2.3212689901697945, "percentage": 23.21, "elapsed_time": "1:04:19", "remaining_time": "3:32:48", "throughput": 2329.15, "total_tokens": 8990440} {"current_steps": 15590, "total_steps": 67140, "loss": 0.7022, "lr": 4.738555366864696e-05, "epoch": 2.3220137027107537, "percentage": 23.22, "elapsed_time": "1:04:21", "remaining_time": "3:32:47", "throughput": 2329.19, "total_tokens": 8993160} {"current_steps": 15595, "total_steps": 67140, "loss": 0.7325, "lr": 4.738265950965989e-05, "epoch": 2.322758415251713, "percentage": 23.23, "elapsed_time": "1:04:22", "remaining_time": "3:32:45", "throughput": 2329.24, "total_tokens": 8995976} {"current_steps": 15600, "total_steps": 67140, "loss": 0.5174, "lr": 4.73797638381437e-05, "epoch": 2.323503127792672, "percentage": 23.24, "elapsed_time": "1:04:23", "remaining_time": "3:32:43", "throughput": 2329.26, "total_tokens": 8998632} {"current_steps": 15605, "total_steps": 67140, "loss": 0.6998, "lr": 4.7376866654294047e-05, "epoch": 2.3242478403336313, "percentage": 23.24, "elapsed_time": "1:04:24", "remaining_time": "3:32:42", "throughput": 2329.3, "total_tokens": 9001384} {"current_steps": 15610, "total_steps": 67140, "loss": 0.5867, "lr": 4.7373967958306724e-05, "epoch": 2.3249925528745905, "percentage": 23.25, "elapsed_time": "1:04:25", "remaining_time": "3:32:40", "throughput": 2329.32, "total_tokens": 9004040} {"current_steps": 15615, "total_steps": 67140, "loss": 0.6021, "lr": 4.737106775037762e-05, "epoch": 2.3257372654155497, "percentage": 23.26, "elapsed_time": "1:04:26", "remaining_time": "3:32:38", "throughput": 2329.39, "total_tokens": 9006984} {"current_steps": 15620, "total_steps": 67140, "loss": 0.5933, "lr": 4.736816603070271e-05, "epoch": 2.326481977956509, "percentage": 23.26, "elapsed_time": "1:04:27", "remaining_time": "3:32:37", "throughput": 2329.46, "total_tokens": 9009928} {"current_steps": 15625, "total_steps": 67140, "loss": 0.6788, "lr": 4.736526279947807e-05, "epoch": 2.327226690497468, "percentage": 23.27, "elapsed_time": "1:04:28", "remaining_time": "3:32:35", "throughput": 2329.53, "total_tokens": 9012840} {"current_steps": 15630, "total_steps": 67140, "loss": 0.6332, "lr": 4.736235805689992e-05, "epoch": 2.3279714030384273, "percentage": 23.28, "elapsed_time": "1:04:30", "remaining_time": "3:32:34", "throughput": 2329.54, "total_tokens": 9015400} {"current_steps": 15635, "total_steps": 67140, "loss": 0.6234, "lr": 4.735945180316451e-05, "epoch": 2.3287161155793865, "percentage": 23.29, "elapsed_time": "1:04:31", "remaining_time": "3:32:32", "throughput": 2329.59, "total_tokens": 9018280} {"current_steps": 15640, "total_steps": 67140, "loss": 0.6512, "lr": 4.7356544038468266e-05, "epoch": 2.3294608281203457, "percentage": 23.29, "elapsed_time": "1:04:32", "remaining_time": "3:32:30", "throughput": 2329.64, "total_tokens": 9021096} {"current_steps": 15645, "total_steps": 67140, "loss": 0.7422, "lr": 4.735363476300767e-05, "epoch": 2.330205540661305, "percentage": 23.3, "elapsed_time": "1:04:33", "remaining_time": "3:32:29", "throughput": 2329.7, "total_tokens": 9023976} {"current_steps": 15650, "total_steps": 67140, "loss": 0.7901, "lr": 4.735072397697932e-05, "epoch": 2.330950253202264, "percentage": 23.31, "elapsed_time": "1:04:34", "remaining_time": "3:32:27", "throughput": 2329.78, "total_tokens": 9026920} {"current_steps": 15655, "total_steps": 67140, "loss": 0.5116, "lr": 4.734781168057991e-05, "epoch": 2.331694965743223, "percentage": 23.32, "elapsed_time": "1:04:35", "remaining_time": "3:32:26", "throughput": 2329.8, "total_tokens": 9029576} {"current_steps": 15660, "total_steps": 67140, "loss": 0.7308, "lr": 4.734489787400626e-05, "epoch": 2.3324396782841825, "percentage": 23.32, "elapsed_time": "1:04:36", "remaining_time": "3:32:24", "throughput": 2329.83, "total_tokens": 9032296} {"current_steps": 15665, "total_steps": 67140, "loss": 0.5322, "lr": 4.7341982557455245e-05, "epoch": 2.3331843908251413, "percentage": 23.33, "elapsed_time": "1:04:37", "remaining_time": "3:32:22", "throughput": 2329.9, "total_tokens": 9035272} {"current_steps": 15670, "total_steps": 67140, "loss": 0.6946, "lr": 4.733906573112389e-05, "epoch": 2.333929103366101, "percentage": 23.34, "elapsed_time": "1:04:39", "remaining_time": "3:32:21", "throughput": 2329.96, "total_tokens": 9038120} {"current_steps": 15675, "total_steps": 67140, "loss": 0.6174, "lr": 4.7336147395209294e-05, "epoch": 2.3346738159070597, "percentage": 23.35, "elapsed_time": "1:04:40", "remaining_time": "3:32:19", "throughput": 2329.99, "total_tokens": 9040840} {"current_steps": 15680, "total_steps": 67140, "loss": 0.7495, "lr": 4.733322754990867e-05, "epoch": 2.335418528448019, "percentage": 23.35, "elapsed_time": "1:04:41", "remaining_time": "3:32:18", "throughput": 2330.07, "total_tokens": 9043848} {"current_steps": 15685, "total_steps": 67140, "loss": 0.7057, "lr": 4.733030619541934e-05, "epoch": 2.336163240988978, "percentage": 23.36, "elapsed_time": "1:04:42", "remaining_time": "3:32:16", "throughput": 2330.13, "total_tokens": 9046696} {"current_steps": 15690, "total_steps": 67140, "loss": 0.6782, "lr": 4.732738333193869e-05, "epoch": 2.3369079535299373, "percentage": 23.37, "elapsed_time": "1:04:43", "remaining_time": "3:32:15", "throughput": 2330.24, "total_tokens": 9049928} {"current_steps": 15695, "total_steps": 67140, "loss": 0.4937, "lr": 4.7324458959664256e-05, "epoch": 2.3376526660708965, "percentage": 23.38, "elapsed_time": "1:04:44", "remaining_time": "3:32:13", "throughput": 2330.32, "total_tokens": 9052872} {"current_steps": 15700, "total_steps": 67140, "loss": 0.6863, "lr": 4.7321533078793655e-05, "epoch": 2.3383973786118557, "percentage": 23.38, "elapsed_time": "1:04:45", "remaining_time": "3:32:12", "throughput": 2330.35, "total_tokens": 9055624} {"current_steps": 15705, "total_steps": 67140, "loss": 0.6427, "lr": 4.73186056895246e-05, "epoch": 2.339142091152815, "percentage": 23.39, "elapsed_time": "1:04:47", "remaining_time": "3:32:10", "throughput": 2330.38, "total_tokens": 9058280} {"current_steps": 15710, "total_steps": 67140, "loss": 0.6829, "lr": 4.731567679205491e-05, "epoch": 2.339886803693774, "percentage": 23.4, "elapsed_time": "1:04:48", "remaining_time": "3:32:08", "throughput": 2330.41, "total_tokens": 9061000} {"current_steps": 15715, "total_steps": 67140, "loss": 0.637, "lr": 4.731274638658251e-05, "epoch": 2.3406315162347333, "percentage": 23.41, "elapsed_time": "1:04:49", "remaining_time": "3:32:07", "throughput": 2330.54, "total_tokens": 9064296} {"current_steps": 15720, "total_steps": 67140, "loss": 0.6205, "lr": 4.7309814473305427e-05, "epoch": 2.3413762287756925, "percentage": 23.41, "elapsed_time": "1:04:50", "remaining_time": "3:32:05", "throughput": 2330.54, "total_tokens": 9066856} {"current_steps": 15725, "total_steps": 67140, "loss": 0.4434, "lr": 4.730688105242179e-05, "epoch": 2.3421209413166517, "percentage": 23.42, "elapsed_time": "1:04:51", "remaining_time": "3:32:04", "throughput": 2330.61, "total_tokens": 9069800} {"current_steps": 15730, "total_steps": 67140, "loss": 0.6757, "lr": 4.7303946124129824e-05, "epoch": 2.342865653857611, "percentage": 23.43, "elapsed_time": "1:04:52", "remaining_time": "3:32:02", "throughput": 2330.69, "total_tokens": 9072744} {"current_steps": 15735, "total_steps": 67140, "loss": 0.4556, "lr": 4.730100968862786e-05, "epoch": 2.34361036639857, "percentage": 23.44, "elapsed_time": "1:04:53", "remaining_time": "3:32:00", "throughput": 2330.73, "total_tokens": 9075528} {"current_steps": 15740, "total_steps": 67140, "loss": 0.6437, "lr": 4.7298071746114326e-05, "epoch": 2.3443550789395293, "percentage": 23.44, "elapsed_time": "1:04:54", "remaining_time": "3:31:59", "throughput": 2330.76, "total_tokens": 9078248} {"current_steps": 15745, "total_steps": 67140, "loss": 0.738, "lr": 4.729513229678776e-05, "epoch": 2.3450997914804885, "percentage": 23.45, "elapsed_time": "1:04:56", "remaining_time": "3:31:57", "throughput": 2330.82, "total_tokens": 9081096} {"current_steps": 15750, "total_steps": 67140, "loss": 0.7975, "lr": 4.7292191340846806e-05, "epoch": 2.3458445040214477, "percentage": 23.46, "elapsed_time": "1:04:57", "remaining_time": "3:31:55", "throughput": 2330.84, "total_tokens": 9083688} {"current_steps": 15755, "total_steps": 67140, "loss": 0.5962, "lr": 4.728924887849019e-05, "epoch": 2.346589216562407, "percentage": 23.47, "elapsed_time": "1:04:58", "remaining_time": "3:31:54", "throughput": 2330.85, "total_tokens": 9086312} {"current_steps": 15760, "total_steps": 67140, "loss": 0.7043, "lr": 4.728630490991676e-05, "epoch": 2.347333929103366, "percentage": 23.47, "elapsed_time": "1:04:59", "remaining_time": "3:31:52", "throughput": 2330.89, "total_tokens": 9089032} {"current_steps": 15765, "total_steps": 67140, "loss": 0.5669, "lr": 4.728335943532545e-05, "epoch": 2.3480786416443253, "percentage": 23.48, "elapsed_time": "1:05:00", "remaining_time": "3:31:50", "throughput": 2330.94, "total_tokens": 9091816} {"current_steps": 15770, "total_steps": 67140, "loss": 0.5852, "lr": 4.7280412454915316e-05, "epoch": 2.3488233541852845, "percentage": 23.49, "elapsed_time": "1:05:01", "remaining_time": "3:31:49", "throughput": 2331.04, "total_tokens": 9094920} {"current_steps": 15775, "total_steps": 67140, "loss": 0.6816, "lr": 4.727746396888548e-05, "epoch": 2.3495680667262437, "percentage": 23.5, "elapsed_time": "1:05:02", "remaining_time": "3:31:47", "throughput": 2331.12, "total_tokens": 9097960} {"current_steps": 15780, "total_steps": 67140, "loss": 0.5656, "lr": 4.7274513977435206e-05, "epoch": 2.350312779267203, "percentage": 23.5, "elapsed_time": "1:05:03", "remaining_time": "3:31:46", "throughput": 2331.18, "total_tokens": 9100872} {"current_steps": 15785, "total_steps": 67140, "loss": 0.7515, "lr": 4.7271562480763845e-05, "epoch": 2.351057491808162, "percentage": 23.51, "elapsed_time": "1:05:05", "remaining_time": "3:31:44", "throughput": 2331.23, "total_tokens": 9103720} {"current_steps": 15790, "total_steps": 67140, "loss": 0.6664, "lr": 4.726860947907084e-05, "epoch": 2.3518022043491214, "percentage": 23.52, "elapsed_time": "1:05:06", "remaining_time": "3:31:43", "throughput": 2331.3, "total_tokens": 9106632} {"current_steps": 15795, "total_steps": 67140, "loss": 0.7674, "lr": 4.726565497255575e-05, "epoch": 2.3525469168900806, "percentage": 23.53, "elapsed_time": "1:05:07", "remaining_time": "3:31:41", "throughput": 2331.4, "total_tokens": 9109800} {"current_steps": 15800, "total_steps": 67140, "loss": 0.627, "lr": 4.7262698961418206e-05, "epoch": 2.3532916294310398, "percentage": 23.53, "elapsed_time": "1:05:08", "remaining_time": "3:31:40", "throughput": 2331.43, "total_tokens": 9112456} {"current_steps": 15805, "total_steps": 67140, "loss": 0.6859, "lr": 4.7259741445857994e-05, "epoch": 2.354036341971999, "percentage": 23.54, "elapsed_time": "1:05:09", "remaining_time": "3:31:38", "throughput": 2331.52, "total_tokens": 9115528} {"current_steps": 15810, "total_steps": 67140, "loss": 0.6104, "lr": 4.7256782426074956e-05, "epoch": 2.354781054512958, "percentage": 23.55, "elapsed_time": "1:05:10", "remaining_time": "3:31:37", "throughput": 2331.56, "total_tokens": 9118344} {"current_steps": 15815, "total_steps": 67140, "loss": 0.6918, "lr": 4.725382190226904e-05, "epoch": 2.3555257670539174, "percentage": 23.56, "elapsed_time": "1:05:11", "remaining_time": "3:31:35", "throughput": 2331.62, "total_tokens": 9121224} {"current_steps": 15820, "total_steps": 67140, "loss": 0.7255, "lr": 4.725085987464032e-05, "epoch": 2.3562704795948766, "percentage": 23.56, "elapsed_time": "1:05:13", "remaining_time": "3:31:33", "throughput": 2331.66, "total_tokens": 9123912} {"current_steps": 15825, "total_steps": 67140, "loss": 0.593, "lr": 4.724789634338897e-05, "epoch": 2.3570151921358358, "percentage": 23.57, "elapsed_time": "1:05:14", "remaining_time": "3:31:32", "throughput": 2331.69, "total_tokens": 9126600} {"current_steps": 15830, "total_steps": 67140, "loss": 0.6888, "lr": 4.7244931308715215e-05, "epoch": 2.3577599046767945, "percentage": 23.58, "elapsed_time": "1:05:15", "remaining_time": "3:31:30", "throughput": 2331.74, "total_tokens": 9129384} {"current_steps": 15835, "total_steps": 67140, "loss": 0.6373, "lr": 4.724196477081946e-05, "epoch": 2.358504617217754, "percentage": 23.59, "elapsed_time": "1:05:16", "remaining_time": "3:31:29", "throughput": 2331.79, "total_tokens": 9132264} {"current_steps": 15840, "total_steps": 67140, "loss": 0.7751, "lr": 4.723899672990215e-05, "epoch": 2.359249329758713, "percentage": 23.59, "elapsed_time": "1:05:17", "remaining_time": "3:31:27", "throughput": 2331.8, "total_tokens": 9134856} {"current_steps": 15845, "total_steps": 67140, "loss": 0.7213, "lr": 4.7236027186163856e-05, "epoch": 2.359994042299672, "percentage": 23.6, "elapsed_time": "1:05:18", "remaining_time": "3:31:25", "throughput": 2331.87, "total_tokens": 9137768} {"current_steps": 15850, "total_steps": 67140, "loss": 0.5763, "lr": 4.7233056139805254e-05, "epoch": 2.3607387548406313, "percentage": 23.61, "elapsed_time": "1:05:19", "remaining_time": "3:31:24", "throughput": 2331.89, "total_tokens": 9140456} {"current_steps": 15855, "total_steps": 67140, "loss": 0.6519, "lr": 4.7230083591027106e-05, "epoch": 2.3614834673815905, "percentage": 23.61, "elapsed_time": "1:05:20", "remaining_time": "3:31:22", "throughput": 2331.98, "total_tokens": 9143496} {"current_steps": 15860, "total_steps": 67140, "loss": 0.6502, "lr": 4.72271095400303e-05, "epoch": 2.3622281799225497, "percentage": 23.62, "elapsed_time": "1:05:22", "remaining_time": "3:31:21", "throughput": 2332.03, "total_tokens": 9146312} {"current_steps": 15865, "total_steps": 67140, "loss": 0.6142, "lr": 4.722413398701579e-05, "epoch": 2.362972892463509, "percentage": 23.63, "elapsed_time": "1:05:23", "remaining_time": "3:31:19", "throughput": 2332.08, "total_tokens": 9149128} {"current_steps": 15870, "total_steps": 67140, "loss": 0.5728, "lr": 4.722115693218467e-05, "epoch": 2.363717605004468, "percentage": 23.64, "elapsed_time": "1:05:24", "remaining_time": "3:31:17", "throughput": 2332.11, "total_tokens": 9151752} {"current_steps": 15875, "total_steps": 67140, "loss": 0.4645, "lr": 4.72181783757381e-05, "epoch": 2.3644623175454274, "percentage": 23.64, "elapsed_time": "1:05:25", "remaining_time": "3:31:16", "throughput": 2332.13, "total_tokens": 9154408} {"current_steps": 15880, "total_steps": 67140, "loss": 0.7561, "lr": 4.721519831787737e-05, "epoch": 2.3652070300863866, "percentage": 23.65, "elapsed_time": "1:05:26", "remaining_time": "3:31:14", "throughput": 2332.26, "total_tokens": 9157736} {"current_steps": 15885, "total_steps": 67140, "loss": 0.5301, "lr": 4.721221675880386e-05, "epoch": 2.3659517426273458, "percentage": 23.66, "elapsed_time": "1:05:27", "remaining_time": "3:31:13", "throughput": 2332.31, "total_tokens": 9160552} {"current_steps": 15890, "total_steps": 67140, "loss": 0.79, "lr": 4.7209233698719056e-05, "epoch": 2.366696455168305, "percentage": 23.67, "elapsed_time": "1:05:28", "remaining_time": "3:31:11", "throughput": 2332.34, "total_tokens": 9163272} {"current_steps": 15895, "total_steps": 67140, "loss": 0.5385, "lr": 4.7206249137824535e-05, "epoch": 2.367441167709264, "percentage": 23.67, "elapsed_time": "1:05:29", "remaining_time": "3:31:09", "throughput": 2332.39, "total_tokens": 9166120} {"current_steps": 15900, "total_steps": 67140, "loss": 0.5647, "lr": 4.7203263076321966e-05, "epoch": 2.3681858802502234, "percentage": 23.68, "elapsed_time": "1:05:31", "remaining_time": "3:31:08", "throughput": 2332.45, "total_tokens": 9168968} {"current_steps": 15905, "total_steps": 67140, "loss": 0.7143, "lr": 4.720027551441316e-05, "epoch": 2.3689305927911826, "percentage": 23.69, "elapsed_time": "1:05:32", "remaining_time": "3:31:06", "throughput": 2332.5, "total_tokens": 9171816} {"current_steps": 15910, "total_steps": 67140, "loss": 0.7564, "lr": 4.719728645229999e-05, "epoch": 2.3696753053321418, "percentage": 23.7, "elapsed_time": "1:05:33", "remaining_time": "3:31:05", "throughput": 2332.57, "total_tokens": 9174728} {"current_steps": 15915, "total_steps": 67140, "loss": 0.6057, "lr": 4.719429589018446e-05, "epoch": 2.370420017873101, "percentage": 23.7, "elapsed_time": "1:05:34", "remaining_time": "3:31:03", "throughput": 2332.62, "total_tokens": 9177544} {"current_steps": 15920, "total_steps": 67140, "loss": 0.7375, "lr": 4.719130382826864e-05, "epoch": 2.37116473041406, "percentage": 23.71, "elapsed_time": "1:05:35", "remaining_time": "3:31:01", "throughput": 2332.65, "total_tokens": 9180232} {"current_steps": 15925, "total_steps": 67140, "loss": 0.6009, "lr": 4.718831026675473e-05, "epoch": 2.3719094429550194, "percentage": 23.72, "elapsed_time": "1:05:36", "remaining_time": "3:31:00", "throughput": 2332.7, "total_tokens": 9183048} {"current_steps": 15930, "total_steps": 67140, "loss": 0.5839, "lr": 4.718531520584503e-05, "epoch": 2.3726541554959786, "percentage": 23.73, "elapsed_time": "1:05:37", "remaining_time": "3:30:58", "throughput": 2332.74, "total_tokens": 9185800} {"current_steps": 15935, "total_steps": 67140, "loss": 0.5769, "lr": 4.718231864574193e-05, "epoch": 2.373398868036938, "percentage": 23.73, "elapsed_time": "1:05:38", "remaining_time": "3:30:57", "throughput": 2332.84, "total_tokens": 9188904} {"current_steps": 15940, "total_steps": 67140, "loss": 0.5684, "lr": 4.717932058664791e-05, "epoch": 2.374143580577897, "percentage": 23.74, "elapsed_time": "1:05:40", "remaining_time": "3:30:55", "throughput": 2332.89, "total_tokens": 9191784} {"current_steps": 15945, "total_steps": 67140, "loss": 0.7242, "lr": 4.717632102876559e-05, "epoch": 2.374888293118856, "percentage": 23.75, "elapsed_time": "1:05:41", "remaining_time": "3:30:54", "throughput": 2332.96, "total_tokens": 9194728} {"current_steps": 15950, "total_steps": 67140, "loss": 0.6656, "lr": 4.717331997229765e-05, "epoch": 2.3756330056598154, "percentage": 23.76, "elapsed_time": "1:05:42", "remaining_time": "3:30:52", "throughput": 2332.99, "total_tokens": 9197416} {"current_steps": 15955, "total_steps": 67140, "loss": 0.6691, "lr": 4.71703174174469e-05, "epoch": 2.3763777182007746, "percentage": 23.76, "elapsed_time": "1:05:43", "remaining_time": "3:30:51", "throughput": 2333.1, "total_tokens": 9200648} {"current_steps": 15960, "total_steps": 67140, "loss": 0.7578, "lr": 4.7167313364416234e-05, "epoch": 2.377122430741734, "percentage": 23.77, "elapsed_time": "1:05:44", "remaining_time": "3:30:49", "throughput": 2333.15, "total_tokens": 9203464} {"current_steps": 15965, "total_steps": 67140, "loss": 0.6145, "lr": 4.716430781340866e-05, "epoch": 2.377867143282693, "percentage": 23.78, "elapsed_time": "1:05:45", "remaining_time": "3:30:47", "throughput": 2333.19, "total_tokens": 9206216} {"current_steps": 15970, "total_steps": 67140, "loss": 0.6325, "lr": 4.716130076462728e-05, "epoch": 2.378611855823652, "percentage": 23.79, "elapsed_time": "1:05:46", "remaining_time": "3:30:46", "throughput": 2333.21, "total_tokens": 9208840} {"current_steps": 15975, "total_steps": 67140, "loss": 0.6818, "lr": 4.715829221827529e-05, "epoch": 2.3793565683646114, "percentage": 23.79, "elapsed_time": "1:05:48", "remaining_time": "3:30:44", "throughput": 2333.31, "total_tokens": 9212008} {"current_steps": 15980, "total_steps": 67140, "loss": 0.5968, "lr": 4.7155282174556004e-05, "epoch": 2.3801012809055706, "percentage": 23.8, "elapsed_time": "1:05:49", "remaining_time": "3:30:43", "throughput": 2333.37, "total_tokens": 9214920} {"current_steps": 15985, "total_steps": 67140, "loss": 0.6254, "lr": 4.7152270633672826e-05, "epoch": 2.38084599344653, "percentage": 23.81, "elapsed_time": "1:05:50", "remaining_time": "3:30:41", "throughput": 2333.42, "total_tokens": 9217768} {"current_steps": 15990, "total_steps": 67140, "loss": 0.7284, "lr": 4.7149257595829255e-05, "epoch": 2.381590705987489, "percentage": 23.82, "elapsed_time": "1:05:51", "remaining_time": "3:30:40", "throughput": 2333.45, "total_tokens": 9220488} {"current_steps": 15995, "total_steps": 67140, "loss": 0.6976, "lr": 4.714624306122892e-05, "epoch": 2.382335418528448, "percentage": 23.82, "elapsed_time": "1:05:52", "remaining_time": "3:30:38", "throughput": 2333.5, "total_tokens": 9223304} {"current_steps": 16000, "total_steps": 67140, "loss": 0.6649, "lr": 4.714322703007551e-05, "epoch": 2.3830801310694074, "percentage": 23.83, "elapsed_time": "1:05:53", "remaining_time": "3:30:37", "throughput": 2333.58, "total_tokens": 9226280} {"current_steps": 16005, "total_steps": 67140, "loss": 0.6898, "lr": 4.7140209502572855e-05, "epoch": 2.383824843610366, "percentage": 23.84, "elapsed_time": "1:05:54", "remaining_time": "3:30:35", "throughput": 2333.64, "total_tokens": 9229096} {"current_steps": 16010, "total_steps": 67140, "loss": 0.5268, "lr": 4.713719047892484e-05, "epoch": 2.384569556151326, "percentage": 23.85, "elapsed_time": "1:05:55", "remaining_time": "3:30:33", "throughput": 2333.7, "total_tokens": 9232008} {"current_steps": 16015, "total_steps": 67140, "loss": 0.659, "lr": 4.713416995933551e-05, "epoch": 2.3853142686922846, "percentage": 23.85, "elapsed_time": "1:05:57", "remaining_time": "3:30:32", "throughput": 2333.78, "total_tokens": 9235080} {"current_steps": 16020, "total_steps": 67140, "loss": 0.6796, "lr": 4.7131147944008965e-05, "epoch": 2.386058981233244, "percentage": 23.86, "elapsed_time": "1:05:58", "remaining_time": "3:30:30", "throughput": 2333.85, "total_tokens": 9238056} {"current_steps": 16025, "total_steps": 67140, "loss": 0.7453, "lr": 4.712812443314941e-05, "epoch": 2.386803693774203, "percentage": 23.87, "elapsed_time": "1:05:59", "remaining_time": "3:30:29", "throughput": 2333.96, "total_tokens": 9241192} {"current_steps": 16030, "total_steps": 67140, "loss": 0.7899, "lr": 4.7125099426961185e-05, "epoch": 2.387548406315162, "percentage": 23.88, "elapsed_time": "1:06:00", "remaining_time": "3:30:27", "throughput": 2333.98, "total_tokens": 9243848} {"current_steps": 16035, "total_steps": 67140, "loss": 0.6738, "lr": 4.712207292564869e-05, "epoch": 2.3882931188561214, "percentage": 23.88, "elapsed_time": "1:06:01", "remaining_time": "3:30:26", "throughput": 2334.05, "total_tokens": 9246728} {"current_steps": 16040, "total_steps": 67140, "loss": 0.5364, "lr": 4.7119044929416443e-05, "epoch": 2.3890378313970806, "percentage": 23.89, "elapsed_time": "1:06:02", "remaining_time": "3:30:24", "throughput": 2334.12, "total_tokens": 9249672} {"current_steps": 16045, "total_steps": 67140, "loss": 0.7619, "lr": 4.7116015438469074e-05, "epoch": 2.38978254393804, "percentage": 23.9, "elapsed_time": "1:06:03", "remaining_time": "3:30:23", "throughput": 2334.16, "total_tokens": 9252456} {"current_steps": 16050, "total_steps": 67140, "loss": 0.7557, "lr": 4.7112984453011297e-05, "epoch": 2.390527256478999, "percentage": 23.91, "elapsed_time": "1:06:05", "remaining_time": "3:30:21", "throughput": 2334.23, "total_tokens": 9255432} {"current_steps": 16055, "total_steps": 67140, "loss": 0.802, "lr": 4.7109951973247945e-05, "epoch": 2.391271969019958, "percentage": 23.91, "elapsed_time": "1:06:06", "remaining_time": "3:30:19", "throughput": 2334.3, "total_tokens": 9258344} {"current_steps": 16060, "total_steps": 67140, "loss": 0.6247, "lr": 4.7106917999383926e-05, "epoch": 2.3920166815609174, "percentage": 23.92, "elapsed_time": "1:06:07", "remaining_time": "3:30:18", "throughput": 2334.39, "total_tokens": 9261416} {"current_steps": 16065, "total_steps": 67140, "loss": 0.6963, "lr": 4.710388253162426e-05, "epoch": 2.3927613941018766, "percentage": 23.93, "elapsed_time": "1:06:08", "remaining_time": "3:30:16", "throughput": 2334.44, "total_tokens": 9264264} {"current_steps": 16070, "total_steps": 67140, "loss": 0.7161, "lr": 4.710084557017409e-05, "epoch": 2.393506106642836, "percentage": 23.94, "elapsed_time": "1:06:09", "remaining_time": "3:30:15", "throughput": 2334.55, "total_tokens": 9267400} {"current_steps": 16075, "total_steps": 67140, "loss": 0.7723, "lr": 4.709780711523862e-05, "epoch": 2.394250819183795, "percentage": 23.94, "elapsed_time": "1:06:10", "remaining_time": "3:30:13", "throughput": 2334.59, "total_tokens": 9270184} {"current_steps": 16080, "total_steps": 67140, "loss": 0.6041, "lr": 4.70947671670232e-05, "epoch": 2.394995531724754, "percentage": 23.95, "elapsed_time": "1:06:11", "remaining_time": "3:30:12", "throughput": 2334.61, "total_tokens": 9272776} {"current_steps": 16085, "total_steps": 67140, "loss": 0.637, "lr": 4.709172572573325e-05, "epoch": 2.3957402442657134, "percentage": 23.96, "elapsed_time": "1:06:13", "remaining_time": "3:30:10", "throughput": 2334.68, "total_tokens": 9275816} {"current_steps": 16090, "total_steps": 67140, "loss": 0.7169, "lr": 4.708868279157428e-05, "epoch": 2.3964849568066726, "percentage": 23.96, "elapsed_time": "1:06:14", "remaining_time": "3:30:09", "throughput": 2334.74, "total_tokens": 9278696} {"current_steps": 16095, "total_steps": 67140, "loss": 0.6547, "lr": 4.7085638364751936e-05, "epoch": 2.397229669347632, "percentage": 23.97, "elapsed_time": "1:06:15", "remaining_time": "3:30:07", "throughput": 2334.81, "total_tokens": 9281672} {"current_steps": 16100, "total_steps": 67140, "loss": 0.6404, "lr": 4.7082592445471954e-05, "epoch": 2.397974381888591, "percentage": 23.98, "elapsed_time": "1:06:16", "remaining_time": "3:30:06", "throughput": 2334.87, "total_tokens": 9284552} {"current_steps": 16105, "total_steps": 67140, "loss": 0.5996, "lr": 4.7079545033940155e-05, "epoch": 2.3987190944295502, "percentage": 23.99, "elapsed_time": "1:06:17", "remaining_time": "3:30:04", "throughput": 2334.93, "total_tokens": 9287368} {"current_steps": 16110, "total_steps": 67140, "loss": 0.4573, "lr": 4.7076496130362455e-05, "epoch": 2.3994638069705094, "percentage": 23.99, "elapsed_time": "1:06:18", "remaining_time": "3:30:03", "throughput": 2335.01, "total_tokens": 9290376} {"current_steps": 16115, "total_steps": 67140, "loss": 0.6271, "lr": 4.707344573494492e-05, "epoch": 2.4002085195114686, "percentage": 24.0, "elapsed_time": "1:06:19", "remaining_time": "3:30:01", "throughput": 2335.02, "total_tokens": 9292968} {"current_steps": 16120, "total_steps": 67140, "loss": 0.5716, "lr": 4.7070393847893665e-05, "epoch": 2.400953232052428, "percentage": 24.01, "elapsed_time": "1:06:20", "remaining_time": "3:29:59", "throughput": 2335.09, "total_tokens": 9295944} {"current_steps": 16125, "total_steps": 67140, "loss": 0.5557, "lr": 4.706734046941492e-05, "epoch": 2.401697944593387, "percentage": 24.02, "elapsed_time": "1:06:22", "remaining_time": "3:29:58", "throughput": 2335.11, "total_tokens": 9298568} {"current_steps": 16130, "total_steps": 67140, "loss": 0.6254, "lr": 4.706428559971502e-05, "epoch": 2.4024426571343462, "percentage": 24.02, "elapsed_time": "1:06:23", "remaining_time": "3:29:56", "throughput": 2335.19, "total_tokens": 9301576} {"current_steps": 16135, "total_steps": 67140, "loss": 0.7572, "lr": 4.706122923900042e-05, "epoch": 2.4031873696753054, "percentage": 24.03, "elapsed_time": "1:06:24", "remaining_time": "3:29:55", "throughput": 2335.28, "total_tokens": 9304648} {"current_steps": 16140, "total_steps": 67140, "loss": 0.6123, "lr": 4.705817138747763e-05, "epoch": 2.4039320822162646, "percentage": 24.04, "elapsed_time": "1:06:25", "remaining_time": "3:29:53", "throughput": 2335.32, "total_tokens": 9307400} {"current_steps": 16145, "total_steps": 67140, "loss": 0.7844, "lr": 4.7055112045353304e-05, "epoch": 2.404676794757224, "percentage": 24.05, "elapsed_time": "1:06:26", "remaining_time": "3:29:51", "throughput": 2335.34, "total_tokens": 9310120} {"current_steps": 16150, "total_steps": 67140, "loss": 0.7551, "lr": 4.705205121283418e-05, "epoch": 2.405421507298183, "percentage": 24.05, "elapsed_time": "1:06:27", "remaining_time": "3:29:50", "throughput": 2335.38, "total_tokens": 9312872} {"current_steps": 16155, "total_steps": 67140, "loss": 0.7554, "lr": 4.704898889012709e-05, "epoch": 2.4061662198391423, "percentage": 24.06, "elapsed_time": "1:06:28", "remaining_time": "3:29:48", "throughput": 2335.44, "total_tokens": 9315752} {"current_steps": 16160, "total_steps": 67140, "loss": 0.6319, "lr": 4.704592507743897e-05, "epoch": 2.4069109323801015, "percentage": 24.07, "elapsed_time": "1:06:30", "remaining_time": "3:29:47", "throughput": 2335.51, "total_tokens": 9318696} {"current_steps": 16165, "total_steps": 67140, "loss": 0.5974, "lr": 4.704285977497687e-05, "epoch": 2.4076556449210607, "percentage": 24.08, "elapsed_time": "1:06:31", "remaining_time": "3:29:45", "throughput": 2335.52, "total_tokens": 9321288} {"current_steps": 16170, "total_steps": 67140, "loss": 0.6822, "lr": 4.703979298294793e-05, "epoch": 2.4084003574620194, "percentage": 24.08, "elapsed_time": "1:06:32", "remaining_time": "3:29:43", "throughput": 2335.53, "total_tokens": 9323848} {"current_steps": 16175, "total_steps": 67140, "loss": 0.594, "lr": 4.703672470155938e-05, "epoch": 2.409145070002979, "percentage": 24.09, "elapsed_time": "1:06:33", "remaining_time": "3:29:42", "throughput": 2335.61, "total_tokens": 9326856} {"current_steps": 16180, "total_steps": 67140, "loss": 0.5766, "lr": 4.703365493101857e-05, "epoch": 2.409889782543938, "percentage": 24.1, "elapsed_time": "1:06:34", "remaining_time": "3:29:40", "throughput": 2335.67, "total_tokens": 9329832} {"current_steps": 16185, "total_steps": 67140, "loss": 0.7202, "lr": 4.703058367153295e-05, "epoch": 2.4106344950848975, "percentage": 24.11, "elapsed_time": "1:06:35", "remaining_time": "3:29:39", "throughput": 2335.71, "total_tokens": 9332616} {"current_steps": 16190, "total_steps": 67140, "loss": 0.8387, "lr": 4.702751092331005e-05, "epoch": 2.4113792076258562, "percentage": 24.11, "elapsed_time": "1:06:36", "remaining_time": "3:29:37", "throughput": 2335.84, "total_tokens": 9335848} {"current_steps": 16195, "total_steps": 67140, "loss": 0.5721, "lr": 4.7024436686557516e-05, "epoch": 2.4121239201668154, "percentage": 24.12, "elapsed_time": "1:06:38", "remaining_time": "3:29:36", "throughput": 2335.96, "total_tokens": 9339176} {"current_steps": 16200, "total_steps": 67140, "loss": 0.6606, "lr": 4.70213609614831e-05, "epoch": 2.4128686327077746, "percentage": 24.13, "elapsed_time": "1:06:39", "remaining_time": "3:29:35", "throughput": 2336.02, "total_tokens": 9342088} {"current_steps": 16205, "total_steps": 67140, "loss": 0.5962, "lr": 4.701828374829464e-05, "epoch": 2.413613345248734, "percentage": 24.14, "elapsed_time": "1:06:40", "remaining_time": "3:29:33", "throughput": 2336.07, "total_tokens": 9344904} {"current_steps": 16210, "total_steps": 67140, "loss": 0.6763, "lr": 4.701520504720008e-05, "epoch": 2.414358057789693, "percentage": 24.14, "elapsed_time": "1:06:41", "remaining_time": "3:29:31", "throughput": 2336.09, "total_tokens": 9347592} {"current_steps": 16215, "total_steps": 67140, "loss": 0.7252, "lr": 4.701212485840748e-05, "epoch": 2.4151027703306522, "percentage": 24.15, "elapsed_time": "1:06:42", "remaining_time": "3:29:30", "throughput": 2336.15, "total_tokens": 9350504} {"current_steps": 16220, "total_steps": 67140, "loss": 0.8201, "lr": 4.7009043182124966e-05, "epoch": 2.4158474828716114, "percentage": 24.16, "elapsed_time": "1:06:43", "remaining_time": "3:29:28", "throughput": 2336.24, "total_tokens": 9353608} {"current_steps": 16225, "total_steps": 67140, "loss": 0.5818, "lr": 4.700596001856081e-05, "epoch": 2.4165921954125706, "percentage": 24.17, "elapsed_time": "1:06:44", "remaining_time": "3:29:27", "throughput": 2336.34, "total_tokens": 9356712} {"current_steps": 16230, "total_steps": 67140, "loss": 0.527, "lr": 4.700287536792334e-05, "epoch": 2.41733690795353, "percentage": 24.17, "elapsed_time": "1:06:45", "remaining_time": "3:29:25", "throughput": 2336.39, "total_tokens": 9359560} {"current_steps": 16235, "total_steps": 67140, "loss": 0.5363, "lr": 4.6999789230421e-05, "epoch": 2.418081620494489, "percentage": 24.18, "elapsed_time": "1:06:47", "remaining_time": "3:29:24", "throughput": 2336.43, "total_tokens": 9362376} {"current_steps": 16240, "total_steps": 67140, "loss": 0.6115, "lr": 4.699670160626236e-05, "epoch": 2.4188263330354483, "percentage": 24.19, "elapsed_time": "1:06:48", "remaining_time": "3:29:22", "throughput": 2336.49, "total_tokens": 9365224} {"current_steps": 16245, "total_steps": 67140, "loss": 0.7919, "lr": 4.699361249565605e-05, "epoch": 2.4195710455764075, "percentage": 24.2, "elapsed_time": "1:06:49", "remaining_time": "3:29:21", "throughput": 2336.55, "total_tokens": 9368168} {"current_steps": 16250, "total_steps": 67140, "loss": 0.7095, "lr": 4.699052189881083e-05, "epoch": 2.4203157581173667, "percentage": 24.2, "elapsed_time": "1:06:50", "remaining_time": "3:29:19", "throughput": 2336.63, "total_tokens": 9371176} {"current_steps": 16255, "total_steps": 67140, "loss": 0.8311, "lr": 4.698742981593555e-05, "epoch": 2.421060470658326, "percentage": 24.21, "elapsed_time": "1:06:51", "remaining_time": "3:29:18", "throughput": 2336.71, "total_tokens": 9374216} {"current_steps": 16260, "total_steps": 67140, "loss": 0.6825, "lr": 4.6984336247239155e-05, "epoch": 2.421805183199285, "percentage": 24.22, "elapsed_time": "1:06:52", "remaining_time": "3:29:16", "throughput": 2336.78, "total_tokens": 9377192} {"current_steps": 16265, "total_steps": 67140, "loss": 0.5187, "lr": 4.69812411929307e-05, "epoch": 2.4225498957402443, "percentage": 24.23, "elapsed_time": "1:06:54", "remaining_time": "3:29:15", "throughput": 2336.86, "total_tokens": 9380200} {"current_steps": 16270, "total_steps": 67140, "loss": 0.7287, "lr": 4.697814465321934e-05, "epoch": 2.4232946082812035, "percentage": 24.23, "elapsed_time": "1:06:55", "remaining_time": "3:29:13", "throughput": 2336.9, "total_tokens": 9382984} {"current_steps": 16275, "total_steps": 67140, "loss": 0.7034, "lr": 4.6975046628314304e-05, "epoch": 2.4240393208221627, "percentage": 24.24, "elapsed_time": "1:06:56", "remaining_time": "3:29:12", "throughput": 2336.9, "total_tokens": 9385512} {"current_steps": 16280, "total_steps": 67140, "loss": 0.5689, "lr": 4.6971947118424976e-05, "epoch": 2.424784033363122, "percentage": 24.25, "elapsed_time": "1:06:57", "remaining_time": "3:29:10", "throughput": 2336.97, "total_tokens": 9388520} {"current_steps": 16285, "total_steps": 67140, "loss": 0.6719, "lr": 4.6968846123760786e-05, "epoch": 2.425528745904081, "percentage": 24.26, "elapsed_time": "1:06:58", "remaining_time": "3:29:09", "throughput": 2337.02, "total_tokens": 9391304} {"current_steps": 16290, "total_steps": 67140, "loss": 0.6549, "lr": 4.696574364453129e-05, "epoch": 2.4262734584450403, "percentage": 24.26, "elapsed_time": "1:06:59", "remaining_time": "3:29:07", "throughput": 2337.03, "total_tokens": 9393928} {"current_steps": 16295, "total_steps": 67140, "loss": 0.5851, "lr": 4.6962639680946154e-05, "epoch": 2.4270181709859995, "percentage": 24.27, "elapsed_time": "1:07:00", "remaining_time": "3:29:05", "throughput": 2337.06, "total_tokens": 9396680} {"current_steps": 16300, "total_steps": 67140, "loss": 0.7873, "lr": 4.6959534233215116e-05, "epoch": 2.4277628835269587, "percentage": 24.28, "elapsed_time": "1:07:01", "remaining_time": "3:29:04", "throughput": 2337.15, "total_tokens": 9399752} {"current_steps": 16305, "total_steps": 67140, "loss": 0.7077, "lr": 4.695642730154804e-05, "epoch": 2.428507596067918, "percentage": 24.29, "elapsed_time": "1:07:03", "remaining_time": "3:29:02", "throughput": 2337.19, "total_tokens": 9402536} {"current_steps": 16310, "total_steps": 67140, "loss": 0.5828, "lr": 4.695331888615487e-05, "epoch": 2.429252308608877, "percentage": 24.29, "elapsed_time": "1:07:04", "remaining_time": "3:29:01", "throughput": 2337.25, "total_tokens": 9405416} {"current_steps": 16315, "total_steps": 67140, "loss": 0.8286, "lr": 4.695020898724567e-05, "epoch": 2.4299970211498363, "percentage": 24.3, "elapsed_time": "1:07:05", "remaining_time": "3:28:59", "throughput": 2337.32, "total_tokens": 9408360} {"current_steps": 16320, "total_steps": 67140, "loss": 0.657, "lr": 4.694709760503059e-05, "epoch": 2.4307417336907955, "percentage": 24.31, "elapsed_time": "1:07:06", "remaining_time": "3:28:58", "throughput": 2337.4, "total_tokens": 9411432} {"current_steps": 16325, "total_steps": 67140, "loss": 0.7228, "lr": 4.694398473971988e-05, "epoch": 2.4314864462317547, "percentage": 24.31, "elapsed_time": "1:07:07", "remaining_time": "3:28:56", "throughput": 2337.46, "total_tokens": 9414312} {"current_steps": 16330, "total_steps": 67140, "loss": 0.8601, "lr": 4.6940870391523905e-05, "epoch": 2.432231158772714, "percentage": 24.32, "elapsed_time": "1:07:08", "remaining_time": "3:28:55", "throughput": 2337.48, "total_tokens": 9416968} {"current_steps": 16335, "total_steps": 67140, "loss": 0.7202, "lr": 4.693775456065311e-05, "epoch": 2.432975871313673, "percentage": 24.33, "elapsed_time": "1:07:09", "remaining_time": "3:28:53", "throughput": 2337.51, "total_tokens": 9419688} {"current_steps": 16340, "total_steps": 67140, "loss": 0.6757, "lr": 4.693463724731805e-05, "epoch": 2.4337205838546323, "percentage": 24.34, "elapsed_time": "1:07:10", "remaining_time": "3:28:51", "throughput": 2337.6, "total_tokens": 9422760} {"current_steps": 16345, "total_steps": 67140, "loss": 0.6968, "lr": 4.693151845172939e-05, "epoch": 2.434465296395591, "percentage": 24.34, "elapsed_time": "1:07:12", "remaining_time": "3:28:50", "throughput": 2337.64, "total_tokens": 9425512} {"current_steps": 16350, "total_steps": 67140, "loss": 0.6037, "lr": 4.692839817409788e-05, "epoch": 2.4352100089365507, "percentage": 24.35, "elapsed_time": "1:07:13", "remaining_time": "3:28:48", "throughput": 2337.71, "total_tokens": 9428520} {"current_steps": 16355, "total_steps": 67140, "loss": 0.8361, "lr": 4.6925276414634375e-05, "epoch": 2.4359547214775095, "percentage": 24.36, "elapsed_time": "1:07:14", "remaining_time": "3:28:47", "throughput": 2337.77, "total_tokens": 9431432} {"current_steps": 16360, "total_steps": 67140, "loss": 0.5653, "lr": 4.6922153173549835e-05, "epoch": 2.436699434018469, "percentage": 24.37, "elapsed_time": "1:07:15", "remaining_time": "3:28:45", "throughput": 2337.83, "total_tokens": 9434312} {"current_steps": 16365, "total_steps": 67140, "loss": 0.7201, "lr": 4.691902845105531e-05, "epoch": 2.437444146559428, "percentage": 24.37, "elapsed_time": "1:07:16", "remaining_time": "3:28:44", "throughput": 2337.89, "total_tokens": 9437224} {"current_steps": 16370, "total_steps": 67140, "loss": 0.624, "lr": 4.6915902247361954e-05, "epoch": 2.438188859100387, "percentage": 24.38, "elapsed_time": "1:07:17", "remaining_time": "3:28:42", "throughput": 2337.93, "total_tokens": 9439976} {"current_steps": 16375, "total_steps": 67140, "loss": 0.7064, "lr": 4.691277456268103e-05, "epoch": 2.4389335716413463, "percentage": 24.39, "elapsed_time": "1:07:18", "remaining_time": "3:28:41", "throughput": 2338.03, "total_tokens": 9443208} {"current_steps": 16380, "total_steps": 67140, "loss": 0.5561, "lr": 4.690964539722389e-05, "epoch": 2.4396782841823055, "percentage": 24.4, "elapsed_time": "1:07:20", "remaining_time": "3:28:39", "throughput": 2338.05, "total_tokens": 9445864} {"current_steps": 16385, "total_steps": 67140, "loss": 0.5567, "lr": 4.6906514751202005e-05, "epoch": 2.4404229967232647, "percentage": 24.4, "elapsed_time": "1:07:21", "remaining_time": "3:28:38", "throughput": 2338.14, "total_tokens": 9448936} {"current_steps": 16390, "total_steps": 67140, "loss": 0.5729, "lr": 4.690338262482691e-05, "epoch": 2.441167709264224, "percentage": 24.41, "elapsed_time": "1:07:22", "remaining_time": "3:28:36", "throughput": 2338.22, "total_tokens": 9451976} {"current_steps": 16395, "total_steps": 67140, "loss": 0.6121, "lr": 4.690024901831026e-05, "epoch": 2.441912421805183, "percentage": 24.42, "elapsed_time": "1:07:23", "remaining_time": "3:28:35", "throughput": 2338.28, "total_tokens": 9454824} {"current_steps": 16400, "total_steps": 67140, "loss": 0.7436, "lr": 4.6897113931863837e-05, "epoch": 2.4426571343461423, "percentage": 24.43, "elapsed_time": "1:07:24", "remaining_time": "3:28:33", "throughput": 2338.34, "total_tokens": 9457704} {"current_steps": 16405, "total_steps": 67140, "loss": 0.6005, "lr": 4.6893977365699474e-05, "epoch": 2.4434018468871015, "percentage": 24.43, "elapsed_time": "1:07:25", "remaining_time": "3:28:32", "throughput": 2338.43, "total_tokens": 9460776} {"current_steps": 16410, "total_steps": 67140, "loss": 0.6852, "lr": 4.6890839320029134e-05, "epoch": 2.4441465594280607, "percentage": 24.44, "elapsed_time": "1:07:26", "remaining_time": "3:28:30", "throughput": 2338.5, "total_tokens": 9463848} {"current_steps": 16415, "total_steps": 67140, "loss": 0.6184, "lr": 4.688769979506488e-05, "epoch": 2.44489127196902, "percentage": 24.45, "elapsed_time": "1:07:28", "remaining_time": "3:28:29", "throughput": 2338.53, "total_tokens": 9466568} {"current_steps": 16420, "total_steps": 67140, "loss": 0.5755, "lr": 4.688455879101885e-05, "epoch": 2.445635984509979, "percentage": 24.46, "elapsed_time": "1:07:29", "remaining_time": "3:28:27", "throughput": 2338.64, "total_tokens": 9469800} {"current_steps": 16425, "total_steps": 67140, "loss": 0.6412, "lr": 4.688141630810333e-05, "epoch": 2.4463806970509383, "percentage": 24.46, "elapsed_time": "1:07:30", "remaining_time": "3:28:26", "throughput": 2338.71, "total_tokens": 9472712} {"current_steps": 16430, "total_steps": 67140, "loss": 0.6077, "lr": 4.687827234653065e-05, "epoch": 2.4471254095918975, "percentage": 24.47, "elapsed_time": "1:07:31", "remaining_time": "3:28:24", "throughput": 2338.77, "total_tokens": 9475656} {"current_steps": 16435, "total_steps": 67140, "loss": 0.5175, "lr": 4.687512690651328e-05, "epoch": 2.4478701221328567, "percentage": 24.48, "elapsed_time": "1:07:32", "remaining_time": "3:28:23", "throughput": 2338.8, "total_tokens": 9478312} {"current_steps": 16440, "total_steps": 67140, "loss": 0.5815, "lr": 4.687197998826376e-05, "epoch": 2.448614834673816, "percentage": 24.49, "elapsed_time": "1:07:33", "remaining_time": "3:28:21", "throughput": 2338.88, "total_tokens": 9481352} {"current_steps": 16445, "total_steps": 67140, "loss": 0.6835, "lr": 4.686883159199477e-05, "epoch": 2.449359547214775, "percentage": 24.49, "elapsed_time": "1:07:34", "remaining_time": "3:28:20", "throughput": 2338.91, "total_tokens": 9484072} {"current_steps": 16450, "total_steps": 67140, "loss": 0.6968, "lr": 4.6865681717919047e-05, "epoch": 2.4501042597557343, "percentage": 24.5, "elapsed_time": "1:07:36", "remaining_time": "3:28:18", "throughput": 2338.98, "total_tokens": 9487080} {"current_steps": 16455, "total_steps": 67140, "loss": 0.7178, "lr": 4.686253036624946e-05, "epoch": 2.4508489722966935, "percentage": 24.51, "elapsed_time": "1:07:37", "remaining_time": "3:28:17", "throughput": 2339.02, "total_tokens": 9489928} {"current_steps": 16460, "total_steps": 67140, "loss": 0.7972, "lr": 4.6859377537198945e-05, "epoch": 2.4515936848376527, "percentage": 24.52, "elapsed_time": "1:07:38", "remaining_time": "3:28:15", "throughput": 2339.12, "total_tokens": 9493128} {"current_steps": 16465, "total_steps": 67140, "loss": 0.7981, "lr": 4.6856223230980576e-05, "epoch": 2.452338397378612, "percentage": 24.52, "elapsed_time": "1:07:39", "remaining_time": "3:28:14", "throughput": 2339.19, "total_tokens": 9496072} {"current_steps": 16470, "total_steps": 67140, "loss": 0.666, "lr": 4.6853067447807505e-05, "epoch": 2.453083109919571, "percentage": 24.53, "elapsed_time": "1:07:40", "remaining_time": "3:28:12", "throughput": 2339.24, "total_tokens": 9498984} {"current_steps": 16475, "total_steps": 67140, "loss": 0.6136, "lr": 4.684991018789298e-05, "epoch": 2.4538278224605303, "percentage": 24.54, "elapsed_time": "1:07:41", "remaining_time": "3:28:11", "throughput": 2339.3, "total_tokens": 9501864} {"current_steps": 16480, "total_steps": 67140, "loss": 0.7893, "lr": 4.6846751451450366e-05, "epoch": 2.4545725350014895, "percentage": 24.55, "elapsed_time": "1:07:42", "remaining_time": "3:28:09", "throughput": 2339.37, "total_tokens": 9504840} {"current_steps": 16485, "total_steps": 67140, "loss": 0.6144, "lr": 4.684359123869311e-05, "epoch": 2.4553172475424487, "percentage": 24.55, "elapsed_time": "1:07:44", "remaining_time": "3:28:08", "throughput": 2339.39, "total_tokens": 9507496} {"current_steps": 16490, "total_steps": 67140, "loss": 0.5385, "lr": 4.684042954983476e-05, "epoch": 2.456061960083408, "percentage": 24.56, "elapsed_time": "1:07:45", "remaining_time": "3:28:06", "throughput": 2339.44, "total_tokens": 9510376} {"current_steps": 16495, "total_steps": 67140, "loss": 0.4549, "lr": 4.683726638508899e-05, "epoch": 2.456806672624367, "percentage": 24.57, "elapsed_time": "1:07:46", "remaining_time": "3:28:05", "throughput": 2339.48, "total_tokens": 9513160} {"current_steps": 16500, "total_steps": 67140, "loss": 0.6707, "lr": 4.6834101744669526e-05, "epoch": 2.4575513851653263, "percentage": 24.58, "elapsed_time": "1:07:47", "remaining_time": "3:28:03", "throughput": 2339.55, "total_tokens": 9516168} {"current_steps": 16505, "total_steps": 67140, "loss": 0.7755, "lr": 4.683093562879024e-05, "epoch": 2.4582960977062855, "percentage": 24.58, "elapsed_time": "1:07:48", "remaining_time": "3:28:02", "throughput": 2339.61, "total_tokens": 9519048} {"current_steps": 16510, "total_steps": 67140, "loss": 0.6573, "lr": 4.682776803766509e-05, "epoch": 2.4590408102472447, "percentage": 24.59, "elapsed_time": "1:07:49", "remaining_time": "3:28:00", "throughput": 2339.62, "total_tokens": 9521704} {"current_steps": 16515, "total_steps": 67140, "loss": 0.5424, "lr": 4.682459897150812e-05, "epoch": 2.459785522788204, "percentage": 24.6, "elapsed_time": "1:07:50", "remaining_time": "3:27:58", "throughput": 2339.65, "total_tokens": 9524392} {"current_steps": 16520, "total_steps": 67140, "loss": 0.7356, "lr": 4.682142843053348e-05, "epoch": 2.4605302353291627, "percentage": 24.61, "elapsed_time": "1:07:52", "remaining_time": "3:27:57", "throughput": 2339.77, "total_tokens": 9527720} {"current_steps": 16525, "total_steps": 67140, "loss": 0.6087, "lr": 4.681825641495543e-05, "epoch": 2.4612749478701224, "percentage": 24.61, "elapsed_time": "1:07:53", "remaining_time": "3:27:55", "throughput": 2339.83, "total_tokens": 9530568} {"current_steps": 16530, "total_steps": 67140, "loss": 0.8224, "lr": 4.681508292498832e-05, "epoch": 2.462019660411081, "percentage": 24.62, "elapsed_time": "1:07:54", "remaining_time": "3:27:54", "throughput": 2339.89, "total_tokens": 9533512} {"current_steps": 16535, "total_steps": 67140, "loss": 0.5636, "lr": 4.681190796084659e-05, "epoch": 2.4627643729520408, "percentage": 24.63, "elapsed_time": "1:07:55", "remaining_time": "3:27:52", "throughput": 2339.95, "total_tokens": 9536424} {"current_steps": 16540, "total_steps": 67140, "loss": 0.7502, "lr": 4.680873152274481e-05, "epoch": 2.4635090854929995, "percentage": 24.64, "elapsed_time": "1:07:56", "remaining_time": "3:27:51", "throughput": 2339.99, "total_tokens": 9539176} {"current_steps": 16545, "total_steps": 67140, "loss": 0.6192, "lr": 4.680555361089762e-05, "epoch": 2.4642537980339587, "percentage": 24.64, "elapsed_time": "1:07:57", "remaining_time": "3:27:49", "throughput": 2340.01, "total_tokens": 9541864} {"current_steps": 16550, "total_steps": 67140, "loss": 0.6704, "lr": 4.680237422551977e-05, "epoch": 2.464998510574918, "percentage": 24.65, "elapsed_time": "1:07:58", "remaining_time": "3:27:48", "throughput": 2340.12, "total_tokens": 9545064} {"current_steps": 16555, "total_steps": 67140, "loss": 0.8125, "lr": 4.679919336682611e-05, "epoch": 2.465743223115877, "percentage": 24.66, "elapsed_time": "1:08:00", "remaining_time": "3:27:46", "throughput": 2340.18, "total_tokens": 9548008} {"current_steps": 16560, "total_steps": 67140, "loss": 0.6403, "lr": 4.6796011035031596e-05, "epoch": 2.4664879356568363, "percentage": 24.66, "elapsed_time": "1:08:01", "remaining_time": "3:27:45", "throughput": 2340.2, "total_tokens": 9550632} {"current_steps": 16565, "total_steps": 67140, "loss": 0.606, "lr": 4.6792827230351265e-05, "epoch": 2.4672326481977955, "percentage": 24.67, "elapsed_time": "1:08:02", "remaining_time": "3:27:43", "throughput": 2340.26, "total_tokens": 9553576} {"current_steps": 16570, "total_steps": 67140, "loss": 0.6075, "lr": 4.678964195300028e-05, "epoch": 2.4679773607387547, "percentage": 24.68, "elapsed_time": "1:08:03", "remaining_time": "3:27:42", "throughput": 2340.26, "total_tokens": 9556168} {"current_steps": 16575, "total_steps": 67140, "loss": 0.7335, "lr": 4.678645520319388e-05, "epoch": 2.468722073279714, "percentage": 24.69, "elapsed_time": "1:08:04", "remaining_time": "3:27:40", "throughput": 2340.3, "total_tokens": 9558888} {"current_steps": 16580, "total_steps": 67140, "loss": 0.6615, "lr": 4.678326698114741e-05, "epoch": 2.469466785820673, "percentage": 24.69, "elapsed_time": "1:08:05", "remaining_time": "3:27:38", "throughput": 2340.36, "total_tokens": 9561768} {"current_steps": 16585, "total_steps": 67140, "loss": 0.6961, "lr": 4.678007728707633e-05, "epoch": 2.4702114983616323, "percentage": 24.7, "elapsed_time": "1:08:06", "remaining_time": "3:27:37", "throughput": 2340.44, "total_tokens": 9564776} {"current_steps": 16590, "total_steps": 67140, "loss": 0.5725, "lr": 4.6776886121196175e-05, "epoch": 2.4709562109025915, "percentage": 24.71, "elapsed_time": "1:08:07", "remaining_time": "3:27:35", "throughput": 2340.52, "total_tokens": 9567880} {"current_steps": 16595, "total_steps": 67140, "loss": 0.6527, "lr": 4.677369348372259e-05, "epoch": 2.4717009234435507, "percentage": 24.72, "elapsed_time": "1:08:09", "remaining_time": "3:27:34", "throughput": 2340.62, "total_tokens": 9570984} {"current_steps": 16600, "total_steps": 67140, "loss": 0.6457, "lr": 4.677049937487134e-05, "epoch": 2.47244563598451, "percentage": 24.72, "elapsed_time": "1:08:10", "remaining_time": "3:27:33", "throughput": 2340.7, "total_tokens": 9573992} {"current_steps": 16605, "total_steps": 67140, "loss": 0.5802, "lr": 4.6767303794858235e-05, "epoch": 2.473190348525469, "percentage": 24.73, "elapsed_time": "1:08:11", "remaining_time": "3:27:31", "throughput": 2340.79, "total_tokens": 9577096} {"current_steps": 16610, "total_steps": 67140, "loss": 0.6986, "lr": 4.676410674389925e-05, "epoch": 2.4739350610664284, "percentage": 24.74, "elapsed_time": "1:08:12", "remaining_time": "3:27:30", "throughput": 2340.87, "total_tokens": 9580168} {"current_steps": 16615, "total_steps": 67140, "loss": 0.6681, "lr": 4.676090822221042e-05, "epoch": 2.4746797736073876, "percentage": 24.75, "elapsed_time": "1:08:13", "remaining_time": "3:27:28", "throughput": 2340.9, "total_tokens": 9582888} {"current_steps": 16620, "total_steps": 67140, "loss": 0.6751, "lr": 4.6757708230007877e-05, "epoch": 2.4754244861483468, "percentage": 24.75, "elapsed_time": "1:08:14", "remaining_time": "3:27:27", "throughput": 2340.97, "total_tokens": 9585832} {"current_steps": 16625, "total_steps": 67140, "loss": 0.839, "lr": 4.6754506767507874e-05, "epoch": 2.476169198689306, "percentage": 24.76, "elapsed_time": "1:08:15", "remaining_time": "3:27:25", "throughput": 2341.02, "total_tokens": 9588680} {"current_steps": 16630, "total_steps": 67140, "loss": 0.5225, "lr": 4.6751303834926755e-05, "epoch": 2.476913911230265, "percentage": 24.77, "elapsed_time": "1:08:17", "remaining_time": "3:27:23", "throughput": 2341.03, "total_tokens": 9591304} {"current_steps": 16635, "total_steps": 67140, "loss": 0.7992, "lr": 4.674809943248095e-05, "epoch": 2.4776586237712244, "percentage": 24.78, "elapsed_time": "1:08:18", "remaining_time": "3:27:22", "throughput": 2341.08, "total_tokens": 9594184} {"current_steps": 16640, "total_steps": 67140, "loss": 0.633, "lr": 4.674489356038702e-05, "epoch": 2.4784033363121836, "percentage": 24.78, "elapsed_time": "1:08:19", "remaining_time": "3:27:20", "throughput": 2341.12, "total_tokens": 9597000} {"current_steps": 16645, "total_steps": 67140, "loss": 0.6515, "lr": 4.674168621886158e-05, "epoch": 2.4791480488531428, "percentage": 24.79, "elapsed_time": "1:08:20", "remaining_time": "3:27:19", "throughput": 2341.19, "total_tokens": 9600040} {"current_steps": 16650, "total_steps": 67140, "loss": 0.463, "lr": 4.673847740812138e-05, "epoch": 2.479892761394102, "percentage": 24.8, "elapsed_time": "1:08:21", "remaining_time": "3:27:17", "throughput": 2341.25, "total_tokens": 9602984} {"current_steps": 16655, "total_steps": 67140, "loss": 0.7894, "lr": 4.673526712838326e-05, "epoch": 2.480637473935061, "percentage": 24.81, "elapsed_time": "1:08:22", "remaining_time": "3:27:16", "throughput": 2341.28, "total_tokens": 9605672} {"current_steps": 16660, "total_steps": 67140, "loss": 0.7094, "lr": 4.673205537986416e-05, "epoch": 2.4813821864760204, "percentage": 24.81, "elapsed_time": "1:08:23", "remaining_time": "3:27:14", "throughput": 2341.27, "total_tokens": 9608232} {"current_steps": 16665, "total_steps": 67140, "loss": 0.6324, "lr": 4.672884216278112e-05, "epoch": 2.4821268990169796, "percentage": 24.82, "elapsed_time": "1:08:24", "remaining_time": "3:27:13", "throughput": 2341.31, "total_tokens": 9610984} {"current_steps": 16670, "total_steps": 67140, "loss": 0.6497, "lr": 4.672562747735126e-05, "epoch": 2.482871611557939, "percentage": 24.83, "elapsed_time": "1:08:26", "remaining_time": "3:27:11", "throughput": 2341.4, "total_tokens": 9614120} {"current_steps": 16675, "total_steps": 67140, "loss": 0.6773, "lr": 4.6722411323791824e-05, "epoch": 2.483616324098898, "percentage": 24.84, "elapsed_time": "1:08:27", "remaining_time": "3:27:10", "throughput": 2341.52, "total_tokens": 9617448} {"current_steps": 16680, "total_steps": 67140, "loss": 0.7795, "lr": 4.671919370232015e-05, "epoch": 2.484361036639857, "percentage": 24.84, "elapsed_time": "1:08:28", "remaining_time": "3:27:08", "throughput": 2341.61, "total_tokens": 9620520} {"current_steps": 16685, "total_steps": 67140, "loss": 0.5803, "lr": 4.671597461315367e-05, "epoch": 2.4851057491808164, "percentage": 24.85, "elapsed_time": "1:08:29", "remaining_time": "3:27:07", "throughput": 2341.64, "total_tokens": 9623272} {"current_steps": 16690, "total_steps": 67140, "loss": 0.6913, "lr": 4.6712754056509924e-05, "epoch": 2.4858504617217756, "percentage": 24.86, "elapsed_time": "1:08:30", "remaining_time": "3:27:05", "throughput": 2341.69, "total_tokens": 9626088} {"current_steps": 16695, "total_steps": 67140, "loss": 0.6541, "lr": 4.670953203260653e-05, "epoch": 2.4865951742627344, "percentage": 24.87, "elapsed_time": "1:08:31", "remaining_time": "3:27:04", "throughput": 2341.79, "total_tokens": 9629288} {"current_steps": 16700, "total_steps": 67140, "loss": 0.6182, "lr": 4.6706308541661224e-05, "epoch": 2.487339886803694, "percentage": 24.87, "elapsed_time": "1:08:33", "remaining_time": "3:27:02", "throughput": 2341.78, "total_tokens": 9631816} {"current_steps": 16705, "total_steps": 67140, "loss": 0.671, "lr": 4.670308358389184e-05, "epoch": 2.4880845993446528, "percentage": 24.88, "elapsed_time": "1:08:34", "remaining_time": "3:27:01", "throughput": 2341.8, "total_tokens": 9634504} {"current_steps": 16710, "total_steps": 67140, "loss": 0.9124, "lr": 4.66998571595163e-05, "epoch": 2.488829311885612, "percentage": 24.89, "elapsed_time": "1:08:35", "remaining_time": "3:26:59", "throughput": 2341.87, "total_tokens": 9637448} {"current_steps": 16715, "total_steps": 67140, "loss": 0.6805, "lr": 4.6696629268752647e-05, "epoch": 2.489574024426571, "percentage": 24.9, "elapsed_time": "1:08:36", "remaining_time": "3:26:58", "throughput": 2341.88, "total_tokens": 9640072} {"current_steps": 16720, "total_steps": 67140, "loss": 0.7029, "lr": 4.6693399911818994e-05, "epoch": 2.4903187369675304, "percentage": 24.9, "elapsed_time": "1:08:37", "remaining_time": "3:26:56", "throughput": 2341.92, "total_tokens": 9642856} {"current_steps": 16725, "total_steps": 67140, "loss": 0.6714, "lr": 4.669016908893358e-05, "epoch": 2.4910634495084896, "percentage": 24.91, "elapsed_time": "1:08:38", "remaining_time": "3:26:54", "throughput": 2341.96, "total_tokens": 9645640} {"current_steps": 16730, "total_steps": 67140, "loss": 0.6877, "lr": 4.668693680031472e-05, "epoch": 2.4918081620494488, "percentage": 24.92, "elapsed_time": "1:08:39", "remaining_time": "3:26:53", "throughput": 2341.97, "total_tokens": 9648264} {"current_steps": 16735, "total_steps": 67140, "loss": 0.6459, "lr": 4.668370304618084e-05, "epoch": 2.492552874590408, "percentage": 24.93, "elapsed_time": "1:08:40", "remaining_time": "3:26:51", "throughput": 2341.96, "total_tokens": 9650728} {"current_steps": 16740, "total_steps": 67140, "loss": 0.7051, "lr": 4.668046782675048e-05, "epoch": 2.493297587131367, "percentage": 24.93, "elapsed_time": "1:08:41", "remaining_time": "3:26:50", "throughput": 2341.96, "total_tokens": 9653320} {"current_steps": 16745, "total_steps": 67140, "loss": 0.6144, "lr": 4.667723114224224e-05, "epoch": 2.4940422996723264, "percentage": 24.94, "elapsed_time": "1:08:42", "remaining_time": "3:26:48", "throughput": 2341.96, "total_tokens": 9655848} {"current_steps": 16750, "total_steps": 67140, "loss": 0.5815, "lr": 4.6673992992874855e-05, "epoch": 2.4947870122132856, "percentage": 24.95, "elapsed_time": "1:08:44", "remaining_time": "3:26:46", "throughput": 2342.0, "total_tokens": 9658696} {"current_steps": 16755, "total_steps": 67140, "loss": 0.8167, "lr": 4.667075337886714e-05, "epoch": 2.495531724754245, "percentage": 24.96, "elapsed_time": "1:08:45", "remaining_time": "3:26:45", "throughput": 2342.11, "total_tokens": 9661960} {"current_steps": 16760, "total_steps": 67140, "loss": 0.579, "lr": 4.6667512300438025e-05, "epoch": 2.496276437295204, "percentage": 24.96, "elapsed_time": "1:08:46", "remaining_time": "3:26:44", "throughput": 2342.14, "total_tokens": 9664744} {"current_steps": 16765, "total_steps": 67140, "loss": 0.6213, "lr": 4.6664269757806525e-05, "epoch": 2.497021149836163, "percentage": 24.97, "elapsed_time": "1:08:47", "remaining_time": "3:26:42", "throughput": 2342.18, "total_tokens": 9667528} {"current_steps": 16770, "total_steps": 67140, "loss": 0.6033, "lr": 4.6661025751191746e-05, "epoch": 2.4977658623771224, "percentage": 24.98, "elapsed_time": "1:08:48", "remaining_time": "3:26:40", "throughput": 2342.21, "total_tokens": 9670280} {"current_steps": 16775, "total_steps": 67140, "loss": 0.7276, "lr": 4.665778028081292e-05, "epoch": 2.4985105749180816, "percentage": 24.99, "elapsed_time": "1:08:49", "remaining_time": "3:26:39", "throughput": 2342.25, "total_tokens": 9673128} {"current_steps": 16780, "total_steps": 67140, "loss": 0.7191, "lr": 4.6654533346889356e-05, "epoch": 2.499255287459041, "percentage": 24.99, "elapsed_time": "1:08:50", "remaining_time": "3:26:37", "throughput": 2342.3, "total_tokens": 9675976} {"current_steps": 16785, "total_steps": 67140, "loss": 0.6316, "lr": 4.665128494964047e-05, "epoch": 2.5, "percentage": 25.0, "elapsed_time": "1:08:52", "remaining_time": "3:26:36", "throughput": 2342.32, "total_tokens": 9678632} {"current_steps": 16785, "total_steps": 67140, "eval_loss": 0.656985342502594, "epoch": 2.5, "percentage": 25.0, "elapsed_time": "1:10:06", "remaining_time": "3:30:19", "throughput": 2300.96, "total_tokens": 9678632} {"current_steps": 16790, "total_steps": 67140, "loss": 0.6932, "lr": 4.664803508928577e-05, "epoch": 2.500744712540959, "percentage": 25.01, "elapsed_time": "1:10:08", "remaining_time": "3:30:21", "throughput": 2300.22, "total_tokens": 9681448} {"current_steps": 16795, "total_steps": 67140, "loss": 0.5639, "lr": 4.664478376604488e-05, "epoch": 2.5014894250819184, "percentage": 25.01, "elapsed_time": "1:10:10", "remaining_time": "3:30:20", "throughput": 2300.31, "total_tokens": 9684456} {"current_steps": 16800, "total_steps": 67140, "loss": 0.7801, "lr": 4.6641530980137506e-05, "epoch": 2.5022341376228776, "percentage": 25.02, "elapsed_time": "1:10:11", "remaining_time": "3:30:18", "throughput": 2300.39, "total_tokens": 9687496} {"current_steps": 16805, "total_steps": 67140, "loss": 0.5105, "lr": 4.663827673178345e-05, "epoch": 2.502978850163837, "percentage": 25.03, "elapsed_time": "1:10:12", "remaining_time": "3:30:16", "throughput": 2300.42, "total_tokens": 9690184} {"current_steps": 16810, "total_steps": 67140, "loss": 0.6822, "lr": 4.6635021021202624e-05, "epoch": 2.503723562704796, "percentage": 25.04, "elapsed_time": "1:10:13", "remaining_time": "3:30:15", "throughput": 2300.45, "total_tokens": 9692808} {"current_steps": 16815, "total_steps": 67140, "loss": 0.7127, "lr": 4.6631763848615044e-05, "epoch": 2.504468275245755, "percentage": 25.04, "elapsed_time": "1:10:14", "remaining_time": "3:30:13", "throughput": 2300.49, "total_tokens": 9695528} {"current_steps": 16820, "total_steps": 67140, "loss": 0.534, "lr": 4.662850521424081e-05, "epoch": 2.5052129877867144, "percentage": 25.05, "elapsed_time": "1:10:15", "remaining_time": "3:30:12", "throughput": 2300.55, "total_tokens": 9698440} {"current_steps": 16825, "total_steps": 67140, "loss": 0.752, "lr": 4.662524511830013e-05, "epoch": 2.5059577003276736, "percentage": 25.06, "elapsed_time": "1:10:16", "remaining_time": "3:30:10", "throughput": 2300.58, "total_tokens": 9701096} {"current_steps": 16830, "total_steps": 67140, "loss": 0.8149, "lr": 4.662198356101331e-05, "epoch": 2.506702412868633, "percentage": 25.07, "elapsed_time": "1:10:17", "remaining_time": "3:30:08", "throughput": 2300.65, "total_tokens": 9704008} {"current_steps": 16835, "total_steps": 67140, "loss": 0.5418, "lr": 4.6618720542600744e-05, "epoch": 2.507447125409592, "percentage": 25.07, "elapsed_time": "1:10:19", "remaining_time": "3:30:07", "throughput": 2300.7, "total_tokens": 9706824} {"current_steps": 16840, "total_steps": 67140, "loss": 0.7212, "lr": 4.6615456063282944e-05, "epoch": 2.5081918379505512, "percentage": 25.08, "elapsed_time": "1:10:20", "remaining_time": "3:30:05", "throughput": 2300.75, "total_tokens": 9709576} {"current_steps": 16845, "total_steps": 67140, "loss": 0.5801, "lr": 4.66121901232805e-05, "epoch": 2.5089365504915104, "percentage": 25.09, "elapsed_time": "1:10:21", "remaining_time": "3:30:03", "throughput": 2300.79, "total_tokens": 9712264} {"current_steps": 16850, "total_steps": 67140, "loss": 0.6135, "lr": 4.6608922722814116e-05, "epoch": 2.509681263032469, "percentage": 25.1, "elapsed_time": "1:10:22", "remaining_time": "3:30:02", "throughput": 2300.85, "total_tokens": 9715112} {"current_steps": 16855, "total_steps": 67140, "loss": 0.6004, "lr": 4.6605653862104596e-05, "epoch": 2.510425975573429, "percentage": 25.1, "elapsed_time": "1:10:23", "remaining_time": "3:30:00", "throughput": 2300.89, "total_tokens": 9717832} {"current_steps": 16860, "total_steps": 67140, "loss": 0.5133, "lr": 4.660238354137283e-05, "epoch": 2.5111706881143876, "percentage": 25.11, "elapsed_time": "1:10:24", "remaining_time": "3:29:58", "throughput": 2300.95, "total_tokens": 9720712} {"current_steps": 16865, "total_steps": 67140, "loss": 0.5087, "lr": 4.6599111760839805e-05, "epoch": 2.5119154006553472, "percentage": 25.12, "elapsed_time": "1:10:25", "remaining_time": "3:29:57", "throughput": 2301.04, "total_tokens": 9723784} {"current_steps": 16870, "total_steps": 67140, "loss": 0.5628, "lr": 4.659583852072663e-05, "epoch": 2.512660113196306, "percentage": 25.13, "elapsed_time": "1:10:26", "remaining_time": "3:29:55", "throughput": 2301.13, "total_tokens": 9726824} {"current_steps": 16875, "total_steps": 67140, "loss": 0.5327, "lr": 4.6592563821254486e-05, "epoch": 2.5134048257372656, "percentage": 25.13, "elapsed_time": "1:10:28", "remaining_time": "3:29:54", "throughput": 2301.21, "total_tokens": 9729800} {"current_steps": 16880, "total_steps": 67140, "loss": 0.6174, "lr": 4.658928766264467e-05, "epoch": 2.5141495382782244, "percentage": 25.14, "elapsed_time": "1:10:29", "remaining_time": "3:29:52", "throughput": 2301.28, "total_tokens": 9732680} {"current_steps": 16885, "total_steps": 67140, "loss": 0.8685, "lr": 4.658601004511856e-05, "epoch": 2.514894250819184, "percentage": 25.15, "elapsed_time": "1:10:30", "remaining_time": "3:29:51", "throughput": 2301.36, "total_tokens": 9735688} {"current_steps": 16890, "total_steps": 67140, "loss": 0.7824, "lr": 4.658273096889768e-05, "epoch": 2.515638963360143, "percentage": 25.16, "elapsed_time": "1:10:31", "remaining_time": "3:29:49", "throughput": 2301.45, "total_tokens": 9738728} {"current_steps": 16895, "total_steps": 67140, "loss": 0.7291, "lr": 4.657945043420356e-05, "epoch": 2.516383675901102, "percentage": 25.16, "elapsed_time": "1:10:32", "remaining_time": "3:29:47", "throughput": 2301.5, "total_tokens": 9741512} {"current_steps": 16900, "total_steps": 67140, "loss": 0.6844, "lr": 4.657616844125794e-05, "epoch": 2.517128388442061, "percentage": 25.17, "elapsed_time": "1:10:33", "remaining_time": "3:29:46", "throughput": 2301.53, "total_tokens": 9744200} {"current_steps": 16905, "total_steps": 67140, "loss": 0.8852, "lr": 4.657288499028256e-05, "epoch": 2.5178731009830204, "percentage": 25.18, "elapsed_time": "1:10:34", "remaining_time": "3:29:44", "throughput": 2301.65, "total_tokens": 9747432} {"current_steps": 16910, "total_steps": 67140, "loss": 0.6885, "lr": 4.656960008149933e-05, "epoch": 2.5186178135239796, "percentage": 25.19, "elapsed_time": "1:10:36", "remaining_time": "3:29:43", "throughput": 2301.74, "total_tokens": 9750536} {"current_steps": 16915, "total_steps": 67140, "loss": 0.625, "lr": 4.656631371513022e-05, "epoch": 2.519362526064939, "percentage": 25.19, "elapsed_time": "1:10:37", "remaining_time": "3:29:41", "throughput": 2301.79, "total_tokens": 9753320} {"current_steps": 16920, "total_steps": 67140, "loss": 0.5025, "lr": 4.656302589139732e-05, "epoch": 2.520107238605898, "percentage": 25.2, "elapsed_time": "1:10:38", "remaining_time": "3:29:39", "throughput": 2301.83, "total_tokens": 9756040} {"current_steps": 16925, "total_steps": 67140, "loss": 0.575, "lr": 4.655973661052279e-05, "epoch": 2.5208519511468572, "percentage": 25.21, "elapsed_time": "1:10:39", "remaining_time": "3:29:38", "throughput": 2301.92, "total_tokens": 9759112} {"current_steps": 16930, "total_steps": 67140, "loss": 0.6473, "lr": 4.655644587272891e-05, "epoch": 2.5215966636878164, "percentage": 25.22, "elapsed_time": "1:10:40", "remaining_time": "3:29:36", "throughput": 2302.0, "total_tokens": 9762088} {"current_steps": 16935, "total_steps": 67140, "loss": 0.6486, "lr": 4.655315367823806e-05, "epoch": 2.5223413762287756, "percentage": 25.22, "elapsed_time": "1:10:41", "remaining_time": "3:29:35", "throughput": 2302.03, "total_tokens": 9764776} {"current_steps": 16940, "total_steps": 67140, "loss": 0.6083, "lr": 4.654986002727273e-05, "epoch": 2.523086088769735, "percentage": 25.23, "elapsed_time": "1:10:42", "remaining_time": "3:29:33", "throughput": 2302.09, "total_tokens": 9767656} {"current_steps": 16945, "total_steps": 67140, "loss": 0.7136, "lr": 4.6546564920055455e-05, "epoch": 2.523830801310694, "percentage": 25.24, "elapsed_time": "1:10:44", "remaining_time": "3:29:31", "throughput": 2302.12, "total_tokens": 9770376} {"current_steps": 16950, "total_steps": 67140, "loss": 0.5883, "lr": 4.654326835680894e-05, "epoch": 2.5245755138516532, "percentage": 25.25, "elapsed_time": "1:10:45", "remaining_time": "3:29:30", "throughput": 2302.2, "total_tokens": 9773320} {"current_steps": 16955, "total_steps": 67140, "loss": 0.7595, "lr": 4.6539970337755936e-05, "epoch": 2.5253202263926124, "percentage": 25.25, "elapsed_time": "1:10:46", "remaining_time": "3:29:28", "throughput": 2302.28, "total_tokens": 9776264} {"current_steps": 16960, "total_steps": 67140, "loss": 0.8088, "lr": 4.6536670863119305e-05, "epoch": 2.5260649389335716, "percentage": 25.26, "elapsed_time": "1:10:47", "remaining_time": "3:29:27", "throughput": 2302.36, "total_tokens": 9779304} {"current_steps": 16965, "total_steps": 67140, "loss": 0.7186, "lr": 4.6533369933122014e-05, "epoch": 2.526809651474531, "percentage": 25.27, "elapsed_time": "1:10:48", "remaining_time": "3:29:25", "throughput": 2302.46, "total_tokens": 9782408} {"current_steps": 16970, "total_steps": 67140, "loss": 0.679, "lr": 4.6530067547987145e-05, "epoch": 2.52755436401549, "percentage": 25.28, "elapsed_time": "1:10:49", "remaining_time": "3:29:24", "throughput": 2302.54, "total_tokens": 9785384} {"current_steps": 16975, "total_steps": 67140, "loss": 0.627, "lr": 4.652676370793784e-05, "epoch": 2.5282990765564493, "percentage": 25.28, "elapsed_time": "1:10:50", "remaining_time": "3:29:22", "throughput": 2302.6, "total_tokens": 9788264} {"current_steps": 16980, "total_steps": 67140, "loss": 0.6123, "lr": 4.6523458413197364e-05, "epoch": 2.5290437890974085, "percentage": 25.29, "elapsed_time": "1:10:52", "remaining_time": "3:29:20", "throughput": 2302.65, "total_tokens": 9791048} {"current_steps": 16985, "total_steps": 67140, "loss": 0.7568, "lr": 4.6520151663989075e-05, "epoch": 2.5297885016383677, "percentage": 25.3, "elapsed_time": "1:10:53", "remaining_time": "3:29:19", "throughput": 2302.68, "total_tokens": 9793704} {"current_steps": 16990, "total_steps": 67140, "loss": 0.8096, "lr": 4.6516843460536434e-05, "epoch": 2.530533214179327, "percentage": 25.31, "elapsed_time": "1:10:54", "remaining_time": "3:29:17", "throughput": 2302.77, "total_tokens": 9796712} {"current_steps": 16995, "total_steps": 67140, "loss": 0.6458, "lr": 4.651353380306299e-05, "epoch": 2.531277926720286, "percentage": 25.31, "elapsed_time": "1:10:55", "remaining_time": "3:29:15", "throughput": 2302.81, "total_tokens": 9799432} {"current_steps": 17000, "total_steps": 67140, "loss": 0.6308, "lr": 4.65102226917924e-05, "epoch": 2.5320226392612453, "percentage": 25.32, "elapsed_time": "1:10:56", "remaining_time": "3:29:14", "throughput": 2302.92, "total_tokens": 9802600} {"current_steps": 17005, "total_steps": 67140, "loss": 0.7014, "lr": 4.650691012694842e-05, "epoch": 2.5327673518022045, "percentage": 25.33, "elapsed_time": "1:10:57", "remaining_time": "3:29:12", "throughput": 2303.02, "total_tokens": 9805736} {"current_steps": 17010, "total_steps": 67140, "loss": 0.6256, "lr": 4.650359610875489e-05, "epoch": 2.5335120643431637, "percentage": 25.34, "elapsed_time": "1:10:58", "remaining_time": "3:29:11", "throughput": 2303.06, "total_tokens": 9808392} {"current_steps": 17015, "total_steps": 67140, "loss": 0.4834, "lr": 4.650028063743577e-05, "epoch": 2.534256776884123, "percentage": 25.34, "elapsed_time": "1:11:00", "remaining_time": "3:29:09", "throughput": 2303.15, "total_tokens": 9811464} {"current_steps": 17020, "total_steps": 67140, "loss": 0.58, "lr": 4.649696371321509e-05, "epoch": 2.535001489425082, "percentage": 25.35, "elapsed_time": "1:11:01", "remaining_time": "3:29:07", "throughput": 2303.18, "total_tokens": 9814120} {"current_steps": 17025, "total_steps": 67140, "loss": 0.5879, "lr": 4.6493645336317e-05, "epoch": 2.535746201966041, "percentage": 25.36, "elapsed_time": "1:11:02", "remaining_time": "3:29:06", "throughput": 2303.24, "total_tokens": 9816936} {"current_steps": 17030, "total_steps": 67140, "loss": 0.5954, "lr": 4.6490325506965746e-05, "epoch": 2.5364909145070005, "percentage": 25.36, "elapsed_time": "1:11:03", "remaining_time": "3:29:04", "throughput": 2303.29, "total_tokens": 9819720} {"current_steps": 17035, "total_steps": 67140, "loss": 0.5559, "lr": 4.648700422538567e-05, "epoch": 2.5372356270479592, "percentage": 25.37, "elapsed_time": "1:11:04", "remaining_time": "3:29:03", "throughput": 2303.32, "total_tokens": 9822472} {"current_steps": 17040, "total_steps": 67140, "loss": 0.6838, "lr": 4.648368149180121e-05, "epoch": 2.537980339588919, "percentage": 25.38, "elapsed_time": "1:11:05", "remaining_time": "3:29:01", "throughput": 2303.39, "total_tokens": 9825352} {"current_steps": 17045, "total_steps": 67140, "loss": 0.7494, "lr": 4.64803573064369e-05, "epoch": 2.5387250521298776, "percentage": 25.39, "elapsed_time": "1:11:06", "remaining_time": "3:28:59", "throughput": 2303.47, "total_tokens": 9828296} {"current_steps": 17050, "total_steps": 67140, "loss": 0.6537, "lr": 4.647703166951738e-05, "epoch": 2.5394697646708373, "percentage": 25.39, "elapsed_time": "1:11:07", "remaining_time": "3:28:58", "throughput": 2303.52, "total_tokens": 9831048} {"current_steps": 17055, "total_steps": 67140, "loss": 0.6628, "lr": 4.6473704581267374e-05, "epoch": 2.540214477211796, "percentage": 25.4, "elapsed_time": "1:11:08", "remaining_time": "3:28:56", "throughput": 2303.56, "total_tokens": 9833896} {"current_steps": 17060, "total_steps": 67140, "loss": 0.537, "lr": 4.6470376041911715e-05, "epoch": 2.5409591897527557, "percentage": 25.41, "elapsed_time": "1:11:10", "remaining_time": "3:28:55", "throughput": 2303.65, "total_tokens": 9836904} {"current_steps": 17065, "total_steps": 67140, "loss": 0.6545, "lr": 4.646704605167534e-05, "epoch": 2.5417039022937145, "percentage": 25.42, "elapsed_time": "1:11:11", "remaining_time": "3:28:53", "throughput": 2303.72, "total_tokens": 9839816} {"current_steps": 17070, "total_steps": 67140, "loss": 0.7567, "lr": 4.646371461078327e-05, "epoch": 2.5424486148346737, "percentage": 25.42, "elapsed_time": "1:11:12", "remaining_time": "3:28:51", "throughput": 2303.79, "total_tokens": 9842792} {"current_steps": 17075, "total_steps": 67140, "loss": 0.6938, "lr": 4.646038171946063e-05, "epoch": 2.543193327375633, "percentage": 25.43, "elapsed_time": "1:11:13", "remaining_time": "3:28:50", "throughput": 2303.81, "total_tokens": 9845416} {"current_steps": 17080, "total_steps": 67140, "loss": 0.7519, "lr": 4.645704737793265e-05, "epoch": 2.543938039916592, "percentage": 25.44, "elapsed_time": "1:11:14", "remaining_time": "3:28:48", "throughput": 2303.92, "total_tokens": 9848584} {"current_steps": 17085, "total_steps": 67140, "loss": 0.7972, "lr": 4.645371158642464e-05, "epoch": 2.5446827524575513, "percentage": 25.45, "elapsed_time": "1:11:15", "remaining_time": "3:28:47", "throughput": 2304.04, "total_tokens": 9851816} {"current_steps": 17090, "total_steps": 67140, "loss": 0.6555, "lr": 4.645037434516204e-05, "epoch": 2.5454274649985105, "percentage": 25.45, "elapsed_time": "1:11:17", "remaining_time": "3:28:45", "throughput": 2304.11, "total_tokens": 9854728} {"current_steps": 17095, "total_steps": 67140, "loss": 0.7732, "lr": 4.644703565437033e-05, "epoch": 2.5461721775394697, "percentage": 25.46, "elapsed_time": "1:11:18", "remaining_time": "3:28:44", "throughput": 2304.17, "total_tokens": 9857576} {"current_steps": 17100, "total_steps": 67140, "loss": 0.7215, "lr": 4.644369551427516e-05, "epoch": 2.546916890080429, "percentage": 25.47, "elapsed_time": "1:11:19", "remaining_time": "3:28:42", "throughput": 2304.21, "total_tokens": 9860296} {"current_steps": 17105, "total_steps": 67140, "loss": 0.743, "lr": 4.6440353925102234e-05, "epoch": 2.547661602621388, "percentage": 25.48, "elapsed_time": "1:11:20", "remaining_time": "3:28:40", "throughput": 2304.27, "total_tokens": 9863176} {"current_steps": 17110, "total_steps": 67140, "loss": 0.7104, "lr": 4.643701088707736e-05, "epoch": 2.5484063151623473, "percentage": 25.48, "elapsed_time": "1:11:21", "remaining_time": "3:28:39", "throughput": 2304.35, "total_tokens": 9866152} {"current_steps": 17115, "total_steps": 67140, "loss": 0.7089, "lr": 4.643366640042643e-05, "epoch": 2.5491510277033065, "percentage": 25.49, "elapsed_time": "1:11:22", "remaining_time": "3:28:37", "throughput": 2304.39, "total_tokens": 9868904} {"current_steps": 17120, "total_steps": 67140, "loss": 0.6282, "lr": 4.643032046537549e-05, "epoch": 2.5498957402442657, "percentage": 25.5, "elapsed_time": "1:11:23", "remaining_time": "3:28:35", "throughput": 2304.42, "total_tokens": 9871560} {"current_steps": 17125, "total_steps": 67140, "loss": 0.7688, "lr": 4.642697308215061e-05, "epoch": 2.550640452785225, "percentage": 25.51, "elapsed_time": "1:11:24", "remaining_time": "3:28:34", "throughput": 2304.49, "total_tokens": 9874536} {"current_steps": 17130, "total_steps": 67140, "loss": 0.6773, "lr": 4.6423624250978e-05, "epoch": 2.551385165326184, "percentage": 25.51, "elapsed_time": "1:11:26", "remaining_time": "3:28:32", "throughput": 2304.56, "total_tokens": 9877448} {"current_steps": 17135, "total_steps": 67140, "loss": 0.574, "lr": 4.6420273972083985e-05, "epoch": 2.5521298778671433, "percentage": 25.52, "elapsed_time": "1:11:27", "remaining_time": "3:28:31", "throughput": 2304.62, "total_tokens": 9880296} {"current_steps": 17140, "total_steps": 67140, "loss": 0.657, "lr": 4.641692224569493e-05, "epoch": 2.5528745904081025, "percentage": 25.53, "elapsed_time": "1:11:28", "remaining_time": "3:28:29", "throughput": 2304.64, "total_tokens": 9882920} {"current_steps": 17145, "total_steps": 67140, "loss": 0.6002, "lr": 4.641356907203734e-05, "epoch": 2.5536193029490617, "percentage": 25.54, "elapsed_time": "1:11:29", "remaining_time": "3:28:27", "throughput": 2304.7, "total_tokens": 9885736} {"current_steps": 17150, "total_steps": 67140, "loss": 0.5913, "lr": 4.6410214451337816e-05, "epoch": 2.554364015490021, "percentage": 25.54, "elapsed_time": "1:11:30", "remaining_time": "3:28:26", "throughput": 2304.75, "total_tokens": 9888488} {"current_steps": 17155, "total_steps": 67140, "loss": 0.6907, "lr": 4.6406858383823056e-05, "epoch": 2.55510872803098, "percentage": 25.55, "elapsed_time": "1:11:31", "remaining_time": "3:28:24", "throughput": 2304.8, "total_tokens": 9891368} {"current_steps": 17160, "total_steps": 67140, "loss": 0.674, "lr": 4.640350086971983e-05, "epoch": 2.5558534405719393, "percentage": 25.56, "elapsed_time": "1:11:32", "remaining_time": "3:28:23", "throughput": 2304.87, "total_tokens": 9894280} {"current_steps": 17165, "total_steps": 67140, "loss": 0.7007, "lr": 4.640014190925505e-05, "epoch": 2.5565981531128985, "percentage": 25.57, "elapsed_time": "1:11:33", "remaining_time": "3:28:21", "throughput": 2304.92, "total_tokens": 9897032} {"current_steps": 17170, "total_steps": 67140, "loss": 0.6935, "lr": 4.639678150265567e-05, "epoch": 2.5573428656538577, "percentage": 25.57, "elapsed_time": "1:11:35", "remaining_time": "3:28:19", "throughput": 2305.06, "total_tokens": 9900392} {"current_steps": 17175, "total_steps": 67140, "loss": 0.6511, "lr": 4.639341965014879e-05, "epoch": 2.558087578194817, "percentage": 25.58, "elapsed_time": "1:11:36", "remaining_time": "3:28:18", "throughput": 2305.14, "total_tokens": 9903432} {"current_steps": 17180, "total_steps": 67140, "loss": 0.6134, "lr": 4.63900563519616e-05, "epoch": 2.558832290735776, "percentage": 25.59, "elapsed_time": "1:11:37", "remaining_time": "3:28:16", "throughput": 2305.2, "total_tokens": 9906280} {"current_steps": 17185, "total_steps": 67140, "loss": 0.5683, "lr": 4.638669160832136e-05, "epoch": 2.5595770032767353, "percentage": 25.6, "elapsed_time": "1:11:38", "remaining_time": "3:28:15", "throughput": 2305.24, "total_tokens": 9909000} {"current_steps": 17190, "total_steps": 67140, "loss": 0.6657, "lr": 4.638332541945546e-05, "epoch": 2.5603217158176945, "percentage": 25.6, "elapsed_time": "1:11:39", "remaining_time": "3:28:13", "throughput": 2305.31, "total_tokens": 9911880} {"current_steps": 17195, "total_steps": 67140, "loss": 0.6564, "lr": 4.6379957785591355e-05, "epoch": 2.5610664283586537, "percentage": 25.61, "elapsed_time": "1:11:40", "remaining_time": "3:28:12", "throughput": 2305.38, "total_tokens": 9914856} {"current_steps": 17200, "total_steps": 67140, "loss": 0.5661, "lr": 4.6376588706956635e-05, "epoch": 2.5618111408996125, "percentage": 25.62, "elapsed_time": "1:11:41", "remaining_time": "3:28:10", "throughput": 2305.4, "total_tokens": 9917480} {"current_steps": 17205, "total_steps": 67140, "loss": 0.5941, "lr": 4.637321818377896e-05, "epoch": 2.562555853440572, "percentage": 25.63, "elapsed_time": "1:11:43", "remaining_time": "3:28:08", "throughput": 2305.5, "total_tokens": 9920584} {"current_steps": 17210, "total_steps": 67140, "loss": 0.6037, "lr": 4.636984621628609e-05, "epoch": 2.563300565981531, "percentage": 25.63, "elapsed_time": "1:11:44", "remaining_time": "3:28:07", "throughput": 2305.58, "total_tokens": 9923560} {"current_steps": 17215, "total_steps": 67140, "loss": 0.6485, "lr": 4.6366472804705905e-05, "epoch": 2.5640452785224905, "percentage": 25.64, "elapsed_time": "1:11:45", "remaining_time": "3:28:05", "throughput": 2305.65, "total_tokens": 9926472} {"current_steps": 17220, "total_steps": 67140, "loss": 0.6005, "lr": 4.636309794926636e-05, "epoch": 2.5647899910634493, "percentage": 25.65, "elapsed_time": "1:11:46", "remaining_time": "3:28:04", "throughput": 2305.7, "total_tokens": 9929320} {"current_steps": 17225, "total_steps": 67140, "loss": 0.6491, "lr": 4.635972165019551e-05, "epoch": 2.565534703604409, "percentage": 25.66, "elapsed_time": "1:11:47", "remaining_time": "3:28:02", "throughput": 2305.73, "total_tokens": 9932040} {"current_steps": 17230, "total_steps": 67140, "loss": 0.6882, "lr": 4.635634390772151e-05, "epoch": 2.5662794161453677, "percentage": 25.66, "elapsed_time": "1:11:48", "remaining_time": "3:28:00", "throughput": 2305.76, "total_tokens": 9934696} {"current_steps": 17235, "total_steps": 67140, "loss": 0.5676, "lr": 4.635296472207262e-05, "epoch": 2.5670241286863273, "percentage": 25.67, "elapsed_time": "1:11:49", "remaining_time": "3:27:59", "throughput": 2305.8, "total_tokens": 9937416} {"current_steps": 17240, "total_steps": 67140, "loss": 0.7157, "lr": 4.6349584093477184e-05, "epoch": 2.567768841227286, "percentage": 25.68, "elapsed_time": "1:11:50", "remaining_time": "3:27:57", "throughput": 2305.85, "total_tokens": 9940232} {"current_steps": 17245, "total_steps": 67140, "loss": 0.5812, "lr": 4.634620202216366e-05, "epoch": 2.5685135537682453, "percentage": 25.69, "elapsed_time": "1:11:51", "remaining_time": "3:27:55", "throughput": 2305.87, "total_tokens": 9942824} {"current_steps": 17250, "total_steps": 67140, "loss": 0.6532, "lr": 4.6342818508360595e-05, "epoch": 2.5692582663092045, "percentage": 25.69, "elapsed_time": "1:11:53", "remaining_time": "3:27:54", "throughput": 2305.93, "total_tokens": 9945736} {"current_steps": 17255, "total_steps": 67140, "loss": 0.5925, "lr": 4.633943355229662e-05, "epoch": 2.5700029788501637, "percentage": 25.7, "elapsed_time": "1:11:54", "remaining_time": "3:27:52", "throughput": 2305.99, "total_tokens": 9948616} {"current_steps": 17260, "total_steps": 67140, "loss": 0.7771, "lr": 4.633604715420049e-05, "epoch": 2.570747691391123, "percentage": 25.71, "elapsed_time": "1:11:55", "remaining_time": "3:27:51", "throughput": 2306.08, "total_tokens": 9951752} {"current_steps": 17265, "total_steps": 67140, "loss": 0.6253, "lr": 4.6332659314301034e-05, "epoch": 2.571492403932082, "percentage": 25.71, "elapsed_time": "1:11:56", "remaining_time": "3:27:49", "throughput": 2306.17, "total_tokens": 9954728} {"current_steps": 17270, "total_steps": 67140, "loss": 0.6438, "lr": 4.63292700328272e-05, "epoch": 2.5722371164730413, "percentage": 25.72, "elapsed_time": "1:11:57", "remaining_time": "3:27:48", "throughput": 2306.27, "total_tokens": 9957896} {"current_steps": 17275, "total_steps": 67140, "loss": 0.8543, "lr": 4.632587931000801e-05, "epoch": 2.5729818290140005, "percentage": 25.73, "elapsed_time": "1:11:58", "remaining_time": "3:27:46", "throughput": 2306.37, "total_tokens": 9961064} {"current_steps": 17280, "total_steps": 67140, "loss": 0.6037, "lr": 4.6322487146072614e-05, "epoch": 2.5737265415549597, "percentage": 25.74, "elapsed_time": "1:12:00", "remaining_time": "3:27:45", "throughput": 2306.46, "total_tokens": 9964104} {"current_steps": 17285, "total_steps": 67140, "loss": 0.6527, "lr": 4.6319093541250214e-05, "epoch": 2.574471254095919, "percentage": 25.74, "elapsed_time": "1:12:01", "remaining_time": "3:27:43", "throughput": 2306.52, "total_tokens": 9966984} {"current_steps": 17290, "total_steps": 67140, "loss": 0.6787, "lr": 4.6315698495770155e-05, "epoch": 2.575215966636878, "percentage": 25.75, "elapsed_time": "1:12:02", "remaining_time": "3:27:42", "throughput": 2306.6, "total_tokens": 9970056} {"current_steps": 17295, "total_steps": 67140, "loss": 0.7442, "lr": 4.6312302009861855e-05, "epoch": 2.5759606791778373, "percentage": 25.76, "elapsed_time": "1:12:03", "remaining_time": "3:27:40", "throughput": 2306.69, "total_tokens": 9973096} {"current_steps": 17300, "total_steps": 67140, "loss": 0.5681, "lr": 4.630890408375483e-05, "epoch": 2.5767053917187965, "percentage": 25.77, "elapsed_time": "1:12:04", "remaining_time": "3:27:39", "throughput": 2306.76, "total_tokens": 9976040} {"current_steps": 17305, "total_steps": 67140, "loss": 0.8508, "lr": 4.630550471767871e-05, "epoch": 2.5774501042597557, "percentage": 25.77, "elapsed_time": "1:12:05", "remaining_time": "3:27:37", "throughput": 2306.86, "total_tokens": 9979240} {"current_steps": 17310, "total_steps": 67140, "loss": 0.6897, "lr": 4.6302103911863196e-05, "epoch": 2.578194816800715, "percentage": 25.78, "elapsed_time": "1:12:07", "remaining_time": "3:27:36", "throughput": 2306.93, "total_tokens": 9982152} {"current_steps": 17315, "total_steps": 67140, "loss": 0.6098, "lr": 4.6298701666538114e-05, "epoch": 2.578939529341674, "percentage": 25.79, "elapsed_time": "1:12:08", "remaining_time": "3:27:34", "throughput": 2306.98, "total_tokens": 9985000} {"current_steps": 17320, "total_steps": 67140, "loss": 0.7139, "lr": 4.629529798193336e-05, "epoch": 2.5796842418826333, "percentage": 25.8, "elapsed_time": "1:12:09", "remaining_time": "3:27:32", "throughput": 2307.04, "total_tokens": 9987880} {"current_steps": 17325, "total_steps": 67140, "loss": 0.6591, "lr": 4.629189285827895e-05, "epoch": 2.5804289544235925, "percentage": 25.8, "elapsed_time": "1:12:10", "remaining_time": "3:27:31", "throughput": 2307.12, "total_tokens": 9990888} {"current_steps": 17330, "total_steps": 67140, "loss": 0.6302, "lr": 4.6288486295805e-05, "epoch": 2.5811736669645517, "percentage": 25.81, "elapsed_time": "1:12:11", "remaining_time": "3:27:29", "throughput": 2307.16, "total_tokens": 9993544} {"current_steps": 17335, "total_steps": 67140, "loss": 0.6037, "lr": 4.628507829474168e-05, "epoch": 2.581918379505511, "percentage": 25.82, "elapsed_time": "1:12:12", "remaining_time": "3:27:28", "throughput": 2307.24, "total_tokens": 9996584} {"current_steps": 17340, "total_steps": 67140, "loss": 0.582, "lr": 4.628166885531932e-05, "epoch": 2.58266309204647, "percentage": 25.83, "elapsed_time": "1:12:13", "remaining_time": "3:27:26", "throughput": 2307.28, "total_tokens": 9999336} {"current_steps": 17345, "total_steps": 67140, "loss": 0.5724, "lr": 4.6278257977768305e-05, "epoch": 2.5834078045874294, "percentage": 25.83, "elapsed_time": "1:12:14", "remaining_time": "3:27:25", "throughput": 2307.34, "total_tokens": 10002184} {"current_steps": 17350, "total_steps": 67140, "loss": 0.5368, "lr": 4.627484566231912e-05, "epoch": 2.5841525171283886, "percentage": 25.84, "elapsed_time": "1:12:16", "remaining_time": "3:27:23", "throughput": 2307.4, "total_tokens": 10005096} {"current_steps": 17355, "total_steps": 67140, "loss": 0.5559, "lr": 4.627143190920237e-05, "epoch": 2.5848972296693478, "percentage": 25.85, "elapsed_time": "1:12:17", "remaining_time": "3:27:21", "throughput": 2307.48, "total_tokens": 10008104} {"current_steps": 17360, "total_steps": 67140, "loss": 0.6635, "lr": 4.626801671864872e-05, "epoch": 2.585641942210307, "percentage": 25.86, "elapsed_time": "1:12:18", "remaining_time": "3:27:20", "throughput": 2307.51, "total_tokens": 10010792} {"current_steps": 17365, "total_steps": 67140, "loss": 0.7799, "lr": 4.6264600090888984e-05, "epoch": 2.586386654751266, "percentage": 25.86, "elapsed_time": "1:12:19", "remaining_time": "3:27:18", "throughput": 2307.58, "total_tokens": 10013768} {"current_steps": 17370, "total_steps": 67140, "loss": 0.7563, "lr": 4.626118202615403e-05, "epoch": 2.5871313672922254, "percentage": 25.87, "elapsed_time": "1:12:20", "remaining_time": "3:27:17", "throughput": 2307.61, "total_tokens": 10016488} {"current_steps": 17375, "total_steps": 67140, "loss": 0.8006, "lr": 4.6257762524674826e-05, "epoch": 2.587876079833184, "percentage": 25.88, "elapsed_time": "1:12:21", "remaining_time": "3:27:15", "throughput": 2307.68, "total_tokens": 10019432} {"current_steps": 17380, "total_steps": 67140, "loss": 0.6808, "lr": 4.625434158668246e-05, "epoch": 2.5886207923741438, "percentage": 25.89, "elapsed_time": "1:12:22", "remaining_time": "3:27:13", "throughput": 2307.73, "total_tokens": 10022216} {"current_steps": 17385, "total_steps": 67140, "loss": 0.8279, "lr": 4.625091921240811e-05, "epoch": 2.5893655049151025, "percentage": 25.89, "elapsed_time": "1:12:24", "remaining_time": "3:27:12", "throughput": 2307.79, "total_tokens": 10025096} {"current_steps": 17390, "total_steps": 67140, "loss": 0.5909, "lr": 4.624749540208304e-05, "epoch": 2.590110217456062, "percentage": 25.9, "elapsed_time": "1:12:25", "remaining_time": "3:27:10", "throughput": 2307.87, "total_tokens": 10028136} {"current_steps": 17395, "total_steps": 67140, "loss": 0.7309, "lr": 4.6244070155938614e-05, "epoch": 2.590854929997021, "percentage": 25.91, "elapsed_time": "1:12:26", "remaining_time": "3:27:09", "throughput": 2307.92, "total_tokens": 10030888} {"current_steps": 17400, "total_steps": 67140, "loss": 0.7829, "lr": 4.624064347420629e-05, "epoch": 2.5915996425379806, "percentage": 25.92, "elapsed_time": "1:12:27", "remaining_time": "3:27:07", "throughput": 2307.95, "total_tokens": 10033576} {"current_steps": 17405, "total_steps": 67140, "loss": 0.6834, "lr": 4.623721535711765e-05, "epoch": 2.5923443550789393, "percentage": 25.92, "elapsed_time": "1:12:28", "remaining_time": "3:27:06", "throughput": 2308.01, "total_tokens": 10036520} {"current_steps": 17410, "total_steps": 67140, "loss": 0.8289, "lr": 4.623378580490434e-05, "epoch": 2.593089067619899, "percentage": 25.93, "elapsed_time": "1:12:29", "remaining_time": "3:27:04", "throughput": 2308.06, "total_tokens": 10039368} {"current_steps": 17415, "total_steps": 67140, "loss": 0.6588, "lr": 4.6230354817798104e-05, "epoch": 2.5938337801608577, "percentage": 25.94, "elapsed_time": "1:12:30", "remaining_time": "3:27:02", "throughput": 2308.12, "total_tokens": 10042216} {"current_steps": 17420, "total_steps": 67140, "loss": 0.5983, "lr": 4.622692239603082e-05, "epoch": 2.594578492701817, "percentage": 25.95, "elapsed_time": "1:12:31", "remaining_time": "3:27:01", "throughput": 2308.22, "total_tokens": 10045352} {"current_steps": 17425, "total_steps": 67140, "loss": 0.7545, "lr": 4.6223488539834415e-05, "epoch": 2.595323205242776, "percentage": 25.95, "elapsed_time": "1:12:33", "remaining_time": "3:26:59", "throughput": 2308.29, "total_tokens": 10048296} {"current_steps": 17430, "total_steps": 67140, "loss": 0.7119, "lr": 4.622005324944095e-05, "epoch": 2.5960679177837354, "percentage": 25.96, "elapsed_time": "1:12:34", "remaining_time": "3:26:58", "throughput": 2308.41, "total_tokens": 10051560} {"current_steps": 17435, "total_steps": 67140, "loss": 0.7179, "lr": 4.621661652508255e-05, "epoch": 2.5968126303246946, "percentage": 25.97, "elapsed_time": "1:12:35", "remaining_time": "3:26:56", "throughput": 2308.48, "total_tokens": 10054504} {"current_steps": 17440, "total_steps": 67140, "loss": 0.7993, "lr": 4.621317836699147e-05, "epoch": 2.5975573428656538, "percentage": 25.98, "elapsed_time": "1:12:36", "remaining_time": "3:26:55", "throughput": 2308.6, "total_tokens": 10057800} {"current_steps": 17445, "total_steps": 67140, "loss": 0.7161, "lr": 4.6209738775400045e-05, "epoch": 2.598302055406613, "percentage": 25.98, "elapsed_time": "1:12:37", "remaining_time": "3:26:53", "throughput": 2308.65, "total_tokens": 10060616} {"current_steps": 17450, "total_steps": 67140, "loss": 0.6857, "lr": 4.6206297750540706e-05, "epoch": 2.599046767947572, "percentage": 25.99, "elapsed_time": "1:12:38", "remaining_time": "3:26:52", "throughput": 2308.71, "total_tokens": 10063464} {"current_steps": 17455, "total_steps": 67140, "loss": 0.5574, "lr": 4.620285529264599e-05, "epoch": 2.5997914804885314, "percentage": 26.0, "elapsed_time": "1:12:40", "remaining_time": "3:26:50", "throughput": 2308.74, "total_tokens": 10066184} {"current_steps": 17460, "total_steps": 67140, "loss": 0.7752, "lr": 4.619941140194851e-05, "epoch": 2.6005361930294906, "percentage": 26.01, "elapsed_time": "1:12:41", "remaining_time": "3:26:49", "throughput": 2308.8, "total_tokens": 10069096} {"current_steps": 17465, "total_steps": 67140, "loss": 0.6389, "lr": 4.6195966078680995e-05, "epoch": 2.6012809055704498, "percentage": 26.01, "elapsed_time": "1:12:42", "remaining_time": "3:26:47", "throughput": 2308.86, "total_tokens": 10071976} {"current_steps": 17470, "total_steps": 67140, "loss": 0.5883, "lr": 4.619251932307627e-05, "epoch": 2.602025618111409, "percentage": 26.02, "elapsed_time": "1:12:43", "remaining_time": "3:26:45", "throughput": 2308.87, "total_tokens": 10074536} {"current_steps": 17475, "total_steps": 67140, "loss": 0.7063, "lr": 4.618907113536726e-05, "epoch": 2.602770330652368, "percentage": 26.03, "elapsed_time": "1:12:44", "remaining_time": "3:26:44", "throughput": 2308.91, "total_tokens": 10077320} {"current_steps": 17480, "total_steps": 67140, "loss": 0.6477, "lr": 4.618562151578696e-05, "epoch": 2.6035150431933274, "percentage": 26.04, "elapsed_time": "1:12:45", "remaining_time": "3:26:42", "throughput": 2308.97, "total_tokens": 10080136} {"current_steps": 17485, "total_steps": 67140, "loss": 0.7011, "lr": 4.61821704645685e-05, "epoch": 2.6042597557342866, "percentage": 26.04, "elapsed_time": "1:12:46", "remaining_time": "3:26:41", "throughput": 2309.06, "total_tokens": 10083208} {"current_steps": 17490, "total_steps": 67140, "loss": 0.5879, "lr": 4.6178717981945074e-05, "epoch": 2.605004468275246, "percentage": 26.05, "elapsed_time": "1:12:47", "remaining_time": "3:26:39", "throughput": 2309.13, "total_tokens": 10086152} {"current_steps": 17495, "total_steps": 67140, "loss": 0.5943, "lr": 4.617526406815e-05, "epoch": 2.605749180816205, "percentage": 26.06, "elapsed_time": "1:12:49", "remaining_time": "3:26:38", "throughput": 2309.19, "total_tokens": 10089096} {"current_steps": 17500, "total_steps": 67140, "loss": 0.6304, "lr": 4.617180872341667e-05, "epoch": 2.606493893357164, "percentage": 26.06, "elapsed_time": "1:12:50", "remaining_time": "3:26:36", "throughput": 2309.24, "total_tokens": 10091912} {"current_steps": 17505, "total_steps": 67140, "loss": 0.7192, "lr": 4.616835194797858e-05, "epoch": 2.6072386058981234, "percentage": 26.07, "elapsed_time": "1:12:51", "remaining_time": "3:26:34", "throughput": 2309.31, "total_tokens": 10094856} {"current_steps": 17510, "total_steps": 67140, "loss": 0.7367, "lr": 4.616489374206934e-05, "epoch": 2.6079833184390826, "percentage": 26.08, "elapsed_time": "1:12:52", "remaining_time": "3:26:33", "throughput": 2309.36, "total_tokens": 10097672} {"current_steps": 17515, "total_steps": 67140, "loss": 0.6974, "lr": 4.6161434105922616e-05, "epoch": 2.608728030980042, "percentage": 26.09, "elapsed_time": "1:12:53", "remaining_time": "3:26:31", "throughput": 2309.38, "total_tokens": 10100328} {"current_steps": 17520, "total_steps": 67140, "loss": 0.5563, "lr": 4.615797303977223e-05, "epoch": 2.609472743521001, "percentage": 26.09, "elapsed_time": "1:12:54", "remaining_time": "3:26:30", "throughput": 2309.41, "total_tokens": 10103016} {"current_steps": 17525, "total_steps": 67140, "loss": 0.751, "lr": 4.615451054385204e-05, "epoch": 2.61021745606196, "percentage": 26.1, "elapsed_time": "1:12:55", "remaining_time": "3:26:28", "throughput": 2309.49, "total_tokens": 10105960} {"current_steps": 17530, "total_steps": 67140, "loss": 0.6572, "lr": 4.615104661839603e-05, "epoch": 2.6109621686029194, "percentage": 26.11, "elapsed_time": "1:12:56", "remaining_time": "3:26:26", "throughput": 2309.53, "total_tokens": 10108712} {"current_steps": 17535, "total_steps": 67140, "loss": 0.5526, "lr": 4.6147581263638286e-05, "epoch": 2.6117068811438786, "percentage": 26.12, "elapsed_time": "1:12:58", "remaining_time": "3:26:25", "throughput": 2309.57, "total_tokens": 10111528} {"current_steps": 17540, "total_steps": 67140, "loss": 0.6077, "lr": 4.614411447981298e-05, "epoch": 2.612451593684838, "percentage": 26.12, "elapsed_time": "1:12:59", "remaining_time": "3:26:23", "throughput": 2309.62, "total_tokens": 10114312} {"current_steps": 17545, "total_steps": 67140, "loss": 0.6754, "lr": 4.6140646267154384e-05, "epoch": 2.613196306225797, "percentage": 26.13, "elapsed_time": "1:13:00", "remaining_time": "3:26:22", "throughput": 2309.68, "total_tokens": 10117224} {"current_steps": 17550, "total_steps": 67140, "loss": 0.5067, "lr": 4.613717662589687e-05, "epoch": 2.6139410187667558, "percentage": 26.14, "elapsed_time": "1:13:01", "remaining_time": "3:26:20", "throughput": 2309.72, "total_tokens": 10119912} {"current_steps": 17555, "total_steps": 67140, "loss": 0.7656, "lr": 4.613370555627489e-05, "epoch": 2.6146857313077154, "percentage": 26.15, "elapsed_time": "1:13:02", "remaining_time": "3:26:18", "throughput": 2309.81, "total_tokens": 10123016} {"current_steps": 17560, "total_steps": 67140, "loss": 0.6377, "lr": 4.6130233058523015e-05, "epoch": 2.615430443848674, "percentage": 26.15, "elapsed_time": "1:13:03", "remaining_time": "3:26:17", "throughput": 2309.85, "total_tokens": 10125800} {"current_steps": 17565, "total_steps": 67140, "loss": 0.6473, "lr": 4.6126759132875896e-05, "epoch": 2.616175156389634, "percentage": 26.16, "elapsed_time": "1:13:04", "remaining_time": "3:26:15", "throughput": 2309.86, "total_tokens": 10128392} {"current_steps": 17570, "total_steps": 67140, "loss": 0.6268, "lr": 4.612328377956829e-05, "epoch": 2.6169198689305926, "percentage": 26.17, "elapsed_time": "1:13:05", "remaining_time": "3:26:13", "throughput": 2309.86, "total_tokens": 10130856} {"current_steps": 17575, "total_steps": 67140, "loss": 0.6064, "lr": 4.6119806998835056e-05, "epoch": 2.6176645814715522, "percentage": 26.18, "elapsed_time": "1:13:07", "remaining_time": "3:26:12", "throughput": 2309.89, "total_tokens": 10133512} {"current_steps": 17580, "total_steps": 67140, "loss": 0.7625, "lr": 4.611632879091112e-05, "epoch": 2.618409294012511, "percentage": 26.18, "elapsed_time": "1:13:08", "remaining_time": "3:26:10", "throughput": 2309.94, "total_tokens": 10136392} {"current_steps": 17585, "total_steps": 67140, "loss": 0.5343, "lr": 4.6112849156031544e-05, "epoch": 2.6191540065534706, "percentage": 26.19, "elapsed_time": "1:13:09", "remaining_time": "3:26:09", "throughput": 2309.96, "total_tokens": 10138984} {"current_steps": 17590, "total_steps": 67140, "loss": 0.7283, "lr": 4.610936809443146e-05, "epoch": 2.6198987190944294, "percentage": 26.2, "elapsed_time": "1:13:10", "remaining_time": "3:26:07", "throughput": 2310.01, "total_tokens": 10141800} {"current_steps": 17595, "total_steps": 67140, "loss": 0.6381, "lr": 4.610588560634611e-05, "epoch": 2.6206434316353886, "percentage": 26.21, "elapsed_time": "1:13:11", "remaining_time": "3:26:05", "throughput": 2310.02, "total_tokens": 10144360} {"current_steps": 17600, "total_steps": 67140, "loss": 0.7025, "lr": 4.610240169201081e-05, "epoch": 2.621388144176348, "percentage": 26.21, "elapsed_time": "1:13:12", "remaining_time": "3:26:04", "throughput": 2310.05, "total_tokens": 10147080} {"current_steps": 17605, "total_steps": 67140, "loss": 0.7131, "lr": 4.6098916351661006e-05, "epoch": 2.622132856717307, "percentage": 26.22, "elapsed_time": "1:13:13", "remaining_time": "3:26:02", "throughput": 2310.14, "total_tokens": 10150120} {"current_steps": 17610, "total_steps": 67140, "loss": 0.7084, "lr": 4.609542958553221e-05, "epoch": 2.622877569258266, "percentage": 26.23, "elapsed_time": "1:13:14", "remaining_time": "3:26:00", "throughput": 2310.16, "total_tokens": 10152744} {"current_steps": 17615, "total_steps": 67140, "loss": 0.7597, "lr": 4.609194139386006e-05, "epoch": 2.6236222817992254, "percentage": 26.24, "elapsed_time": "1:13:15", "remaining_time": "3:25:59", "throughput": 2310.2, "total_tokens": 10155464} {"current_steps": 17620, "total_steps": 67140, "loss": 0.4726, "lr": 4.608845177688026e-05, "epoch": 2.6243669943401846, "percentage": 26.24, "elapsed_time": "1:13:17", "remaining_time": "3:25:57", "throughput": 2310.24, "total_tokens": 10158248} {"current_steps": 17625, "total_steps": 67140, "loss": 0.6825, "lr": 4.608496073482863e-05, "epoch": 2.625111706881144, "percentage": 26.25, "elapsed_time": "1:13:18", "remaining_time": "3:25:56", "throughput": 2310.28, "total_tokens": 10161000} {"current_steps": 17630, "total_steps": 67140, "loss": 0.5672, "lr": 4.608146826794107e-05, "epoch": 2.625856419422103, "percentage": 26.26, "elapsed_time": "1:13:19", "remaining_time": "3:25:54", "throughput": 2310.35, "total_tokens": 10163912} {"current_steps": 17635, "total_steps": 67140, "loss": 0.5408, "lr": 4.607797437645361e-05, "epoch": 2.626601131963062, "percentage": 26.27, "elapsed_time": "1:13:20", "remaining_time": "3:25:52", "throughput": 2310.39, "total_tokens": 10166632} {"current_steps": 17640, "total_steps": 67140, "loss": 0.6417, "lr": 4.607447906060233e-05, "epoch": 2.6273458445040214, "percentage": 26.27, "elapsed_time": "1:13:21", "remaining_time": "3:25:51", "throughput": 2310.52, "total_tokens": 10170024} {"current_steps": 17645, "total_steps": 67140, "loss": 0.51, "lr": 4.607098232062344e-05, "epoch": 2.6280905570449806, "percentage": 26.28, "elapsed_time": "1:13:22", "remaining_time": "3:25:49", "throughput": 2310.56, "total_tokens": 10172808} {"current_steps": 17650, "total_steps": 67140, "loss": 0.6444, "lr": 4.6067484156753234e-05, "epoch": 2.62883526958594, "percentage": 26.29, "elapsed_time": "1:13:23", "remaining_time": "3:25:48", "throughput": 2310.68, "total_tokens": 10176072} {"current_steps": 17655, "total_steps": 67140, "loss": 0.7282, "lr": 4.6063984569228103e-05, "epoch": 2.629579982126899, "percentage": 26.3, "elapsed_time": "1:13:25", "remaining_time": "3:25:46", "throughput": 2310.73, "total_tokens": 10178920} {"current_steps": 17660, "total_steps": 67140, "loss": 0.8127, "lr": 4.606048355828453e-05, "epoch": 2.6303246946678582, "percentage": 26.3, "elapsed_time": "1:13:26", "remaining_time": "3:25:45", "throughput": 2310.87, "total_tokens": 10182408} {"current_steps": 17665, "total_steps": 67140, "loss": 0.6402, "lr": 4.6056981124159104e-05, "epoch": 2.6310694072088174, "percentage": 26.31, "elapsed_time": "1:13:27", "remaining_time": "3:25:44", "throughput": 2310.92, "total_tokens": 10185256} {"current_steps": 17670, "total_steps": 67140, "loss": 0.7727, "lr": 4.605347726708851e-05, "epoch": 2.6318141197497766, "percentage": 26.32, "elapsed_time": "1:13:28", "remaining_time": "3:25:42", "throughput": 2310.99, "total_tokens": 10188232} {"current_steps": 17675, "total_steps": 67140, "loss": 0.7643, "lr": 4.604997198730951e-05, "epoch": 2.632558832290736, "percentage": 26.33, "elapsed_time": "1:13:29", "remaining_time": "3:25:41", "throughput": 2311.07, "total_tokens": 10191272} {"current_steps": 17680, "total_steps": 67140, "loss": 0.9372, "lr": 4.6046465285058996e-05, "epoch": 2.633303544831695, "percentage": 26.33, "elapsed_time": "1:13:30", "remaining_time": "3:25:39", "throughput": 2311.13, "total_tokens": 10194088} {"current_steps": 17685, "total_steps": 67140, "loss": 0.6386, "lr": 4.604295716057393e-05, "epoch": 2.6340482573726542, "percentage": 26.34, "elapsed_time": "1:13:31", "remaining_time": "3:25:37", "throughput": 2311.17, "total_tokens": 10196840} {"current_steps": 17690, "total_steps": 67140, "loss": 0.6039, "lr": 4.6039447614091365e-05, "epoch": 2.6347929699136134, "percentage": 26.35, "elapsed_time": "1:13:33", "remaining_time": "3:25:36", "throughput": 2311.23, "total_tokens": 10199720} {"current_steps": 17695, "total_steps": 67140, "loss": 0.6248, "lr": 4.6035936645848476e-05, "epoch": 2.6355376824545726, "percentage": 26.36, "elapsed_time": "1:13:34", "remaining_time": "3:25:34", "throughput": 2311.32, "total_tokens": 10202760} {"current_steps": 17700, "total_steps": 67140, "loss": 0.7281, "lr": 4.6032424256082504e-05, "epoch": 2.636282394995532, "percentage": 26.36, "elapsed_time": "1:13:35", "remaining_time": "3:25:33", "throughput": 2311.41, "total_tokens": 10205896} {"current_steps": 17705, "total_steps": 67140, "loss": 0.7972, "lr": 4.602891044503083e-05, "epoch": 2.637027107536491, "percentage": 26.37, "elapsed_time": "1:13:36", "remaining_time": "3:25:31", "throughput": 2311.48, "total_tokens": 10208808} {"current_steps": 17710, "total_steps": 67140, "loss": 0.6337, "lr": 4.6025395212930864e-05, "epoch": 2.6377718200774503, "percentage": 26.38, "elapsed_time": "1:13:37", "remaining_time": "3:25:30", "throughput": 2311.57, "total_tokens": 10211944} {"current_steps": 17715, "total_steps": 67140, "loss": 0.5812, "lr": 4.602187856002019e-05, "epoch": 2.6385165326184095, "percentage": 26.39, "elapsed_time": "1:13:38", "remaining_time": "3:25:28", "throughput": 2311.61, "total_tokens": 10214728} {"current_steps": 17720, "total_steps": 67140, "loss": 0.5814, "lr": 4.601836048653642e-05, "epoch": 2.6392612451593687, "percentage": 26.39, "elapsed_time": "1:13:40", "remaining_time": "3:25:27", "throughput": 2311.68, "total_tokens": 10217640} {"current_steps": 17725, "total_steps": 67140, "loss": 0.6303, "lr": 4.601484099271731e-05, "epoch": 2.6400059577003274, "percentage": 26.4, "elapsed_time": "1:13:41", "remaining_time": "3:25:25", "throughput": 2311.73, "total_tokens": 10220456} {"current_steps": 17730, "total_steps": 67140, "loss": 0.7494, "lr": 4.601132007880068e-05, "epoch": 2.640750670241287, "percentage": 26.41, "elapsed_time": "1:13:42", "remaining_time": "3:25:24", "throughput": 2311.83, "total_tokens": 10223656} {"current_steps": 17735, "total_steps": 67140, "loss": 0.5154, "lr": 4.600779774502447e-05, "epoch": 2.641495382782246, "percentage": 26.41, "elapsed_time": "1:13:43", "remaining_time": "3:25:22", "throughput": 2311.9, "total_tokens": 10226600} {"current_steps": 17740, "total_steps": 67140, "loss": 0.6777, "lr": 4.60042739916267e-05, "epoch": 2.6422400953232055, "percentage": 26.42, "elapsed_time": "1:13:44", "remaining_time": "3:25:21", "throughput": 2312.0, "total_tokens": 10229768} {"current_steps": 17745, "total_steps": 67140, "loss": 0.5444, "lr": 4.600074881884549e-05, "epoch": 2.6429848078641642, "percentage": 26.43, "elapsed_time": "1:13:45", "remaining_time": "3:25:19", "throughput": 2312.06, "total_tokens": 10232648} {"current_steps": 17750, "total_steps": 67140, "loss": 0.6638, "lr": 4.599722222691906e-05, "epoch": 2.643729520405124, "percentage": 26.44, "elapsed_time": "1:13:46", "remaining_time": "3:25:18", "throughput": 2312.09, "total_tokens": 10235400} {"current_steps": 17755, "total_steps": 67140, "loss": 0.6295, "lr": 4.599369421608571e-05, "epoch": 2.6444742329460826, "percentage": 26.44, "elapsed_time": "1:13:48", "remaining_time": "3:25:16", "throughput": 2312.15, "total_tokens": 10238312} {"current_steps": 17760, "total_steps": 67140, "loss": 0.672, "lr": 4.5990164786583865e-05, "epoch": 2.645218945487042, "percentage": 26.45, "elapsed_time": "1:13:49", "remaining_time": "3:25:14", "throughput": 2312.22, "total_tokens": 10241160} {"current_steps": 17765, "total_steps": 67140, "loss": 0.6818, "lr": 4.598663393865203e-05, "epoch": 2.645963658028001, "percentage": 26.46, "elapsed_time": "1:13:50", "remaining_time": "3:25:13", "throughput": 2312.27, "total_tokens": 10244040} {"current_steps": 17770, "total_steps": 67140, "loss": 0.5792, "lr": 4.598310167252879e-05, "epoch": 2.6467083705689602, "percentage": 26.47, "elapsed_time": "1:13:51", "remaining_time": "3:25:11", "throughput": 2312.3, "total_tokens": 10246792} {"current_steps": 17775, "total_steps": 67140, "loss": 0.6851, "lr": 4.5979567988452856e-05, "epoch": 2.6474530831099194, "percentage": 26.47, "elapsed_time": "1:13:52", "remaining_time": "3:25:10", "throughput": 2312.38, "total_tokens": 10249864} {"current_steps": 17780, "total_steps": 67140, "loss": 0.5169, "lr": 4.597603288666301e-05, "epoch": 2.6481977956508786, "percentage": 26.48, "elapsed_time": "1:13:53", "remaining_time": "3:25:08", "throughput": 2312.47, "total_tokens": 10252936} {"current_steps": 17785, "total_steps": 67140, "loss": 0.4991, "lr": 4.597249636739815e-05, "epoch": 2.648942508191838, "percentage": 26.49, "elapsed_time": "1:13:54", "remaining_time": "3:25:07", "throughput": 2312.51, "total_tokens": 10255720} {"current_steps": 17790, "total_steps": 67140, "loss": 0.76, "lr": 4.5968958430897246e-05, "epoch": 2.649687220732797, "percentage": 26.5, "elapsed_time": "1:13:56", "remaining_time": "3:25:05", "throughput": 2312.62, "total_tokens": 10258952} {"current_steps": 17795, "total_steps": 67140, "loss": 0.7238, "lr": 4.596541907739939e-05, "epoch": 2.6504319332737563, "percentage": 26.5, "elapsed_time": "1:13:57", "remaining_time": "3:25:04", "throughput": 2312.68, "total_tokens": 10261864} {"current_steps": 17800, "total_steps": 67140, "loss": 0.8975, "lr": 4.5961878307143746e-05, "epoch": 2.6511766458147155, "percentage": 26.51, "elapsed_time": "1:13:58", "remaining_time": "3:25:02", "throughput": 2312.74, "total_tokens": 10264808} {"current_steps": 17805, "total_steps": 67140, "loss": 0.6006, "lr": 4.595833612036959e-05, "epoch": 2.6519213583556747, "percentage": 26.52, "elapsed_time": "1:13:59", "remaining_time": "3:25:01", "throughput": 2312.83, "total_tokens": 10267912} {"current_steps": 17810, "total_steps": 67140, "loss": 0.5429, "lr": 4.59547925173163e-05, "epoch": 2.652666070896634, "percentage": 26.53, "elapsed_time": "1:14:00", "remaining_time": "3:24:59", "throughput": 2312.91, "total_tokens": 10270888} {"current_steps": 17815, "total_steps": 67140, "loss": 0.5225, "lr": 4.595124749822332e-05, "epoch": 2.653410783437593, "percentage": 26.53, "elapsed_time": "1:14:01", "remaining_time": "3:24:58", "throughput": 2312.96, "total_tokens": 10273736} {"current_steps": 17820, "total_steps": 67140, "loss": 0.6855, "lr": 4.594770106333022e-05, "epoch": 2.6541554959785523, "percentage": 26.54, "elapsed_time": "1:14:02", "remaining_time": "3:24:56", "throughput": 2313.02, "total_tokens": 10276648} {"current_steps": 17825, "total_steps": 67140, "loss": 0.6313, "lr": 4.594415321287664e-05, "epoch": 2.6549002085195115, "percentage": 26.55, "elapsed_time": "1:14:04", "remaining_time": "3:24:55", "throughput": 2313.13, "total_tokens": 10279912} {"current_steps": 17830, "total_steps": 67140, "loss": 0.8666, "lr": 4.594060394710235e-05, "epoch": 2.6556449210604707, "percentage": 26.56, "elapsed_time": "1:14:05", "remaining_time": "3:24:53", "throughput": 2313.2, "total_tokens": 10282856} {"current_steps": 17835, "total_steps": 67140, "loss": 0.5743, "lr": 4.593705326624718e-05, "epoch": 2.65638963360143, "percentage": 26.56, "elapsed_time": "1:14:06", "remaining_time": "3:24:52", "throughput": 2313.24, "total_tokens": 10285640} {"current_steps": 17840, "total_steps": 67140, "loss": 0.7771, "lr": 4.593350117055107e-05, "epoch": 2.657134346142389, "percentage": 26.57, "elapsed_time": "1:14:07", "remaining_time": "3:24:50", "throughput": 2313.3, "total_tokens": 10288552} {"current_steps": 17845, "total_steps": 67140, "loss": 0.7768, "lr": 4.592994766025407e-05, "epoch": 2.6578790586833483, "percentage": 26.58, "elapsed_time": "1:14:08", "remaining_time": "3:24:49", "throughput": 2313.33, "total_tokens": 10291272} {"current_steps": 17850, "total_steps": 67140, "loss": 0.7371, "lr": 4.592639273559629e-05, "epoch": 2.6586237712243075, "percentage": 26.59, "elapsed_time": "1:14:09", "remaining_time": "3:24:47", "throughput": 2313.41, "total_tokens": 10294312} {"current_steps": 17855, "total_steps": 67140, "loss": 0.7335, "lr": 4.5922836396817973e-05, "epoch": 2.6593684837652667, "percentage": 26.59, "elapsed_time": "1:14:11", "remaining_time": "3:24:46", "throughput": 2313.52, "total_tokens": 10297576} {"current_steps": 17860, "total_steps": 67140, "loss": 0.5141, "lr": 4.591927864415944e-05, "epoch": 2.660113196306226, "percentage": 26.6, "elapsed_time": "1:14:12", "remaining_time": "3:24:44", "throughput": 2313.53, "total_tokens": 10300104} {"current_steps": 17865, "total_steps": 67140, "loss": 0.6959, "lr": 4.591571947786111e-05, "epoch": 2.660857908847185, "percentage": 26.61, "elapsed_time": "1:14:13", "remaining_time": "3:24:42", "throughput": 2313.6, "total_tokens": 10303080} {"current_steps": 17870, "total_steps": 67140, "loss": 0.7229, "lr": 4.591215889816349e-05, "epoch": 2.6616026213881443, "percentage": 26.62, "elapsed_time": "1:14:14", "remaining_time": "3:24:41", "throughput": 2313.63, "total_tokens": 10305832} {"current_steps": 17875, "total_steps": 67140, "loss": 0.7403, "lr": 4.59085969053072e-05, "epoch": 2.6623473339291035, "percentage": 26.62, "elapsed_time": "1:14:15", "remaining_time": "3:24:39", "throughput": 2313.63, "total_tokens": 10308360} {"current_steps": 17880, "total_steps": 67140, "loss": 0.6843, "lr": 4.5905033499532936e-05, "epoch": 2.6630920464700627, "percentage": 26.63, "elapsed_time": "1:14:16", "remaining_time": "3:24:38", "throughput": 2313.7, "total_tokens": 10311304} {"current_steps": 17885, "total_steps": 67140, "loss": 0.7637, "lr": 4.590146868108151e-05, "epoch": 2.663836759011022, "percentage": 26.64, "elapsed_time": "1:14:17", "remaining_time": "3:24:36", "throughput": 2313.72, "total_tokens": 10313928} {"current_steps": 17890, "total_steps": 67140, "loss": 0.71, "lr": 4.589790245019379e-05, "epoch": 2.6645814715519807, "percentage": 26.65, "elapsed_time": "1:14:18", "remaining_time": "3:24:35", "throughput": 2313.81, "total_tokens": 10317064} {"current_steps": 17895, "total_steps": 67140, "loss": 0.6136, "lr": 4.5894334807110806e-05, "epoch": 2.6653261840929403, "percentage": 26.65, "elapsed_time": "1:14:20", "remaining_time": "3:24:33", "throughput": 2313.85, "total_tokens": 10319816} {"current_steps": 17900, "total_steps": 67140, "loss": 0.6334, "lr": 4.589076575207362e-05, "epoch": 2.666070896633899, "percentage": 26.66, "elapsed_time": "1:14:21", "remaining_time": "3:24:31", "throughput": 2313.87, "total_tokens": 10322472} {"current_steps": 17905, "total_steps": 67140, "loss": 0.6077, "lr": 4.588719528532342e-05, "epoch": 2.6668156091748587, "percentage": 26.67, "elapsed_time": "1:14:22", "remaining_time": "3:24:30", "throughput": 2313.92, "total_tokens": 10325352} {"current_steps": 17910, "total_steps": 67140, "loss": 0.6298, "lr": 4.5883623407101475e-05, "epoch": 2.6675603217158175, "percentage": 26.68, "elapsed_time": "1:14:23", "remaining_time": "3:24:28", "throughput": 2314.04, "total_tokens": 10328584} {"current_steps": 17915, "total_steps": 67140, "loss": 0.5797, "lr": 4.5880050117649174e-05, "epoch": 2.668305034256777, "percentage": 26.68, "elapsed_time": "1:14:24", "remaining_time": "3:24:27", "throughput": 2314.07, "total_tokens": 10331304} {"current_steps": 17920, "total_steps": 67140, "loss": 0.6436, "lr": 4.5876475417207974e-05, "epoch": 2.669049746797736, "percentage": 26.69, "elapsed_time": "1:14:25", "remaining_time": "3:24:25", "throughput": 2314.13, "total_tokens": 10334248} {"current_steps": 17925, "total_steps": 67140, "loss": 0.6589, "lr": 4.5872899306019454e-05, "epoch": 2.6697944593386955, "percentage": 26.7, "elapsed_time": "1:14:26", "remaining_time": "3:24:24", "throughput": 2314.16, "total_tokens": 10336968} {"current_steps": 17930, "total_steps": 67140, "loss": 0.6202, "lr": 4.586932178432525e-05, "epoch": 2.6705391718796543, "percentage": 26.71, "elapsed_time": "1:14:27", "remaining_time": "3:24:22", "throughput": 2314.18, "total_tokens": 10339560} {"current_steps": 17935, "total_steps": 67140, "loss": 0.6133, "lr": 4.586574285236714e-05, "epoch": 2.6712838844206135, "percentage": 26.71, "elapsed_time": "1:14:29", "remaining_time": "3:24:20", "throughput": 2314.25, "total_tokens": 10342504} {"current_steps": 17940, "total_steps": 67140, "loss": 0.6373, "lr": 4.586216251038695e-05, "epoch": 2.6720285969615727, "percentage": 26.72, "elapsed_time": "1:14:30", "remaining_time": "3:24:19", "throughput": 2314.29, "total_tokens": 10345320} {"current_steps": 17945, "total_steps": 67140, "loss": 0.619, "lr": 4.585858075862665e-05, "epoch": 2.672773309502532, "percentage": 26.73, "elapsed_time": "1:14:31", "remaining_time": "3:24:17", "throughput": 2314.35, "total_tokens": 10348200} {"current_steps": 17950, "total_steps": 67140, "loss": 0.4838, "lr": 4.585499759732825e-05, "epoch": 2.673518022043491, "percentage": 26.74, "elapsed_time": "1:14:32", "remaining_time": "3:24:16", "throughput": 2314.44, "total_tokens": 10351304} {"current_steps": 17955, "total_steps": 67140, "loss": 0.6174, "lr": 4.585141302673392e-05, "epoch": 2.6742627345844503, "percentage": 26.74, "elapsed_time": "1:14:33", "remaining_time": "3:24:14", "throughput": 2314.48, "total_tokens": 10354024} {"current_steps": 17960, "total_steps": 67140, "loss": 0.7483, "lr": 4.584782704708587e-05, "epoch": 2.6750074471254095, "percentage": 26.75, "elapsed_time": "1:14:34", "remaining_time": "3:24:13", "throughput": 2314.61, "total_tokens": 10357448} {"current_steps": 17965, "total_steps": 67140, "loss": 0.695, "lr": 4.584423965862642e-05, "epoch": 2.6757521596663687, "percentage": 26.76, "elapsed_time": "1:14:35", "remaining_time": "3:24:11", "throughput": 2314.68, "total_tokens": 10360424} {"current_steps": 17970, "total_steps": 67140, "loss": 0.4903, "lr": 4.5840650861598e-05, "epoch": 2.676496872207328, "percentage": 26.76, "elapsed_time": "1:14:37", "remaining_time": "3:24:10", "throughput": 2314.77, "total_tokens": 10363464} {"current_steps": 17975, "total_steps": 67140, "loss": 0.6309, "lr": 4.583706065624314e-05, "epoch": 2.677241584748287, "percentage": 26.77, "elapsed_time": "1:14:38", "remaining_time": "3:24:08", "throughput": 2314.86, "total_tokens": 10366536} {"current_steps": 17980, "total_steps": 67140, "loss": 0.6964, "lr": 4.583346904280442e-05, "epoch": 2.6779862972892463, "percentage": 26.78, "elapsed_time": "1:14:39", "remaining_time": "3:24:07", "throughput": 2314.91, "total_tokens": 10369416} {"current_steps": 17985, "total_steps": 67140, "loss": 0.8247, "lr": 4.582987602152458e-05, "epoch": 2.6787310098302055, "percentage": 26.79, "elapsed_time": "1:14:40", "remaining_time": "3:24:05", "throughput": 2314.98, "total_tokens": 10372360} {"current_steps": 17990, "total_steps": 67140, "loss": 0.6419, "lr": 4.58262815926464e-05, "epoch": 2.6794757223711647, "percentage": 26.79, "elapsed_time": "1:14:41", "remaining_time": "3:24:04", "throughput": 2315.01, "total_tokens": 10375112} {"current_steps": 17995, "total_steps": 67140, "loss": 0.596, "lr": 4.5822685756412785e-05, "epoch": 2.680220434912124, "percentage": 26.8, "elapsed_time": "1:14:42", "remaining_time": "3:24:02", "throughput": 2315.08, "total_tokens": 10378088} {"current_steps": 18000, "total_steps": 67140, "loss": 0.5851, "lr": 4.5819088513066725e-05, "epoch": 2.680965147453083, "percentage": 26.81, "elapsed_time": "1:14:43", "remaining_time": "3:24:01", "throughput": 2315.13, "total_tokens": 10380904} {"current_steps": 18005, "total_steps": 67140, "loss": 0.6223, "lr": 4.581548986285131e-05, "epoch": 2.6817098599940423, "percentage": 26.82, "elapsed_time": "1:14:45", "remaining_time": "3:23:59", "throughput": 2315.17, "total_tokens": 10383624} {"current_steps": 18010, "total_steps": 67140, "loss": 0.5877, "lr": 4.5811889806009716e-05, "epoch": 2.6824545725350015, "percentage": 26.82, "elapsed_time": "1:14:46", "remaining_time": "3:23:58", "throughput": 2315.22, "total_tokens": 10386536} {"current_steps": 18015, "total_steps": 67140, "loss": 0.638, "lr": 4.580828834278523e-05, "epoch": 2.6831992850759607, "percentage": 26.83, "elapsed_time": "1:14:47", "remaining_time": "3:23:56", "throughput": 2315.28, "total_tokens": 10389448} {"current_steps": 18020, "total_steps": 67140, "loss": 0.6337, "lr": 4.580468547342121e-05, "epoch": 2.68394399761692, "percentage": 26.84, "elapsed_time": "1:14:48", "remaining_time": "3:23:54", "throughput": 2315.3, "total_tokens": 10392104} {"current_steps": 18025, "total_steps": 67140, "loss": 0.768, "lr": 4.5801081198161134e-05, "epoch": 2.684688710157879, "percentage": 26.85, "elapsed_time": "1:14:49", "remaining_time": "3:23:53", "throughput": 2315.35, "total_tokens": 10394920} {"current_steps": 18030, "total_steps": 67140, "loss": 0.6816, "lr": 4.5797475517248565e-05, "epoch": 2.6854334226988383, "percentage": 26.85, "elapsed_time": "1:14:50", "remaining_time": "3:23:51", "throughput": 2315.35, "total_tokens": 10397448} {"current_steps": 18035, "total_steps": 67140, "loss": 0.808, "lr": 4.579386843092715e-05, "epoch": 2.6861781352397975, "percentage": 26.86, "elapsed_time": "1:14:51", "remaining_time": "3:23:49", "throughput": 2315.34, "total_tokens": 10399880} {"current_steps": 18040, "total_steps": 67140, "loss": 0.5774, "lr": 4.579025993944065e-05, "epoch": 2.6869228477807567, "percentage": 26.87, "elapsed_time": "1:14:52", "remaining_time": "3:23:48", "throughput": 2315.37, "total_tokens": 10402568} {"current_steps": 18045, "total_steps": 67140, "loss": 0.735, "lr": 4.578665004303292e-05, "epoch": 2.687667560321716, "percentage": 26.88, "elapsed_time": "1:14:53", "remaining_time": "3:23:46", "throughput": 2315.42, "total_tokens": 10405384} {"current_steps": 18050, "total_steps": 67140, "loss": 0.7912, "lr": 4.578303874194789e-05, "epoch": 2.688412272862675, "percentage": 26.88, "elapsed_time": "1:14:55", "remaining_time": "3:23:45", "throughput": 2315.47, "total_tokens": 10408264} {"current_steps": 18055, "total_steps": 67140, "loss": 0.7603, "lr": 4.577942603642959e-05, "epoch": 2.6891569854036343, "percentage": 26.89, "elapsed_time": "1:14:56", "remaining_time": "3:23:43", "throughput": 2315.53, "total_tokens": 10411112} {"current_steps": 18060, "total_steps": 67140, "loss": 0.4269, "lr": 4.5775811926722166e-05, "epoch": 2.6899016979445936, "percentage": 26.9, "elapsed_time": "1:14:57", "remaining_time": "3:23:41", "throughput": 2315.56, "total_tokens": 10413800} {"current_steps": 18065, "total_steps": 67140, "loss": 0.7137, "lr": 4.577219641306984e-05, "epoch": 2.6906464104855523, "percentage": 26.91, "elapsed_time": "1:14:58", "remaining_time": "3:23:40", "throughput": 2315.58, "total_tokens": 10416456} {"current_steps": 18070, "total_steps": 67140, "loss": 0.631, "lr": 4.5768579495716935e-05, "epoch": 2.691391123026512, "percentage": 26.91, "elapsed_time": "1:14:59", "remaining_time": "3:23:38", "throughput": 2315.64, "total_tokens": 10419432} {"current_steps": 18075, "total_steps": 67140, "loss": 0.6162, "lr": 4.5764961174907865e-05, "epoch": 2.6921358355674707, "percentage": 26.92, "elapsed_time": "1:15:00", "remaining_time": "3:23:37", "throughput": 2315.74, "total_tokens": 10422568} {"current_steps": 18080, "total_steps": 67140, "loss": 0.6326, "lr": 4.576134145088715e-05, "epoch": 2.6928805481084304, "percentage": 26.93, "elapsed_time": "1:15:01", "remaining_time": "3:23:35", "throughput": 2315.76, "total_tokens": 10425192} {"current_steps": 18085, "total_steps": 67140, "loss": 0.6738, "lr": 4.575772032389938e-05, "epoch": 2.693625260649389, "percentage": 26.94, "elapsed_time": "1:15:02", "remaining_time": "3:23:34", "throughput": 2315.81, "total_tokens": 10428040} {"current_steps": 18090, "total_steps": 67140, "loss": 0.7877, "lr": 4.575409779418927e-05, "epoch": 2.6943699731903488, "percentage": 26.94, "elapsed_time": "1:15:04", "remaining_time": "3:23:32", "throughput": 2315.85, "total_tokens": 10430824} {"current_steps": 18095, "total_steps": 67140, "loss": 0.6212, "lr": 4.5750473862001606e-05, "epoch": 2.6951146857313075, "percentage": 26.95, "elapsed_time": "1:15:05", "remaining_time": "3:23:31", "throughput": 2315.9, "total_tokens": 10433608} {"current_steps": 18100, "total_steps": 67140, "loss": 0.6936, "lr": 4.5746848527581287e-05, "epoch": 2.695859398272267, "percentage": 26.96, "elapsed_time": "1:15:06", "remaining_time": "3:23:29", "throughput": 2315.93, "total_tokens": 10436392} {"current_steps": 18105, "total_steps": 67140, "loss": 0.7742, "lr": 4.5743221791173296e-05, "epoch": 2.696604110813226, "percentage": 26.97, "elapsed_time": "1:15:07", "remaining_time": "3:23:27", "throughput": 2315.97, "total_tokens": 10439080} {"current_steps": 18110, "total_steps": 67140, "loss": 0.7664, "lr": 4.573959365302272e-05, "epoch": 2.697348823354185, "percentage": 26.97, "elapsed_time": "1:15:08", "remaining_time": "3:23:26", "throughput": 2316.03, "total_tokens": 10442024} {"current_steps": 18115, "total_steps": 67140, "loss": 0.6361, "lr": 4.5735964113374715e-05, "epoch": 2.6980935358951443, "percentage": 26.98, "elapsed_time": "1:15:09", "remaining_time": "3:23:24", "throughput": 2316.06, "total_tokens": 10444744} {"current_steps": 18120, "total_steps": 67140, "loss": 0.5901, "lr": 4.573233317247456e-05, "epoch": 2.6988382484361035, "percentage": 26.99, "elapsed_time": "1:15:10", "remaining_time": "3:23:23", "throughput": 2316.12, "total_tokens": 10447624} {"current_steps": 18125, "total_steps": 67140, "loss": 0.4826, "lr": 4.572870083056763e-05, "epoch": 2.6995829609770627, "percentage": 27.0, "elapsed_time": "1:15:11", "remaining_time": "3:23:21", "throughput": 2316.18, "total_tokens": 10450536} {"current_steps": 18130, "total_steps": 67140, "loss": 0.5965, "lr": 4.5725067087899364e-05, "epoch": 2.700327673518022, "percentage": 27.0, "elapsed_time": "1:15:13", "remaining_time": "3:23:20", "throughput": 2316.23, "total_tokens": 10453352} {"current_steps": 18135, "total_steps": 67140, "loss": 0.6833, "lr": 4.572143194471533e-05, "epoch": 2.701072386058981, "percentage": 27.01, "elapsed_time": "1:15:14", "remaining_time": "3:23:18", "throughput": 2316.34, "total_tokens": 10456648} {"current_steps": 18140, "total_steps": 67140, "loss": 0.8512, "lr": 4.5717795401261175e-05, "epoch": 2.7018170985999403, "percentage": 27.02, "elapsed_time": "1:15:15", "remaining_time": "3:23:17", "throughput": 2316.42, "total_tokens": 10459656} {"current_steps": 18145, "total_steps": 67140, "loss": 0.5679, "lr": 4.571415745778264e-05, "epoch": 2.7025618111408996, "percentage": 27.03, "elapsed_time": "1:15:16", "remaining_time": "3:23:15", "throughput": 2316.49, "total_tokens": 10462696} {"current_steps": 18150, "total_steps": 67140, "loss": 0.6157, "lr": 4.571051811452556e-05, "epoch": 2.7033065236818588, "percentage": 27.03, "elapsed_time": "1:15:17", "remaining_time": "3:23:14", "throughput": 2316.57, "total_tokens": 10465736} {"current_steps": 18155, "total_steps": 67140, "loss": 0.7309, "lr": 4.570687737173587e-05, "epoch": 2.704051236222818, "percentage": 27.04, "elapsed_time": "1:15:18", "remaining_time": "3:23:12", "throughput": 2316.63, "total_tokens": 10468552} {"current_steps": 18160, "total_steps": 67140, "loss": 0.5498, "lr": 4.570323522965959e-05, "epoch": 2.704795948763777, "percentage": 27.05, "elapsed_time": "1:15:20", "remaining_time": "3:23:11", "throughput": 2316.68, "total_tokens": 10471432} {"current_steps": 18165, "total_steps": 67140, "loss": 0.5233, "lr": 4.569959168854285e-05, "epoch": 2.7055406613047364, "percentage": 27.06, "elapsed_time": "1:15:21", "remaining_time": "3:23:09", "throughput": 2316.67, "total_tokens": 10473864} {"current_steps": 18170, "total_steps": 67140, "loss": 0.5126, "lr": 4.5695946748631866e-05, "epoch": 2.7062853738456956, "percentage": 27.06, "elapsed_time": "1:15:22", "remaining_time": "3:23:07", "throughput": 2316.69, "total_tokens": 10476456} {"current_steps": 18175, "total_steps": 67140, "loss": 0.4702, "lr": 4.5692300410172936e-05, "epoch": 2.7070300863866548, "percentage": 27.07, "elapsed_time": "1:15:23", "remaining_time": "3:23:06", "throughput": 2316.75, "total_tokens": 10479336} {"current_steps": 18180, "total_steps": 67140, "loss": 0.6021, "lr": 4.568865267341248e-05, "epoch": 2.707774798927614, "percentage": 27.08, "elapsed_time": "1:15:24", "remaining_time": "3:23:04", "throughput": 2316.77, "total_tokens": 10481960} {"current_steps": 18185, "total_steps": 67140, "loss": 0.692, "lr": 4.5685003538596994e-05, "epoch": 2.708519511468573, "percentage": 27.09, "elapsed_time": "1:15:25", "remaining_time": "3:23:02", "throughput": 2316.81, "total_tokens": 10484744} {"current_steps": 18190, "total_steps": 67140, "loss": 0.5122, "lr": 4.568135300597306e-05, "epoch": 2.7092642240095324, "percentage": 27.09, "elapsed_time": "1:15:26", "remaining_time": "3:23:01", "throughput": 2316.8, "total_tokens": 10487144} {"current_steps": 18195, "total_steps": 67140, "loss": 0.6979, "lr": 4.567770107578737e-05, "epoch": 2.7100089365504916, "percentage": 27.1, "elapsed_time": "1:15:27", "remaining_time": "3:22:59", "throughput": 2316.87, "total_tokens": 10490120} {"current_steps": 18200, "total_steps": 67140, "loss": 0.5286, "lr": 4.567404774828672e-05, "epoch": 2.710753649091451, "percentage": 27.11, "elapsed_time": "1:15:28", "remaining_time": "3:22:58", "throughput": 2316.95, "total_tokens": 10493192} {"current_steps": 18205, "total_steps": 67140, "loss": 0.6255, "lr": 4.567039302371797e-05, "epoch": 2.71149836163241, "percentage": 27.11, "elapsed_time": "1:15:30", "remaining_time": "3:22:56", "throughput": 2317.03, "total_tokens": 10496264} {"current_steps": 18210, "total_steps": 67140, "loss": 0.5212, "lr": 4.566673690232811e-05, "epoch": 2.712243074173369, "percentage": 27.12, "elapsed_time": "1:15:31", "remaining_time": "3:22:55", "throughput": 2317.09, "total_tokens": 10499112} {"current_steps": 18215, "total_steps": 67140, "loss": 0.6594, "lr": 4.566307938436419e-05, "epoch": 2.7129877867143284, "percentage": 27.13, "elapsed_time": "1:15:32", "remaining_time": "3:22:53", "throughput": 2317.13, "total_tokens": 10501896} {"current_steps": 18220, "total_steps": 67140, "loss": 0.6853, "lr": 4.565942047007337e-05, "epoch": 2.7137324992552876, "percentage": 27.14, "elapsed_time": "1:15:33", "remaining_time": "3:22:52", "throughput": 2317.21, "total_tokens": 10504968} {"current_steps": 18225, "total_steps": 67140, "loss": 0.5729, "lr": 4.5655760159702914e-05, "epoch": 2.714477211796247, "percentage": 27.14, "elapsed_time": "1:15:34", "remaining_time": "3:22:50", "throughput": 2317.3, "total_tokens": 10508136} {"current_steps": 18230, "total_steps": 67140, "loss": 0.6835, "lr": 4.565209845350017e-05, "epoch": 2.715221924337206, "percentage": 27.15, "elapsed_time": "1:15:35", "remaining_time": "3:22:49", "throughput": 2317.38, "total_tokens": 10511176} {"current_steps": 18235, "total_steps": 67140, "loss": 0.6219, "lr": 4.564843535171257e-05, "epoch": 2.715966636878165, "percentage": 27.16, "elapsed_time": "1:15:36", "remaining_time": "3:22:47", "throughput": 2317.41, "total_tokens": 10513896} {"current_steps": 18240, "total_steps": 67140, "loss": 0.5876, "lr": 4.5644770854587666e-05, "epoch": 2.716711349419124, "percentage": 27.17, "elapsed_time": "1:15:38", "remaining_time": "3:22:46", "throughput": 2317.47, "total_tokens": 10516808} {"current_steps": 18245, "total_steps": 67140, "loss": 0.606, "lr": 4.564110496237308e-05, "epoch": 2.7174560619600836, "percentage": 27.17, "elapsed_time": "1:15:39", "remaining_time": "3:22:44", "throughput": 2317.49, "total_tokens": 10519464} {"current_steps": 18250, "total_steps": 67140, "loss": 0.4443, "lr": 4.563743767531654e-05, "epoch": 2.7182007745010424, "percentage": 27.18, "elapsed_time": "1:15:40", "remaining_time": "3:22:42", "throughput": 2317.52, "total_tokens": 10522152} {"current_steps": 18255, "total_steps": 67140, "loss": 0.6722, "lr": 4.563376899366587e-05, "epoch": 2.718945487042002, "percentage": 27.19, "elapsed_time": "1:15:41", "remaining_time": "3:22:41", "throughput": 2317.58, "total_tokens": 10525064} {"current_steps": 18260, "total_steps": 67140, "loss": 0.577, "lr": 4.5630098917668986e-05, "epoch": 2.7196901995829608, "percentage": 27.2, "elapsed_time": "1:15:42", "remaining_time": "3:22:39", "throughput": 2317.61, "total_tokens": 10527752} {"current_steps": 18265, "total_steps": 67140, "loss": 0.6831, "lr": 4.5626427447573884e-05, "epoch": 2.7204349121239204, "percentage": 27.2, "elapsed_time": "1:15:43", "remaining_time": "3:22:38", "throughput": 2317.66, "total_tokens": 10530568} {"current_steps": 18270, "total_steps": 67140, "loss": 0.6754, "lr": 4.562275458362868e-05, "epoch": 2.721179624664879, "percentage": 27.21, "elapsed_time": "1:15:44", "remaining_time": "3:22:36", "throughput": 2317.71, "total_tokens": 10533448} {"current_steps": 18275, "total_steps": 67140, "loss": 0.6142, "lr": 4.561908032608157e-05, "epoch": 2.721924337205839, "percentage": 27.22, "elapsed_time": "1:15:45", "remaining_time": "3:22:35", "throughput": 2317.75, "total_tokens": 10536264} {"current_steps": 18280, "total_steps": 67140, "loss": 0.6424, "lr": 4.561540467518084e-05, "epoch": 2.7226690497467976, "percentage": 27.23, "elapsed_time": "1:15:47", "remaining_time": "3:22:33", "throughput": 2317.88, "total_tokens": 10539688} {"current_steps": 18285, "total_steps": 67140, "loss": 0.6275, "lr": 4.561172763117488e-05, "epoch": 2.723413762287757, "percentage": 27.23, "elapsed_time": "1:15:48", "remaining_time": "3:22:32", "throughput": 2317.94, "total_tokens": 10542568} {"current_steps": 18290, "total_steps": 67140, "loss": 0.7245, "lr": 4.5608049194312165e-05, "epoch": 2.724158474828716, "percentage": 27.24, "elapsed_time": "1:15:49", "remaining_time": "3:22:30", "throughput": 2317.98, "total_tokens": 10545416} {"current_steps": 18295, "total_steps": 67140, "loss": 0.7191, "lr": 4.560436936484127e-05, "epoch": 2.724903187369675, "percentage": 27.25, "elapsed_time": "1:15:50", "remaining_time": "3:22:29", "throughput": 2318.06, "total_tokens": 10548488} {"current_steps": 18300, "total_steps": 67140, "loss": 0.8177, "lr": 4.5600688143010874e-05, "epoch": 2.7256478999106344, "percentage": 27.26, "elapsed_time": "1:15:51", "remaining_time": "3:22:27", "throughput": 2318.08, "total_tokens": 10551144} {"current_steps": 18305, "total_steps": 67140, "loss": 0.8314, "lr": 4.559700552906972e-05, "epoch": 2.7263926124515936, "percentage": 27.26, "elapsed_time": "1:15:52", "remaining_time": "3:22:26", "throughput": 2318.16, "total_tokens": 10554152} {"current_steps": 18310, "total_steps": 67140, "loss": 0.7545, "lr": 4.559332152326667e-05, "epoch": 2.727137324992553, "percentage": 27.27, "elapsed_time": "1:15:53", "remaining_time": "3:22:24", "throughput": 2318.2, "total_tokens": 10556936} {"current_steps": 18315, "total_steps": 67140, "loss": 0.6951, "lr": 4.558963612585069e-05, "epoch": 2.727882037533512, "percentage": 27.28, "elapsed_time": "1:15:55", "remaining_time": "3:22:23", "throughput": 2318.24, "total_tokens": 10559688} {"current_steps": 18320, "total_steps": 67140, "loss": 0.607, "lr": 4.558594933707081e-05, "epoch": 2.728626750074471, "percentage": 27.29, "elapsed_time": "1:15:56", "remaining_time": "3:22:21", "throughput": 2318.34, "total_tokens": 10562952} {"current_steps": 18325, "total_steps": 67140, "loss": 0.6481, "lr": 4.5582261157176164e-05, "epoch": 2.7293714626154304, "percentage": 27.29, "elapsed_time": "1:15:57", "remaining_time": "3:22:20", "throughput": 2318.37, "total_tokens": 10565672} {"current_steps": 18330, "total_steps": 67140, "loss": 0.6526, "lr": 4.5578571586416e-05, "epoch": 2.7301161751563896, "percentage": 27.3, "elapsed_time": "1:15:58", "remaining_time": "3:22:18", "throughput": 2318.45, "total_tokens": 10568712} {"current_steps": 18335, "total_steps": 67140, "loss": 0.7393, "lr": 4.557488062503962e-05, "epoch": 2.730860887697349, "percentage": 27.31, "elapsed_time": "1:15:59", "remaining_time": "3:22:17", "throughput": 2318.48, "total_tokens": 10571368} {"current_steps": 18340, "total_steps": 67140, "loss": 0.671, "lr": 4.557118827329647e-05, "epoch": 2.731605600238308, "percentage": 27.32, "elapsed_time": "1:16:00", "remaining_time": "3:22:15", "throughput": 2318.5, "total_tokens": 10574088} {"current_steps": 18345, "total_steps": 67140, "loss": 0.8387, "lr": 4.556749453143605e-05, "epoch": 2.732350312779267, "percentage": 27.32, "elapsed_time": "1:16:01", "remaining_time": "3:22:13", "throughput": 2318.54, "total_tokens": 10576872} {"current_steps": 18350, "total_steps": 67140, "loss": 0.5984, "lr": 4.556379939970797e-05, "epoch": 2.7330950253202264, "percentage": 27.33, "elapsed_time": "1:16:02", "remaining_time": "3:22:12", "throughput": 2318.6, "total_tokens": 10579752} {"current_steps": 18355, "total_steps": 67140, "loss": 0.7034, "lr": 4.5560102878361935e-05, "epoch": 2.7338397378611856, "percentage": 27.34, "elapsed_time": "1:16:04", "remaining_time": "3:22:10", "throughput": 2318.62, "total_tokens": 10582408} {"current_steps": 18360, "total_steps": 67140, "loss": 0.5796, "lr": 4.5556404967647736e-05, "epoch": 2.734584450402145, "percentage": 27.35, "elapsed_time": "1:16:05", "remaining_time": "3:22:09", "throughput": 2318.65, "total_tokens": 10585096} {"current_steps": 18365, "total_steps": 67140, "loss": 0.7078, "lr": 4.5552705667815265e-05, "epoch": 2.735329162943104, "percentage": 27.35, "elapsed_time": "1:16:06", "remaining_time": "3:22:07", "throughput": 2318.66, "total_tokens": 10587688} {"current_steps": 18370, "total_steps": 67140, "loss": 0.6946, "lr": 4.5549004979114506e-05, "epoch": 2.7360738754840632, "percentage": 27.36, "elapsed_time": "1:16:07", "remaining_time": "3:22:06", "throughput": 2318.74, "total_tokens": 10590760} {"current_steps": 18375, "total_steps": 67140, "loss": 0.6982, "lr": 4.5545302901795536e-05, "epoch": 2.7368185880250224, "percentage": 27.37, "elapsed_time": "1:16:08", "remaining_time": "3:22:04", "throughput": 2318.78, "total_tokens": 10593544} {"current_steps": 18380, "total_steps": 67140, "loss": 0.7057, "lr": 4.5541599436108535e-05, "epoch": 2.7375633005659816, "percentage": 27.38, "elapsed_time": "1:16:09", "remaining_time": "3:22:02", "throughput": 2318.85, "total_tokens": 10596552} {"current_steps": 18385, "total_steps": 67140, "loss": 0.7987, "lr": 4.553789458230375e-05, "epoch": 2.738308013106941, "percentage": 27.38, "elapsed_time": "1:16:10", "remaining_time": "3:22:01", "throughput": 2318.9, "total_tokens": 10599432} {"current_steps": 18390, "total_steps": 67140, "loss": 0.5382, "lr": 4.553418834063156e-05, "epoch": 2.7390527256479, "percentage": 27.39, "elapsed_time": "1:16:12", "remaining_time": "3:22:00", "throughput": 2319.0, "total_tokens": 10602600} {"current_steps": 18395, "total_steps": 67140, "loss": 0.5489, "lr": 4.55304807113424e-05, "epoch": 2.7397974381888592, "percentage": 27.4, "elapsed_time": "1:16:13", "remaining_time": "3:21:58", "throughput": 2319.05, "total_tokens": 10605448} {"current_steps": 18400, "total_steps": 67140, "loss": 0.7049, "lr": 4.5526771694686835e-05, "epoch": 2.7405421507298184, "percentage": 27.41, "elapsed_time": "1:16:14", "remaining_time": "3:21:57", "throughput": 2319.09, "total_tokens": 10608296} {"current_steps": 18405, "total_steps": 67140, "loss": 0.7826, "lr": 4.552306129091548e-05, "epoch": 2.7412868632707776, "percentage": 27.41, "elapsed_time": "1:16:15", "remaining_time": "3:21:55", "throughput": 2319.15, "total_tokens": 10611272} {"current_steps": 18410, "total_steps": 67140, "loss": 0.6403, "lr": 4.551934950027909e-05, "epoch": 2.742031575811737, "percentage": 27.42, "elapsed_time": "1:16:16", "remaining_time": "3:21:54", "throughput": 2319.25, "total_tokens": 10614440} {"current_steps": 18415, "total_steps": 67140, "loss": 0.564, "lr": 4.551563632302849e-05, "epoch": 2.7427762883526956, "percentage": 27.43, "elapsed_time": "1:16:17", "remaining_time": "3:21:52", "throughput": 2319.29, "total_tokens": 10617192} {"current_steps": 18420, "total_steps": 67140, "loss": 0.6385, "lr": 4.551192175941459e-05, "epoch": 2.7435210008936552, "percentage": 27.44, "elapsed_time": "1:16:18", "remaining_time": "3:21:50", "throughput": 2319.31, "total_tokens": 10619880} {"current_steps": 18425, "total_steps": 67140, "loss": 0.5747, "lr": 4.550820580968842e-05, "epoch": 2.744265713434614, "percentage": 27.44, "elapsed_time": "1:16:19", "remaining_time": "3:21:49", "throughput": 2319.33, "total_tokens": 10622536} {"current_steps": 18430, "total_steps": 67140, "loss": 0.7289, "lr": 4.550448847410108e-05, "epoch": 2.7450104259755737, "percentage": 27.45, "elapsed_time": "1:16:21", "remaining_time": "3:21:48", "throughput": 2319.44, "total_tokens": 10625864} {"current_steps": 18435, "total_steps": 67140, "loss": 0.62, "lr": 4.550076975290377e-05, "epoch": 2.7457551385165324, "percentage": 27.46, "elapsed_time": "1:16:22", "remaining_time": "3:21:46", "throughput": 2319.5, "total_tokens": 10628776} {"current_steps": 18440, "total_steps": 67140, "loss": 0.6689, "lr": 4.549704964634779e-05, "epoch": 2.746499851057492, "percentage": 27.46, "elapsed_time": "1:16:23", "remaining_time": "3:21:44", "throughput": 2319.54, "total_tokens": 10631496} {"current_steps": 18445, "total_steps": 67140, "loss": 0.6943, "lr": 4.549332815468453e-05, "epoch": 2.747244563598451, "percentage": 27.47, "elapsed_time": "1:16:24", "remaining_time": "3:21:43", "throughput": 2319.62, "total_tokens": 10634600} {"current_steps": 18450, "total_steps": 67140, "loss": 0.8144, "lr": 4.5489605278165484e-05, "epoch": 2.7479892761394105, "percentage": 27.48, "elapsed_time": "1:16:25", "remaining_time": "3:21:41", "throughput": 2319.65, "total_tokens": 10637320} {"current_steps": 18455, "total_steps": 67140, "loss": 0.539, "lr": 4.548588101704221e-05, "epoch": 2.7487339886803692, "percentage": 27.49, "elapsed_time": "1:16:26", "remaining_time": "3:21:40", "throughput": 2319.68, "total_tokens": 10640008} {"current_steps": 18460, "total_steps": 67140, "loss": 0.6281, "lr": 4.5482155371566384e-05, "epoch": 2.7494787012213284, "percentage": 27.49, "elapsed_time": "1:16:27", "remaining_time": "3:21:38", "throughput": 2319.73, "total_tokens": 10642856} {"current_steps": 18465, "total_steps": 67140, "loss": 0.7667, "lr": 4.5478428341989774e-05, "epoch": 2.7502234137622876, "percentage": 27.5, "elapsed_time": "1:16:29", "remaining_time": "3:21:37", "throughput": 2319.83, "total_tokens": 10646024} {"current_steps": 18470, "total_steps": 67140, "loss": 0.5883, "lr": 4.547469992856424e-05, "epoch": 2.750968126303247, "percentage": 27.51, "elapsed_time": "1:16:30", "remaining_time": "3:21:35", "throughput": 2319.9, "total_tokens": 10649064} {"current_steps": 18475, "total_steps": 67140, "loss": 0.8485, "lr": 4.5470970131541727e-05, "epoch": 2.751712838844206, "percentage": 27.52, "elapsed_time": "1:16:31", "remaining_time": "3:21:34", "throughput": 2319.94, "total_tokens": 10651784} {"current_steps": 18480, "total_steps": 67140, "loss": 0.5814, "lr": 4.546723895117428e-05, "epoch": 2.7524575513851652, "percentage": 27.52, "elapsed_time": "1:16:32", "remaining_time": "3:21:32", "throughput": 2320.02, "total_tokens": 10654920} {"current_steps": 18485, "total_steps": 67140, "loss": 0.5936, "lr": 4.546350638771404e-05, "epoch": 2.7532022639261244, "percentage": 27.53, "elapsed_time": "1:16:33", "remaining_time": "3:21:31", "throughput": 2320.09, "total_tokens": 10657928} {"current_steps": 18490, "total_steps": 67140, "loss": 0.5842, "lr": 4.5459772441413234e-05, "epoch": 2.7539469764670836, "percentage": 27.54, "elapsed_time": "1:16:34", "remaining_time": "3:21:29", "throughput": 2320.15, "total_tokens": 10660808} {"current_steps": 18495, "total_steps": 67140, "loss": 0.7254, "lr": 4.5456037112524195e-05, "epoch": 2.754691689008043, "percentage": 27.55, "elapsed_time": "1:16:36", "remaining_time": "3:21:28", "throughput": 2320.19, "total_tokens": 10663592} {"current_steps": 18500, "total_steps": 67140, "loss": 0.7564, "lr": 4.545230040129933e-05, "epoch": 2.755436401549002, "percentage": 27.55, "elapsed_time": "1:16:37", "remaining_time": "3:21:26", "throughput": 2320.24, "total_tokens": 10666408} {"current_steps": 18505, "total_steps": 67140, "loss": 0.565, "lr": 4.544856230799116e-05, "epoch": 2.7561811140899612, "percentage": 27.56, "elapsed_time": "1:16:38", "remaining_time": "3:21:25", "throughput": 2320.26, "total_tokens": 10669096} {"current_steps": 18510, "total_steps": 67140, "loss": 0.5877, "lr": 4.544482283285228e-05, "epoch": 2.7569258266309205, "percentage": 27.57, "elapsed_time": "1:16:39", "remaining_time": "3:21:23", "throughput": 2320.32, "total_tokens": 10672008} {"current_steps": 18515, "total_steps": 67140, "loss": 0.6538, "lr": 4.54410819761354e-05, "epoch": 2.7576705391718797, "percentage": 27.58, "elapsed_time": "1:16:40", "remaining_time": "3:21:22", "throughput": 2320.38, "total_tokens": 10674920} {"current_steps": 18520, "total_steps": 67140, "loss": 0.7748, "lr": 4.5437339738093315e-05, "epoch": 2.758415251712839, "percentage": 27.58, "elapsed_time": "1:16:41", "remaining_time": "3:21:20", "throughput": 2320.42, "total_tokens": 10677736} {"current_steps": 18525, "total_steps": 67140, "loss": 0.6841, "lr": 4.54335961189789e-05, "epoch": 2.759159964253798, "percentage": 27.59, "elapsed_time": "1:16:42", "remaining_time": "3:21:18", "throughput": 2320.46, "total_tokens": 10680488} {"current_steps": 18530, "total_steps": 67140, "loss": 0.5243, "lr": 4.542985111904513e-05, "epoch": 2.7599046767947573, "percentage": 27.6, "elapsed_time": "1:16:43", "remaining_time": "3:21:17", "throughput": 2320.54, "total_tokens": 10683528} {"current_steps": 18535, "total_steps": 67140, "loss": 0.7317, "lr": 4.542610473854508e-05, "epoch": 2.7606493893357165, "percentage": 27.61, "elapsed_time": "1:16:45", "remaining_time": "3:21:16", "throughput": 2320.61, "total_tokens": 10686568} {"current_steps": 18540, "total_steps": 67140, "loss": 0.5815, "lr": 4.542235697773193e-05, "epoch": 2.7613941018766757, "percentage": 27.61, "elapsed_time": "1:16:46", "remaining_time": "3:21:14", "throughput": 2320.65, "total_tokens": 10689320} {"current_steps": 18545, "total_steps": 67140, "loss": 0.692, "lr": 4.5418607836858914e-05, "epoch": 2.762138814417635, "percentage": 27.62, "elapsed_time": "1:16:47", "remaining_time": "3:21:12", "throughput": 2320.69, "total_tokens": 10692136} {"current_steps": 18550, "total_steps": 67140, "loss": 0.7532, "lr": 4.5414857316179415e-05, "epoch": 2.762883526958594, "percentage": 27.63, "elapsed_time": "1:16:48", "remaining_time": "3:21:11", "throughput": 2320.77, "total_tokens": 10695176} {"current_steps": 18555, "total_steps": 67140, "loss": 0.8353, "lr": 4.541110541594684e-05, "epoch": 2.7636282394995533, "percentage": 27.64, "elapsed_time": "1:16:49", "remaining_time": "3:21:09", "throughput": 2320.8, "total_tokens": 10697928} {"current_steps": 18560, "total_steps": 67140, "loss": 0.6269, "lr": 4.540735213641476e-05, "epoch": 2.7643729520405125, "percentage": 27.64, "elapsed_time": "1:16:50", "remaining_time": "3:21:08", "throughput": 2320.81, "total_tokens": 10700552} {"current_steps": 18565, "total_steps": 67140, "loss": 0.7805, "lr": 4.540359747783679e-05, "epoch": 2.7651176645814717, "percentage": 27.65, "elapsed_time": "1:16:51", "remaining_time": "3:21:06", "throughput": 2320.86, "total_tokens": 10703336} {"current_steps": 18570, "total_steps": 67140, "loss": 0.8187, "lr": 4.539984144046665e-05, "epoch": 2.765862377122431, "percentage": 27.66, "elapsed_time": "1:16:52", "remaining_time": "3:21:05", "throughput": 2320.88, "total_tokens": 10706024} {"current_steps": 18575, "total_steps": 67140, "loss": 0.743, "lr": 4.539608402455817e-05, "epoch": 2.76660708966339, "percentage": 27.67, "elapsed_time": "1:16:54", "remaining_time": "3:21:03", "throughput": 2320.95, "total_tokens": 10709032} {"current_steps": 18580, "total_steps": 67140, "loss": 0.5605, "lr": 4.5392325230365264e-05, "epoch": 2.7673518022043493, "percentage": 27.67, "elapsed_time": "1:16:55", "remaining_time": "3:21:02", "throughput": 2321.01, "total_tokens": 10711976} {"current_steps": 18585, "total_steps": 67140, "loss": 0.5845, "lr": 4.538856505814191e-05, "epoch": 2.7680965147453085, "percentage": 27.68, "elapsed_time": "1:16:56", "remaining_time": "3:21:00", "throughput": 2321.05, "total_tokens": 10714760} {"current_steps": 18590, "total_steps": 67140, "loss": 0.8418, "lr": 4.5384803508142235e-05, "epoch": 2.7688412272862672, "percentage": 27.69, "elapsed_time": "1:16:57", "remaining_time": "3:20:59", "throughput": 2321.11, "total_tokens": 10717704} {"current_steps": 18595, "total_steps": 67140, "loss": 0.6809, "lr": 4.538104058062042e-05, "epoch": 2.769585939827227, "percentage": 27.7, "elapsed_time": "1:16:58", "remaining_time": "3:20:57", "throughput": 2321.16, "total_tokens": 10720552} {"current_steps": 18600, "total_steps": 67140, "loss": 0.6268, "lr": 4.537727627583074e-05, "epoch": 2.7703306523681857, "percentage": 27.7, "elapsed_time": "1:16:59", "remaining_time": "3:20:56", "throughput": 2321.25, "total_tokens": 10723752} {"current_steps": 18605, "total_steps": 67140, "loss": 0.8203, "lr": 4.5373510594027576e-05, "epoch": 2.7710753649091453, "percentage": 27.71, "elapsed_time": "1:17:00", "remaining_time": "3:20:54", "throughput": 2321.27, "total_tokens": 10726440} {"current_steps": 18610, "total_steps": 67140, "loss": 0.6686, "lr": 4.53697435354654e-05, "epoch": 2.771820077450104, "percentage": 27.72, "elapsed_time": "1:17:02", "remaining_time": "3:20:52", "throughput": 2321.27, "total_tokens": 10728904} {"current_steps": 18615, "total_steps": 67140, "loss": 0.6822, "lr": 4.536597510039878e-05, "epoch": 2.7725647899910637, "percentage": 27.73, "elapsed_time": "1:17:03", "remaining_time": "3:20:51", "throughput": 2321.29, "total_tokens": 10731560} {"current_steps": 18620, "total_steps": 67140, "loss": 0.6602, "lr": 4.536220528908236e-05, "epoch": 2.7733095025320225, "percentage": 27.73, "elapsed_time": "1:17:04", "remaining_time": "3:20:49", "throughput": 2321.33, "total_tokens": 10734312} {"current_steps": 18625, "total_steps": 67140, "loss": 0.7095, "lr": 4.535843410177089e-05, "epoch": 2.7740542150729817, "percentage": 27.74, "elapsed_time": "1:17:05", "remaining_time": "3:20:48", "throughput": 2321.4, "total_tokens": 10737288} {"current_steps": 18630, "total_steps": 67140, "loss": 0.6952, "lr": 4.5354661538719224e-05, "epoch": 2.774798927613941, "percentage": 27.75, "elapsed_time": "1:17:06", "remaining_time": "3:20:46", "throughput": 2321.46, "total_tokens": 10740200} {"current_steps": 18635, "total_steps": 67140, "loss": 0.6384, "lr": 4.5350887600182275e-05, "epoch": 2.7755436401549, "percentage": 27.76, "elapsed_time": "1:17:07", "remaining_time": "3:20:45", "throughput": 2321.49, "total_tokens": 10742984} {"current_steps": 18640, "total_steps": 67140, "loss": 0.811, "lr": 4.534711228641509e-05, "epoch": 2.7762883526958593, "percentage": 27.76, "elapsed_time": "1:17:08", "remaining_time": "3:20:43", "throughput": 2321.52, "total_tokens": 10745704} {"current_steps": 18645, "total_steps": 67140, "loss": 0.6571, "lr": 4.5343335597672776e-05, "epoch": 2.7770330652368185, "percentage": 27.77, "elapsed_time": "1:17:09", "remaining_time": "3:20:41", "throughput": 2321.53, "total_tokens": 10748264} {"current_steps": 18650, "total_steps": 67140, "loss": 0.6152, "lr": 4.5339557534210565e-05, "epoch": 2.7777777777777777, "percentage": 27.78, "elapsed_time": "1:17:10", "remaining_time": "3:20:40", "throughput": 2321.6, "total_tokens": 10751272} {"current_steps": 18655, "total_steps": 67140, "loss": 0.5738, "lr": 4.533577809628374e-05, "epoch": 2.778522490318737, "percentage": 27.79, "elapsed_time": "1:17:12", "remaining_time": "3:20:39", "throughput": 2321.66, "total_tokens": 10754280} {"current_steps": 18660, "total_steps": 67140, "loss": 0.6842, "lr": 4.533199728414771e-05, "epoch": 2.779267202859696, "percentage": 27.79, "elapsed_time": "1:17:13", "remaining_time": "3:20:37", "throughput": 2321.76, "total_tokens": 10757384} {"current_steps": 18665, "total_steps": 67140, "loss": 0.6379, "lr": 4.532821509805797e-05, "epoch": 2.7800119154006553, "percentage": 27.8, "elapsed_time": "1:17:14", "remaining_time": "3:20:36", "throughput": 2321.81, "total_tokens": 10760296} {"current_steps": 18670, "total_steps": 67140, "loss": 0.6259, "lr": 4.53244315382701e-05, "epoch": 2.7807566279416145, "percentage": 27.81, "elapsed_time": "1:17:15", "remaining_time": "3:20:34", "throughput": 2321.86, "total_tokens": 10763112} {"current_steps": 18675, "total_steps": 67140, "loss": 0.6603, "lr": 4.532064660503978e-05, "epoch": 2.7815013404825737, "percentage": 27.82, "elapsed_time": "1:17:16", "remaining_time": "3:20:33", "throughput": 2321.9, "total_tokens": 10765928} {"current_steps": 18680, "total_steps": 67140, "loss": 0.5477, "lr": 4.531686029862279e-05, "epoch": 2.782246053023533, "percentage": 27.82, "elapsed_time": "1:17:17", "remaining_time": "3:20:31", "throughput": 2321.93, "total_tokens": 10768680} {"current_steps": 18685, "total_steps": 67140, "loss": 0.86, "lr": 4.531307261927497e-05, "epoch": 2.782990765564492, "percentage": 27.83, "elapsed_time": "1:17:18", "remaining_time": "3:20:30", "throughput": 2322.01, "total_tokens": 10771720} {"current_steps": 18690, "total_steps": 67140, "loss": 0.5978, "lr": 4.530928356725229e-05, "epoch": 2.7837354781054513, "percentage": 27.84, "elapsed_time": "1:17:20", "remaining_time": "3:20:28", "throughput": 2322.01, "total_tokens": 10774216} {"current_steps": 18695, "total_steps": 67140, "loss": 0.7811, "lr": 4.530549314281081e-05, "epoch": 2.7844801906464105, "percentage": 27.84, "elapsed_time": "1:17:21", "remaining_time": "3:20:26", "throughput": 2322.04, "total_tokens": 10777000} {"current_steps": 18700, "total_steps": 67140, "loss": 0.6484, "lr": 4.530170134620665e-05, "epoch": 2.7852249031873697, "percentage": 27.85, "elapsed_time": "1:17:22", "remaining_time": "3:20:25", "throughput": 2322.06, "total_tokens": 10779656} {"current_steps": 18705, "total_steps": 67140, "loss": 0.6449, "lr": 4.529790817769606e-05, "epoch": 2.785969615728329, "percentage": 27.86, "elapsed_time": "1:17:23", "remaining_time": "3:20:23", "throughput": 2322.11, "total_tokens": 10782504} {"current_steps": 18710, "total_steps": 67140, "loss": 0.6865, "lr": 4.529411363753535e-05, "epoch": 2.786714328269288, "percentage": 27.87, "elapsed_time": "1:17:24", "remaining_time": "3:20:22", "throughput": 2322.14, "total_tokens": 10785320} {"current_steps": 18715, "total_steps": 67140, "loss": 0.6723, "lr": 4.5290317725980964e-05, "epoch": 2.7874590408102473, "percentage": 27.87, "elapsed_time": "1:17:25", "remaining_time": "3:20:20", "throughput": 2322.21, "total_tokens": 10788328} {"current_steps": 18720, "total_steps": 67140, "loss": 0.5373, "lr": 4.5286520443289396e-05, "epoch": 2.7882037533512065, "percentage": 27.88, "elapsed_time": "1:17:26", "remaining_time": "3:20:19", "throughput": 2322.22, "total_tokens": 10790888} {"current_steps": 18725, "total_steps": 67140, "loss": 0.7521, "lr": 4.528272178971725e-05, "epoch": 2.7889484658921657, "percentage": 27.89, "elapsed_time": "1:17:27", "remaining_time": "3:20:17", "throughput": 2322.3, "total_tokens": 10793960} {"current_steps": 18730, "total_steps": 67140, "loss": 0.7141, "lr": 4.5278921765521234e-05, "epoch": 2.789693178433125, "percentage": 27.9, "elapsed_time": "1:17:29", "remaining_time": "3:20:16", "throughput": 2322.36, "total_tokens": 10796872} {"current_steps": 18735, "total_steps": 67140, "loss": 0.6621, "lr": 4.5275120370958124e-05, "epoch": 2.790437890974084, "percentage": 27.9, "elapsed_time": "1:17:30", "remaining_time": "3:20:14", "throughput": 2322.44, "total_tokens": 10799880} {"current_steps": 18740, "total_steps": 67140, "loss": 0.7092, "lr": 4.5271317606284826e-05, "epoch": 2.7911826035150433, "percentage": 27.91, "elapsed_time": "1:17:31", "remaining_time": "3:20:13", "throughput": 2322.46, "total_tokens": 10802568} {"current_steps": 18745, "total_steps": 67140, "loss": 0.5316, "lr": 4.5267513471758295e-05, "epoch": 2.7919273160560025, "percentage": 27.92, "elapsed_time": "1:17:32", "remaining_time": "3:20:11", "throughput": 2322.52, "total_tokens": 10805480} {"current_steps": 18750, "total_steps": 67140, "loss": 0.8538, "lr": 4.5263707967635596e-05, "epoch": 2.7926720285969617, "percentage": 27.93, "elapsed_time": "1:17:33", "remaining_time": "3:20:10", "throughput": 2322.62, "total_tokens": 10808680} {"current_steps": 18755, "total_steps": 67140, "loss": 0.7165, "lr": 4.5259901094173915e-05, "epoch": 2.7934167411379205, "percentage": 27.93, "elapsed_time": "1:17:34", "remaining_time": "3:20:08", "throughput": 2322.7, "total_tokens": 10811720} {"current_steps": 18760, "total_steps": 67140, "loss": 0.6674, "lr": 4.525609285163048e-05, "epoch": 2.79416145367888, "percentage": 27.94, "elapsed_time": "1:17:35", "remaining_time": "3:20:07", "throughput": 2322.75, "total_tokens": 10814568} {"current_steps": 18765, "total_steps": 67140, "loss": 0.7939, "lr": 4.525228324026265e-05, "epoch": 2.794906166219839, "percentage": 27.95, "elapsed_time": "1:17:37", "remaining_time": "3:20:05", "throughput": 2322.8, "total_tokens": 10817448} {"current_steps": 18770, "total_steps": 67140, "loss": 0.6553, "lr": 4.5248472260327854e-05, "epoch": 2.7956508787607985, "percentage": 27.96, "elapsed_time": "1:17:38", "remaining_time": "3:20:04", "throughput": 2322.88, "total_tokens": 10820584} {"current_steps": 18775, "total_steps": 67140, "loss": 0.7658, "lr": 4.5244659912083626e-05, "epoch": 2.7963955913017573, "percentage": 27.96, "elapsed_time": "1:17:39", "remaining_time": "3:20:02", "throughput": 2322.93, "total_tokens": 10823400} {"current_steps": 18780, "total_steps": 67140, "loss": 0.6688, "lr": 4.524084619578759e-05, "epoch": 2.797140303842717, "percentage": 27.97, "elapsed_time": "1:17:40", "remaining_time": "3:20:01", "throughput": 2322.94, "total_tokens": 10826024} {"current_steps": 18785, "total_steps": 67140, "loss": 0.6143, "lr": 4.523703111169746e-05, "epoch": 2.7978850163836757, "percentage": 27.98, "elapsed_time": "1:17:41", "remaining_time": "3:19:59", "throughput": 2323.01, "total_tokens": 10829000} {"current_steps": 18790, "total_steps": 67140, "loss": 0.7525, "lr": 4.5233214660071055e-05, "epoch": 2.7986297289246354, "percentage": 27.99, "elapsed_time": "1:17:42", "remaining_time": "3:19:58", "throughput": 2323.06, "total_tokens": 10831912} {"current_steps": 18795, "total_steps": 67140, "loss": 0.6673, "lr": 4.522939684116626e-05, "epoch": 2.799374441465594, "percentage": 27.99, "elapsed_time": "1:17:43", "remaining_time": "3:19:56", "throughput": 2323.15, "total_tokens": 10835048} {"current_steps": 18800, "total_steps": 67140, "loss": 0.7122, "lr": 4.522557765524107e-05, "epoch": 2.8001191540065533, "percentage": 28.0, "elapsed_time": "1:17:45", "remaining_time": "3:19:55", "throughput": 2323.21, "total_tokens": 10837992} {"current_steps": 18805, "total_steps": 67140, "loss": 0.4997, "lr": 4.5221757102553576e-05, "epoch": 2.8008638665475125, "percentage": 28.01, "elapsed_time": "1:17:46", "remaining_time": "3:19:53", "throughput": 2323.25, "total_tokens": 10840808} {"current_steps": 18810, "total_steps": 67140, "loss": 0.7277, "lr": 4.521793518336195e-05, "epoch": 2.8016085790884717, "percentage": 28.02, "elapsed_time": "1:17:47", "remaining_time": "3:19:52", "throughput": 2323.32, "total_tokens": 10843720} {"current_steps": 18815, "total_steps": 67140, "loss": 0.6048, "lr": 4.521411189792447e-05, "epoch": 2.802353291629431, "percentage": 28.02, "elapsed_time": "1:17:48", "remaining_time": "3:19:50", "throughput": 2323.41, "total_tokens": 10846920} {"current_steps": 18820, "total_steps": 67140, "loss": 0.5384, "lr": 4.521028724649949e-05, "epoch": 2.80309800417039, "percentage": 28.03, "elapsed_time": "1:17:49", "remaining_time": "3:19:49", "throughput": 2323.47, "total_tokens": 10849832} {"current_steps": 18825, "total_steps": 67140, "loss": 0.6709, "lr": 4.520646122934547e-05, "epoch": 2.8038427167113493, "percentage": 28.04, "elapsed_time": "1:17:50", "remaining_time": "3:19:47", "throughput": 2323.5, "total_tokens": 10852584} {"current_steps": 18830, "total_steps": 67140, "loss": 0.6786, "lr": 4.5202633846720944e-05, "epoch": 2.8045874292523085, "percentage": 28.05, "elapsed_time": "1:17:51", "remaining_time": "3:19:46", "throughput": 2323.58, "total_tokens": 10855624} {"current_steps": 18835, "total_steps": 67140, "loss": 0.7021, "lr": 4.519880509888457e-05, "epoch": 2.8053321417932677, "percentage": 28.05, "elapsed_time": "1:17:53", "remaining_time": "3:19:44", "throughput": 2323.64, "total_tokens": 10858632} {"current_steps": 18840, "total_steps": 67140, "loss": 0.5694, "lr": 4.519497498609506e-05, "epoch": 2.806076854334227, "percentage": 28.06, "elapsed_time": "1:17:54", "remaining_time": "3:19:43", "throughput": 2323.7, "total_tokens": 10861544} {"current_steps": 18845, "total_steps": 67140, "loss": 0.6537, "lr": 4.519114350861125e-05, "epoch": 2.806821566875186, "percentage": 28.07, "elapsed_time": "1:17:55", "remaining_time": "3:19:41", "throughput": 2323.75, "total_tokens": 10864392} {"current_steps": 18850, "total_steps": 67140, "loss": 0.7102, "lr": 4.5187310666692065e-05, "epoch": 2.8075662794161453, "percentage": 28.08, "elapsed_time": "1:17:56", "remaining_time": "3:19:40", "throughput": 2323.79, "total_tokens": 10867176} {"current_steps": 18855, "total_steps": 67140, "loss": 0.6376, "lr": 4.5183476460596486e-05, "epoch": 2.8083109919571045, "percentage": 28.08, "elapsed_time": "1:17:57", "remaining_time": "3:19:38", "throughput": 2323.84, "total_tokens": 10869992} {"current_steps": 18860, "total_steps": 67140, "loss": 0.6495, "lr": 4.5179640890583634e-05, "epoch": 2.8090557044980637, "percentage": 28.09, "elapsed_time": "1:17:58", "remaining_time": "3:19:37", "throughput": 2323.92, "total_tokens": 10873096} {"current_steps": 18865, "total_steps": 67140, "loss": 0.6543, "lr": 4.51758039569127e-05, "epoch": 2.809800417039023, "percentage": 28.1, "elapsed_time": "1:17:59", "remaining_time": "3:19:35", "throughput": 2323.94, "total_tokens": 10875720} {"current_steps": 18870, "total_steps": 67140, "loss": 0.796, "lr": 4.517196565984296e-05, "epoch": 2.810545129579982, "percentage": 28.11, "elapsed_time": "1:18:01", "remaining_time": "3:19:34", "throughput": 2324.01, "total_tokens": 10878728} {"current_steps": 18875, "total_steps": 67140, "loss": 0.6736, "lr": 4.5168125999633794e-05, "epoch": 2.8112898421209414, "percentage": 28.11, "elapsed_time": "1:18:02", "remaining_time": "3:19:32", "throughput": 2324.05, "total_tokens": 10881480} {"current_steps": 18880, "total_steps": 67140, "loss": 0.7421, "lr": 4.5164284976544664e-05, "epoch": 2.8120345546619006, "percentage": 28.12, "elapsed_time": "1:18:03", "remaining_time": "3:19:30", "throughput": 2324.05, "total_tokens": 10883976} {"current_steps": 18885, "total_steps": 67140, "loss": 0.6129, "lr": 4.516044259083514e-05, "epoch": 2.8127792672028598, "percentage": 28.13, "elapsed_time": "1:18:04", "remaining_time": "3:19:29", "throughput": 2324.08, "total_tokens": 10886728} {"current_steps": 18890, "total_steps": 67140, "loss": 0.4869, "lr": 4.515659884276487e-05, "epoch": 2.813523979743819, "percentage": 28.14, "elapsed_time": "1:18:05", "remaining_time": "3:19:27", "throughput": 2324.14, "total_tokens": 10889608} {"current_steps": 18895, "total_steps": 67140, "loss": 0.6479, "lr": 4.515275373259361e-05, "epoch": 2.814268692284778, "percentage": 28.14, "elapsed_time": "1:18:06", "remaining_time": "3:19:26", "throughput": 2324.17, "total_tokens": 10892328} {"current_steps": 18900, "total_steps": 67140, "loss": 0.6145, "lr": 4.5148907260581185e-05, "epoch": 2.8150134048257374, "percentage": 28.15, "elapsed_time": "1:18:07", "remaining_time": "3:19:24", "throughput": 2324.23, "total_tokens": 10895304} {"current_steps": 18905, "total_steps": 67140, "loss": 0.536, "lr": 4.5145059426987523e-05, "epoch": 2.8157581173666966, "percentage": 28.16, "elapsed_time": "1:18:08", "remaining_time": "3:19:23", "throughput": 2324.28, "total_tokens": 10898184} {"current_steps": 18910, "total_steps": 67140, "loss": 0.9269, "lr": 4.514121023207265e-05, "epoch": 2.8165028299076558, "percentage": 28.17, "elapsed_time": "1:18:09", "remaining_time": "3:19:21", "throughput": 2324.31, "total_tokens": 10900968} {"current_steps": 18915, "total_steps": 67140, "loss": 0.5173, "lr": 4.513735967609668e-05, "epoch": 2.817247542448615, "percentage": 28.17, "elapsed_time": "1:18:11", "remaining_time": "3:19:20", "throughput": 2324.32, "total_tokens": 10903624} {"current_steps": 18920, "total_steps": 67140, "loss": 0.7203, "lr": 4.5133507759319816e-05, "epoch": 2.817992254989574, "percentage": 28.18, "elapsed_time": "1:18:12", "remaining_time": "3:19:18", "throughput": 2324.4, "total_tokens": 10906696} {"current_steps": 18925, "total_steps": 67140, "loss": 0.6988, "lr": 4.512965448200235e-05, "epoch": 2.8187369675305334, "percentage": 28.19, "elapsed_time": "1:18:13", "remaining_time": "3:19:17", "throughput": 2324.42, "total_tokens": 10909320} {"current_steps": 18930, "total_steps": 67140, "loss": 0.6732, "lr": 4.5125799844404683e-05, "epoch": 2.819481680071492, "percentage": 28.19, "elapsed_time": "1:18:14", "remaining_time": "3:19:15", "throughput": 2324.45, "total_tokens": 10912008} {"current_steps": 18935, "total_steps": 67140, "loss": 0.6576, "lr": 4.512194384678728e-05, "epoch": 2.820226392612452, "percentage": 28.2, "elapsed_time": "1:18:15", "remaining_time": "3:19:14", "throughput": 2324.51, "total_tokens": 10914920} {"current_steps": 18940, "total_steps": 67140, "loss": 0.6642, "lr": 4.511808648941073e-05, "epoch": 2.8209711051534105, "percentage": 28.21, "elapsed_time": "1:18:16", "remaining_time": "3:19:12", "throughput": 2324.54, "total_tokens": 10917640} {"current_steps": 18945, "total_steps": 67140, "loss": 0.7181, "lr": 4.511422777253568e-05, "epoch": 2.82171581769437, "percentage": 28.22, "elapsed_time": "1:18:17", "remaining_time": "3:19:10", "throughput": 2324.59, "total_tokens": 10920520} {"current_steps": 18950, "total_steps": 67140, "loss": 0.6838, "lr": 4.51103676964229e-05, "epoch": 2.822460530235329, "percentage": 28.22, "elapsed_time": "1:18:18", "remaining_time": "3:19:09", "throughput": 2324.64, "total_tokens": 10923400} {"current_steps": 18955, "total_steps": 67140, "loss": 0.6749, "lr": 4.5106506261333234e-05, "epoch": 2.8232052427762886, "percentage": 28.23, "elapsed_time": "1:18:20", "remaining_time": "3:19:08", "throughput": 2324.7, "total_tokens": 10926312} {"current_steps": 18960, "total_steps": 67140, "loss": 0.7443, "lr": 4.5102643467527616e-05, "epoch": 2.8239499553172474, "percentage": 28.24, "elapsed_time": "1:18:21", "remaining_time": "3:19:06", "throughput": 2324.73, "total_tokens": 10929096} {"current_steps": 18965, "total_steps": 67140, "loss": 0.6173, "lr": 4.509877931526709e-05, "epoch": 2.824694667858207, "percentage": 28.25, "elapsed_time": "1:18:22", "remaining_time": "3:19:04", "throughput": 2324.74, "total_tokens": 10931656} {"current_steps": 18970, "total_steps": 67140, "loss": 0.6472, "lr": 4.5094913804812776e-05, "epoch": 2.8254393803991658, "percentage": 28.25, "elapsed_time": "1:18:23", "remaining_time": "3:19:03", "throughput": 2324.78, "total_tokens": 10934408} {"current_steps": 18975, "total_steps": 67140, "loss": 0.672, "lr": 4.509104693642588e-05, "epoch": 2.826184092940125, "percentage": 28.26, "elapsed_time": "1:18:24", "remaining_time": "3:19:01", "throughput": 2324.81, "total_tokens": 10937160} {"current_steps": 18980, "total_steps": 67140, "loss": 0.6692, "lr": 4.508717871036772e-05, "epoch": 2.826928805481084, "percentage": 28.27, "elapsed_time": "1:18:25", "remaining_time": "3:19:00", "throughput": 2324.88, "total_tokens": 10940136} {"current_steps": 18985, "total_steps": 67140, "loss": 0.6898, "lr": 4.508330912689969e-05, "epoch": 2.8276735180220434, "percentage": 28.28, "elapsed_time": "1:18:26", "remaining_time": "3:18:58", "throughput": 2324.94, "total_tokens": 10943080} {"current_steps": 18990, "total_steps": 67140, "loss": 0.6789, "lr": 4.5079438186283285e-05, "epoch": 2.8284182305630026, "percentage": 28.28, "elapsed_time": "1:18:27", "remaining_time": "3:18:57", "throughput": 2324.94, "total_tokens": 10945640} {"current_steps": 18995, "total_steps": 67140, "loss": 0.6553, "lr": 4.507556588878009e-05, "epoch": 2.8291629431039618, "percentage": 28.29, "elapsed_time": "1:18:29", "remaining_time": "3:18:55", "throughput": 2324.98, "total_tokens": 10948456} {"current_steps": 19000, "total_steps": 67140, "loss": 0.6335, "lr": 4.5071692234651764e-05, "epoch": 2.829907655644921, "percentage": 28.3, "elapsed_time": "1:18:30", "remaining_time": "3:18:54", "throughput": 2325.03, "total_tokens": 10951336} {"current_steps": 19005, "total_steps": 67140, "loss": 0.5832, "lr": 4.506781722416008e-05, "epoch": 2.83065236818588, "percentage": 28.31, "elapsed_time": "1:18:31", "remaining_time": "3:18:52", "throughput": 2325.09, "total_tokens": 10954312} {"current_steps": 19010, "total_steps": 67140, "loss": 0.6795, "lr": 4.5063940857566896e-05, "epoch": 2.8313970807268394, "percentage": 28.31, "elapsed_time": "1:18:32", "remaining_time": "3:18:51", "throughput": 2325.14, "total_tokens": 10957192} {"current_steps": 19015, "total_steps": 67140, "loss": 0.7242, "lr": 4.506006313513418e-05, "epoch": 2.8321417932677986, "percentage": 28.32, "elapsed_time": "1:18:33", "remaining_time": "3:18:49", "throughput": 2325.15, "total_tokens": 10959720} {"current_steps": 19020, "total_steps": 67140, "loss": 0.6329, "lr": 4.505618405712394e-05, "epoch": 2.832886505808758, "percentage": 28.33, "elapsed_time": "1:18:34", "remaining_time": "3:18:48", "throughput": 2325.21, "total_tokens": 10962696} {"current_steps": 19025, "total_steps": 67140, "loss": 0.7335, "lr": 4.505230362379833e-05, "epoch": 2.833631218349717, "percentage": 28.34, "elapsed_time": "1:18:35", "remaining_time": "3:18:46", "throughput": 2325.27, "total_tokens": 10965672} {"current_steps": 19030, "total_steps": 67140, "loss": 0.6864, "lr": 4.504842183541956e-05, "epoch": 2.834375930890676, "percentage": 28.34, "elapsed_time": "1:18:37", "remaining_time": "3:18:45", "throughput": 2325.34, "total_tokens": 10968616} {"current_steps": 19035, "total_steps": 67140, "loss": 0.5469, "lr": 4.5044538692249964e-05, "epoch": 2.8351206434316354, "percentage": 28.35, "elapsed_time": "1:18:38", "remaining_time": "3:18:43", "throughput": 2325.4, "total_tokens": 10971592} {"current_steps": 19040, "total_steps": 67140, "loss": 0.806, "lr": 4.504065419455193e-05, "epoch": 2.8358653559725946, "percentage": 28.36, "elapsed_time": "1:18:39", "remaining_time": "3:18:42", "throughput": 2325.47, "total_tokens": 10974696} {"current_steps": 19045, "total_steps": 67140, "loss": 0.5983, "lr": 4.503676834258798e-05, "epoch": 2.836610068513554, "percentage": 28.37, "elapsed_time": "1:18:40", "remaining_time": "3:18:40", "throughput": 2325.49, "total_tokens": 10977384} {"current_steps": 19050, "total_steps": 67140, "loss": 0.6415, "lr": 4.503288113662068e-05, "epoch": 2.837354781054513, "percentage": 28.37, "elapsed_time": "1:18:41", "remaining_time": "3:18:39", "throughput": 2325.55, "total_tokens": 10980264} {"current_steps": 19055, "total_steps": 67140, "loss": 0.6579, "lr": 4.5028992576912714e-05, "epoch": 2.838099493595472, "percentage": 28.38, "elapsed_time": "1:18:42", "remaining_time": "3:18:37", "throughput": 2325.59, "total_tokens": 10983112} {"current_steps": 19060, "total_steps": 67140, "loss": 0.7824, "lr": 4.502510266372687e-05, "epoch": 2.8388442061364314, "percentage": 28.39, "elapsed_time": "1:18:43", "remaining_time": "3:18:36", "throughput": 2325.64, "total_tokens": 10985960} {"current_steps": 19065, "total_steps": 67140, "loss": 0.5099, "lr": 4.5021211397326e-05, "epoch": 2.8395889186773906, "percentage": 28.4, "elapsed_time": "1:18:45", "remaining_time": "3:18:34", "throughput": 2325.7, "total_tokens": 10988968} {"current_steps": 19070, "total_steps": 67140, "loss": 0.7511, "lr": 4.501731877797306e-05, "epoch": 2.84033363121835, "percentage": 28.4, "elapsed_time": "1:18:46", "remaining_time": "3:18:33", "throughput": 2325.76, "total_tokens": 10991880} {"current_steps": 19075, "total_steps": 67140, "loss": 0.7486, "lr": 4.5013424805931104e-05, "epoch": 2.841078343759309, "percentage": 28.41, "elapsed_time": "1:18:47", "remaining_time": "3:18:31", "throughput": 2325.8, "total_tokens": 10994632} {"current_steps": 19080, "total_steps": 67140, "loss": 0.8078, "lr": 4.5009529481463274e-05, "epoch": 2.841823056300268, "percentage": 28.42, "elapsed_time": "1:18:48", "remaining_time": "3:18:30", "throughput": 2325.84, "total_tokens": 10997384} {"current_steps": 19085, "total_steps": 67140, "loss": 0.639, "lr": 4.5005632804832786e-05, "epoch": 2.8425677688412274, "percentage": 28.43, "elapsed_time": "1:18:49", "remaining_time": "3:18:28", "throughput": 2325.88, "total_tokens": 11000168} {"current_steps": 19090, "total_steps": 67140, "loss": 0.66, "lr": 4.500173477630298e-05, "epoch": 2.8433124813821866, "percentage": 28.43, "elapsed_time": "1:18:50", "remaining_time": "3:18:27", "throughput": 2325.94, "total_tokens": 11003144} {"current_steps": 19095, "total_steps": 67140, "loss": 0.8041, "lr": 4.499783539613726e-05, "epoch": 2.844057193923146, "percentage": 28.44, "elapsed_time": "1:18:51", "remaining_time": "3:18:25", "throughput": 2326.03, "total_tokens": 11006376} {"current_steps": 19100, "total_steps": 67140, "loss": 0.6417, "lr": 4.4993934664599116e-05, "epoch": 2.844801906464105, "percentage": 28.45, "elapsed_time": "1:18:52", "remaining_time": "3:18:24", "throughput": 2326.09, "total_tokens": 11009288} {"current_steps": 19105, "total_steps": 67140, "loss": 0.7184, "lr": 4.4990032581952166e-05, "epoch": 2.845546619005064, "percentage": 28.46, "elapsed_time": "1:18:54", "remaining_time": "3:18:22", "throughput": 2326.15, "total_tokens": 11012232} {"current_steps": 19110, "total_steps": 67140, "loss": 0.5898, "lr": 4.498612914846008e-05, "epoch": 2.8462913315460234, "percentage": 28.46, "elapsed_time": "1:18:55", "remaining_time": "3:18:21", "throughput": 2326.2, "total_tokens": 11015144} {"current_steps": 19115, "total_steps": 67140, "loss": 0.6563, "lr": 4.498222436438665e-05, "epoch": 2.847036044086982, "percentage": 28.47, "elapsed_time": "1:18:56", "remaining_time": "3:18:19", "throughput": 2326.27, "total_tokens": 11018152} {"current_steps": 19120, "total_steps": 67140, "loss": 0.8028, "lr": 4.497831822999574e-05, "epoch": 2.847780756627942, "percentage": 28.48, "elapsed_time": "1:18:57", "remaining_time": "3:18:18", "throughput": 2326.33, "total_tokens": 11021096} {"current_steps": 19125, "total_steps": 67140, "loss": 0.8063, "lr": 4.497441074555131e-05, "epoch": 2.8485254691689006, "percentage": 28.49, "elapsed_time": "1:18:58", "remaining_time": "3:18:16", "throughput": 2326.38, "total_tokens": 11023944} {"current_steps": 19130, "total_steps": 67140, "loss": 0.6133, "lr": 4.497050191131741e-05, "epoch": 2.8492701817098602, "percentage": 28.49, "elapsed_time": "1:18:59", "remaining_time": "3:18:15", "throughput": 2326.41, "total_tokens": 11026696} {"current_steps": 19135, "total_steps": 67140, "loss": 0.6381, "lr": 4.4966591727558184e-05, "epoch": 2.850014894250819, "percentage": 28.5, "elapsed_time": "1:19:00", "remaining_time": "3:18:13", "throughput": 2326.5, "total_tokens": 11029864} {"current_steps": 19140, "total_steps": 67140, "loss": 0.8244, "lr": 4.496268019453787e-05, "epoch": 2.8507596067917786, "percentage": 28.51, "elapsed_time": "1:19:02", "remaining_time": "3:18:12", "throughput": 2326.62, "total_tokens": 11033256} {"current_steps": 19145, "total_steps": 67140, "loss": 0.6974, "lr": 4.495876731252079e-05, "epoch": 2.8515043193327374, "percentage": 28.52, "elapsed_time": "1:19:03", "remaining_time": "3:18:11", "throughput": 2326.71, "total_tokens": 11036392} {"current_steps": 19150, "total_steps": 67140, "loss": 0.6813, "lr": 4.495485308177136e-05, "epoch": 2.8522490318736966, "percentage": 28.52, "elapsed_time": "1:19:04", "remaining_time": "3:18:09", "throughput": 2326.76, "total_tokens": 11039176} {"current_steps": 19155, "total_steps": 67140, "loss": 0.6211, "lr": 4.495093750255409e-05, "epoch": 2.852993744414656, "percentage": 28.53, "elapsed_time": "1:19:05", "remaining_time": "3:18:08", "throughput": 2326.84, "total_tokens": 11042280} {"current_steps": 19160, "total_steps": 67140, "loss": 0.6929, "lr": 4.494702057513358e-05, "epoch": 2.853738456955615, "percentage": 28.54, "elapsed_time": "1:19:06", "remaining_time": "3:18:06", "throughput": 2326.87, "total_tokens": 11045000} {"current_steps": 19165, "total_steps": 67140, "loss": 0.6047, "lr": 4.4943102299774513e-05, "epoch": 2.854483169496574, "percentage": 28.54, "elapsed_time": "1:19:07", "remaining_time": "3:18:05", "throughput": 2326.96, "total_tokens": 11048200} {"current_steps": 19170, "total_steps": 67140, "loss": 0.637, "lr": 4.493918267674168e-05, "epoch": 2.8552278820375334, "percentage": 28.55, "elapsed_time": "1:19:09", "remaining_time": "3:18:03", "throughput": 2327.01, "total_tokens": 11051016} {"current_steps": 19175, "total_steps": 67140, "loss": 0.7688, "lr": 4.4935261706299944e-05, "epoch": 2.8559725945784926, "percentage": 28.56, "elapsed_time": "1:19:10", "remaining_time": "3:18:02", "throughput": 2327.06, "total_tokens": 11053928} {"current_steps": 19180, "total_steps": 67140, "loss": 0.5514, "lr": 4.4931339388714276e-05, "epoch": 2.856717307119452, "percentage": 28.57, "elapsed_time": "1:19:11", "remaining_time": "3:18:00", "throughput": 2327.1, "total_tokens": 11056744} {"current_steps": 19185, "total_steps": 67140, "loss": 0.6926, "lr": 4.4927415724249735e-05, "epoch": 2.857462019660411, "percentage": 28.57, "elapsed_time": "1:19:12", "remaining_time": "3:17:59", "throughput": 2327.11, "total_tokens": 11059368} {"current_steps": 19190, "total_steps": 67140, "loss": 0.6936, "lr": 4.492349071317145e-05, "epoch": 2.8582067322013702, "percentage": 28.58, "elapsed_time": "1:19:13", "remaining_time": "3:17:57", "throughput": 2327.14, "total_tokens": 11062088} {"current_steps": 19195, "total_steps": 67140, "loss": 0.6003, "lr": 4.491956435574466e-05, "epoch": 2.8589514447423294, "percentage": 28.59, "elapsed_time": "1:19:14", "remaining_time": "3:17:56", "throughput": 2327.19, "total_tokens": 11064936} {"current_steps": 19200, "total_steps": 67140, "loss": 0.7297, "lr": 4.491563665223471e-05, "epoch": 2.8596961572832886, "percentage": 28.6, "elapsed_time": "1:19:15", "remaining_time": "3:17:54", "throughput": 2327.21, "total_tokens": 11067624} {"current_steps": 19205, "total_steps": 67140, "loss": 0.8199, "lr": 4.491170760290699e-05, "epoch": 2.860440869824248, "percentage": 28.6, "elapsed_time": "1:19:16", "remaining_time": "3:17:53", "throughput": 2327.28, "total_tokens": 11070600} {"current_steps": 19210, "total_steps": 67140, "loss": 0.7355, "lr": 4.4907777208027044e-05, "epoch": 2.861185582365207, "percentage": 28.61, "elapsed_time": "1:19:18", "remaining_time": "3:17:51", "throughput": 2327.35, "total_tokens": 11073608} {"current_steps": 19215, "total_steps": 67140, "loss": 0.6853, "lr": 4.490384546786044e-05, "epoch": 2.8619302949061662, "percentage": 28.62, "elapsed_time": "1:19:19", "remaining_time": "3:17:49", "throughput": 2327.38, "total_tokens": 11076328} {"current_steps": 19220, "total_steps": 67140, "loss": 0.6445, "lr": 4.489991238267289e-05, "epoch": 2.8626750074471254, "percentage": 28.63, "elapsed_time": "1:19:20", "remaining_time": "3:17:48", "throughput": 2327.4, "total_tokens": 11078984} {"current_steps": 19225, "total_steps": 67140, "loss": 0.6441, "lr": 4.489597795273016e-05, "epoch": 2.8634197199880846, "percentage": 28.63, "elapsed_time": "1:19:21", "remaining_time": "3:17:46", "throughput": 2327.45, "total_tokens": 11081800} {"current_steps": 19230, "total_steps": 67140, "loss": 0.6584, "lr": 4.4892042178298136e-05, "epoch": 2.864164432529044, "percentage": 28.64, "elapsed_time": "1:19:22", "remaining_time": "3:17:45", "throughput": 2327.54, "total_tokens": 11084936} {"current_steps": 19235, "total_steps": 67140, "loss": 0.8239, "lr": 4.488810505964278e-05, "epoch": 2.864909145070003, "percentage": 28.65, "elapsed_time": "1:19:23", "remaining_time": "3:17:43", "throughput": 2327.59, "total_tokens": 11087848} {"current_steps": 19240, "total_steps": 67140, "loss": 0.7525, "lr": 4.488416659703014e-05, "epoch": 2.8656538576109623, "percentage": 28.66, "elapsed_time": "1:19:24", "remaining_time": "3:17:42", "throughput": 2327.63, "total_tokens": 11090632} {"current_steps": 19245, "total_steps": 67140, "loss": 0.6153, "lr": 4.4880226790726366e-05, "epoch": 2.8663985701519215, "percentage": 28.66, "elapsed_time": "1:19:25", "remaining_time": "3:17:40", "throughput": 2327.69, "total_tokens": 11093640} {"current_steps": 19250, "total_steps": 67140, "loss": 0.5943, "lr": 4.4876285640997694e-05, "epoch": 2.8671432826928807, "percentage": 28.67, "elapsed_time": "1:19:27", "remaining_time": "3:17:39", "throughput": 2327.69, "total_tokens": 11096168} {"current_steps": 19255, "total_steps": 67140, "loss": 0.6046, "lr": 4.487234314811044e-05, "epoch": 2.86788799523384, "percentage": 28.68, "elapsed_time": "1:19:28", "remaining_time": "3:17:37", "throughput": 2327.72, "total_tokens": 11098920} {"current_steps": 19260, "total_steps": 67140, "loss": 0.6619, "lr": 4.486839931233104e-05, "epoch": 2.868632707774799, "percentage": 28.69, "elapsed_time": "1:19:29", "remaining_time": "3:17:36", "throughput": 2327.79, "total_tokens": 11101896} {"current_steps": 19265, "total_steps": 67140, "loss": 0.6768, "lr": 4.486445413392599e-05, "epoch": 2.8693774203157583, "percentage": 28.69, "elapsed_time": "1:19:30", "remaining_time": "3:17:34", "throughput": 2327.86, "total_tokens": 11104936} {"current_steps": 19270, "total_steps": 67140, "loss": 0.559, "lr": 4.48605076131619e-05, "epoch": 2.8701221328567175, "percentage": 28.7, "elapsed_time": "1:19:31", "remaining_time": "3:17:33", "throughput": 2327.91, "total_tokens": 11107816} {"current_steps": 19275, "total_steps": 67140, "loss": 0.6214, "lr": 4.485655975030545e-05, "epoch": 2.8708668453976767, "percentage": 28.71, "elapsed_time": "1:19:32", "remaining_time": "3:17:31", "throughput": 2327.93, "total_tokens": 11110440} {"current_steps": 19280, "total_steps": 67140, "loss": 0.7715, "lr": 4.485261054562342e-05, "epoch": 2.8716115579386354, "percentage": 28.72, "elapsed_time": "1:19:33", "remaining_time": "3:17:30", "throughput": 2327.97, "total_tokens": 11113288} {"current_steps": 19285, "total_steps": 67140, "loss": 0.635, "lr": 4.484865999938268e-05, "epoch": 2.872356270479595, "percentage": 28.72, "elapsed_time": "1:19:34", "remaining_time": "3:17:28", "throughput": 2327.99, "total_tokens": 11116008} {"current_steps": 19290, "total_steps": 67140, "loss": 0.6744, "lr": 4.4844708111850195e-05, "epoch": 2.873100983020554, "percentage": 28.73, "elapsed_time": "1:19:36", "remaining_time": "3:17:27", "throughput": 2328.06, "total_tokens": 11119016} {"current_steps": 19295, "total_steps": 67140, "loss": 0.7233, "lr": 4.4840754883293025e-05, "epoch": 2.8738456955615135, "percentage": 28.74, "elapsed_time": "1:19:37", "remaining_time": "3:17:25", "throughput": 2328.09, "total_tokens": 11121768} {"current_steps": 19300, "total_steps": 67140, "loss": 0.5869, "lr": 4.483680031397831e-05, "epoch": 2.8745904081024722, "percentage": 28.75, "elapsed_time": "1:19:38", "remaining_time": "3:17:24", "throughput": 2328.13, "total_tokens": 11124552} {"current_steps": 19305, "total_steps": 67140, "loss": 0.6719, "lr": 4.4832844404173266e-05, "epoch": 2.875335120643432, "percentage": 28.75, "elapsed_time": "1:19:39", "remaining_time": "3:17:22", "throughput": 2328.18, "total_tokens": 11127464} {"current_steps": 19310, "total_steps": 67140, "loss": 0.7438, "lr": 4.482888715414525e-05, "epoch": 2.8760798331843906, "percentage": 28.76, "elapsed_time": "1:19:40", "remaining_time": "3:17:21", "throughput": 2328.25, "total_tokens": 11130472} {"current_steps": 19315, "total_steps": 67140, "loss": 0.6187, "lr": 4.482492856416165e-05, "epoch": 2.8768245457253503, "percentage": 28.77, "elapsed_time": "1:19:41", "remaining_time": "3:17:19", "throughput": 2328.26, "total_tokens": 11133064} {"current_steps": 19320, "total_steps": 67140, "loss": 0.6081, "lr": 4.482096863448998e-05, "epoch": 2.877569258266309, "percentage": 28.78, "elapsed_time": "1:19:42", "remaining_time": "3:17:18", "throughput": 2328.33, "total_tokens": 11136136} {"current_steps": 19325, "total_steps": 67140, "loss": 0.6194, "lr": 4.481700736539784e-05, "epoch": 2.8783139708072683, "percentage": 28.78, "elapsed_time": "1:19:44", "remaining_time": "3:17:16", "throughput": 2328.38, "total_tokens": 11138984} {"current_steps": 19330, "total_steps": 67140, "loss": 0.6274, "lr": 4.48130447571529e-05, "epoch": 2.8790586833482275, "percentage": 28.79, "elapsed_time": "1:19:45", "remaining_time": "3:17:15", "throughput": 2328.45, "total_tokens": 11141992} {"current_steps": 19335, "total_steps": 67140, "loss": 0.4918, "lr": 4.480908081002296e-05, "epoch": 2.8798033958891867, "percentage": 28.8, "elapsed_time": "1:19:46", "remaining_time": "3:17:13", "throughput": 2328.49, "total_tokens": 11144872} {"current_steps": 19340, "total_steps": 67140, "loss": 0.7153, "lr": 4.480511552427587e-05, "epoch": 2.880548108430146, "percentage": 28.81, "elapsed_time": "1:19:47", "remaining_time": "3:17:12", "throughput": 2328.55, "total_tokens": 11147848} {"current_steps": 19345, "total_steps": 67140, "loss": 0.6557, "lr": 4.48011489001796e-05, "epoch": 2.881292820971105, "percentage": 28.81, "elapsed_time": "1:19:48", "remaining_time": "3:17:10", "throughput": 2328.57, "total_tokens": 11150536} {"current_steps": 19350, "total_steps": 67140, "loss": 0.5512, "lr": 4.479718093800219e-05, "epoch": 2.8820375335120643, "percentage": 28.82, "elapsed_time": "1:19:49", "remaining_time": "3:17:09", "throughput": 2328.63, "total_tokens": 11153448} {"current_steps": 19355, "total_steps": 67140, "loss": 0.6157, "lr": 4.4793211638011786e-05, "epoch": 2.8827822460530235, "percentage": 28.83, "elapsed_time": "1:19:50", "remaining_time": "3:17:07", "throughput": 2328.64, "total_tokens": 11156040} {"current_steps": 19360, "total_steps": 67140, "loss": 0.5591, "lr": 4.478924100047661e-05, "epoch": 2.8835269585939827, "percentage": 28.84, "elapsed_time": "1:19:51", "remaining_time": "3:17:06", "throughput": 2328.72, "total_tokens": 11159112} {"current_steps": 19365, "total_steps": 67140, "loss": 0.8111, "lr": 4.478526902566498e-05, "epoch": 2.884271671134942, "percentage": 28.84, "elapsed_time": "1:19:53", "remaining_time": "3:17:04", "throughput": 2328.78, "total_tokens": 11162088} {"current_steps": 19370, "total_steps": 67140, "loss": 0.5491, "lr": 4.4781295713845314e-05, "epoch": 2.885016383675901, "percentage": 28.85, "elapsed_time": "1:19:54", "remaining_time": "3:17:03", "throughput": 2328.83, "total_tokens": 11164936} {"current_steps": 19375, "total_steps": 67140, "loss": 0.6925, "lr": 4.477732106528611e-05, "epoch": 2.8857610962168603, "percentage": 28.86, "elapsed_time": "1:19:55", "remaining_time": "3:17:01", "throughput": 2328.87, "total_tokens": 11167784} {"current_steps": 19380, "total_steps": 67140, "loss": 0.7392, "lr": 4.4773345080255955e-05, "epoch": 2.8865058087578195, "percentage": 28.87, "elapsed_time": "1:19:56", "remaining_time": "3:17:00", "throughput": 2328.99, "total_tokens": 11171144} {"current_steps": 19385, "total_steps": 67140, "loss": 0.6984, "lr": 4.4769367759023536e-05, "epoch": 2.8872505212987787, "percentage": 28.87, "elapsed_time": "1:19:57", "remaining_time": "3:16:59", "throughput": 2329.07, "total_tokens": 11174312} {"current_steps": 19390, "total_steps": 67140, "loss": 0.6656, "lr": 4.4765389101857616e-05, "epoch": 2.887995233839738, "percentage": 28.88, "elapsed_time": "1:19:58", "remaining_time": "3:16:58", "throughput": 2329.18, "total_tokens": 11177704} {"current_steps": 19395, "total_steps": 67140, "loss": 0.6187, "lr": 4.4761409109027065e-05, "epoch": 2.888739946380697, "percentage": 28.89, "elapsed_time": "1:20:00", "remaining_time": "3:16:56", "throughput": 2329.26, "total_tokens": 11180808} {"current_steps": 19400, "total_steps": 67140, "loss": 0.7377, "lr": 4.4757427780800825e-05, "epoch": 2.8894846589216563, "percentage": 28.89, "elapsed_time": "1:20:01", "remaining_time": "3:16:55", "throughput": 2329.31, "total_tokens": 11183656} {"current_steps": 19405, "total_steps": 67140, "loss": 0.6785, "lr": 4.475344511744794e-05, "epoch": 2.8902293714626155, "percentage": 28.9, "elapsed_time": "1:20:02", "remaining_time": "3:16:53", "throughput": 2329.36, "total_tokens": 11186568} {"current_steps": 19410, "total_steps": 67140, "loss": 0.682, "lr": 4.4749461119237555e-05, "epoch": 2.8909740840035747, "percentage": 28.91, "elapsed_time": "1:20:03", "remaining_time": "3:16:52", "throughput": 2329.38, "total_tokens": 11189224} {"current_steps": 19415, "total_steps": 67140, "loss": 0.7662, "lr": 4.4745475786438886e-05, "epoch": 2.891718796544534, "percentage": 28.92, "elapsed_time": "1:20:04", "remaining_time": "3:16:50", "throughput": 2329.43, "total_tokens": 11192072} {"current_steps": 19420, "total_steps": 67140, "loss": 0.689, "lr": 4.4741489119321235e-05, "epoch": 2.892463509085493, "percentage": 28.92, "elapsed_time": "1:20:05", "remaining_time": "3:16:49", "throughput": 2329.53, "total_tokens": 11195304} {"current_steps": 19425, "total_steps": 67140, "loss": 0.6073, "lr": 4.4737501118154014e-05, "epoch": 2.8932082216264523, "percentage": 28.93, "elapsed_time": "1:20:06", "remaining_time": "3:16:47", "throughput": 2329.58, "total_tokens": 11198248} {"current_steps": 19430, "total_steps": 67140, "loss": 0.7378, "lr": 4.473351178320671e-05, "epoch": 2.8939529341674115, "percentage": 28.94, "elapsed_time": "1:20:08", "remaining_time": "3:16:46", "throughput": 2329.6, "total_tokens": 11200872} {"current_steps": 19435, "total_steps": 67140, "loss": 0.6804, "lr": 4.472952111474892e-05, "epoch": 2.8946976467083707, "percentage": 28.95, "elapsed_time": "1:20:09", "remaining_time": "3:16:44", "throughput": 2329.64, "total_tokens": 11203688} {"current_steps": 19440, "total_steps": 67140, "loss": 0.6558, "lr": 4.47255291130503e-05, "epoch": 2.89544235924933, "percentage": 28.95, "elapsed_time": "1:20:10", "remaining_time": "3:16:43", "throughput": 2329.72, "total_tokens": 11206728} {"current_steps": 19445, "total_steps": 67140, "loss": 0.6568, "lr": 4.472153577838062e-05, "epoch": 2.896187071790289, "percentage": 28.96, "elapsed_time": "1:20:11", "remaining_time": "3:16:41", "throughput": 2329.76, "total_tokens": 11209544} {"current_steps": 19450, "total_steps": 67140, "loss": 0.8088, "lr": 4.471754111100974e-05, "epoch": 2.8969317843312483, "percentage": 28.97, "elapsed_time": "1:20:12", "remaining_time": "3:16:40", "throughput": 2329.81, "total_tokens": 11212328} {"current_steps": 19455, "total_steps": 67140, "loss": 0.7508, "lr": 4.471354511120759e-05, "epoch": 2.897676496872207, "percentage": 28.98, "elapsed_time": "1:20:13", "remaining_time": "3:16:38", "throughput": 2329.83, "total_tokens": 11215016} {"current_steps": 19460, "total_steps": 67140, "loss": 0.7926, "lr": 4.470954777924421e-05, "epoch": 2.8984212094131667, "percentage": 28.98, "elapsed_time": "1:20:14", "remaining_time": "3:16:36", "throughput": 2329.86, "total_tokens": 11217736} {"current_steps": 19465, "total_steps": 67140, "loss": 0.5963, "lr": 4.4705549115389735e-05, "epoch": 2.8991659219541255, "percentage": 28.99, "elapsed_time": "1:20:15", "remaining_time": "3:16:35", "throughput": 2329.9, "total_tokens": 11220616} {"current_steps": 19470, "total_steps": 67140, "loss": 0.623, "lr": 4.470154911991435e-05, "epoch": 2.899910634495085, "percentage": 29.0, "elapsed_time": "1:20:17", "remaining_time": "3:16:33", "throughput": 2329.93, "total_tokens": 11223336} {"current_steps": 19475, "total_steps": 67140, "loss": 0.6382, "lr": 4.469754779308839e-05, "epoch": 2.900655347036044, "percentage": 29.01, "elapsed_time": "1:20:18", "remaining_time": "3:16:32", "throughput": 2330.0, "total_tokens": 11226376} {"current_steps": 19480, "total_steps": 67140, "loss": 0.7202, "lr": 4.4693545135182235e-05, "epoch": 2.9014000595770035, "percentage": 29.01, "elapsed_time": "1:20:19", "remaining_time": "3:16:30", "throughput": 2330.01, "total_tokens": 11229000} {"current_steps": 19485, "total_steps": 67140, "loss": 0.7024, "lr": 4.468954114646637e-05, "epoch": 2.9021447721179623, "percentage": 29.02, "elapsed_time": "1:20:20", "remaining_time": "3:16:29", "throughput": 2330.1, "total_tokens": 11232200} {"current_steps": 19490, "total_steps": 67140, "loss": 0.6159, "lr": 4.468553582721135e-05, "epoch": 2.9028894846589215, "percentage": 29.03, "elapsed_time": "1:20:21", "remaining_time": "3:16:28", "throughput": 2330.14, "total_tokens": 11235048} {"current_steps": 19495, "total_steps": 67140, "loss": 0.6754, "lr": 4.4681529177687876e-05, "epoch": 2.9036341971998807, "percentage": 29.04, "elapsed_time": "1:20:22", "remaining_time": "3:16:26", "throughput": 2330.17, "total_tokens": 11237768} {"current_steps": 19500, "total_steps": 67140, "loss": 0.6632, "lr": 4.467752119816667e-05, "epoch": 2.90437890974084, "percentage": 29.04, "elapsed_time": "1:20:23", "remaining_time": "3:16:25", "throughput": 2330.22, "total_tokens": 11240680} {"current_steps": 19505, "total_steps": 67140, "loss": 0.5289, "lr": 4.467351188891858e-05, "epoch": 2.905123622281799, "percentage": 29.05, "elapsed_time": "1:20:25", "remaining_time": "3:16:23", "throughput": 2330.28, "total_tokens": 11243688} {"current_steps": 19510, "total_steps": 67140, "loss": 0.4815, "lr": 4.466950125021455e-05, "epoch": 2.9058683348227583, "percentage": 29.06, "elapsed_time": "1:20:26", "remaining_time": "3:16:22", "throughput": 2330.31, "total_tokens": 11246408} {"current_steps": 19515, "total_steps": 67140, "loss": 0.7512, "lr": 4.466548928232559e-05, "epoch": 2.9066130473637175, "percentage": 29.07, "elapsed_time": "1:20:27", "remaining_time": "3:16:20", "throughput": 2330.38, "total_tokens": 11249512} {"current_steps": 19520, "total_steps": 67140, "loss": 0.657, "lr": 4.4661475985522825e-05, "epoch": 2.9073577599046767, "percentage": 29.07, "elapsed_time": "1:20:28", "remaining_time": "3:16:19", "throughput": 2330.43, "total_tokens": 11252392} {"current_steps": 19525, "total_steps": 67140, "loss": 0.5859, "lr": 4.4657461360077444e-05, "epoch": 2.908102472445636, "percentage": 29.08, "elapsed_time": "1:20:29", "remaining_time": "3:16:17", "throughput": 2330.47, "total_tokens": 11255240} {"current_steps": 19530, "total_steps": 67140, "loss": 0.5207, "lr": 4.4653445406260744e-05, "epoch": 2.908847184986595, "percentage": 29.09, "elapsed_time": "1:20:30", "remaining_time": "3:16:16", "throughput": 2330.5, "total_tokens": 11257928} {"current_steps": 19535, "total_steps": 67140, "loss": 0.7392, "lr": 4.4649428124344114e-05, "epoch": 2.9095918975275543, "percentage": 29.1, "elapsed_time": "1:20:31", "remaining_time": "3:16:14", "throughput": 2330.54, "total_tokens": 11260744} {"current_steps": 19540, "total_steps": 67140, "loss": 0.6362, "lr": 4.464540951459902e-05, "epoch": 2.9103366100685135, "percentage": 29.1, "elapsed_time": "1:20:32", "remaining_time": "3:16:13", "throughput": 2330.58, "total_tokens": 11263560} {"current_steps": 19545, "total_steps": 67140, "loss": 0.5321, "lr": 4.464138957729702e-05, "epoch": 2.9110813226094727, "percentage": 29.11, "elapsed_time": "1:20:34", "remaining_time": "3:16:11", "throughput": 2330.58, "total_tokens": 11266120} {"current_steps": 19550, "total_steps": 67140, "loss": 0.6835, "lr": 4.463736831270977e-05, "epoch": 2.911826035150432, "percentage": 29.12, "elapsed_time": "1:20:35", "remaining_time": "3:16:10", "throughput": 2330.64, "total_tokens": 11269032} {"current_steps": 19555, "total_steps": 67140, "loss": 0.7322, "lr": 4.463334572110901e-05, "epoch": 2.912570747691391, "percentage": 29.13, "elapsed_time": "1:20:36", "remaining_time": "3:16:08", "throughput": 2330.69, "total_tokens": 11271976} {"current_steps": 19560, "total_steps": 67140, "loss": 0.6879, "lr": 4.462932180276657e-05, "epoch": 2.9133154602323503, "percentage": 29.13, "elapsed_time": "1:20:37", "remaining_time": "3:16:07", "throughput": 2330.78, "total_tokens": 11275112} {"current_steps": 19565, "total_steps": 67140, "loss": 0.5367, "lr": 4.462529655795437e-05, "epoch": 2.9140601727733095, "percentage": 29.14, "elapsed_time": "1:20:38", "remaining_time": "3:16:05", "throughput": 2330.81, "total_tokens": 11277864} {"current_steps": 19570, "total_steps": 67140, "loss": 0.6477, "lr": 4.462126998694442e-05, "epoch": 2.9148048853142687, "percentage": 29.15, "elapsed_time": "1:20:39", "remaining_time": "3:16:04", "throughput": 2330.85, "total_tokens": 11280648} {"current_steps": 19575, "total_steps": 67140, "loss": 0.8943, "lr": 4.4617242090008816e-05, "epoch": 2.915549597855228, "percentage": 29.16, "elapsed_time": "1:20:40", "remaining_time": "3:16:02", "throughput": 2330.87, "total_tokens": 11283304} {"current_steps": 19580, "total_steps": 67140, "loss": 0.7892, "lr": 4.461321286741975e-05, "epoch": 2.916294310396187, "percentage": 29.16, "elapsed_time": "1:20:41", "remaining_time": "3:16:01", "throughput": 2330.91, "total_tokens": 11286120} {"current_steps": 19585, "total_steps": 67140, "loss": 0.676, "lr": 4.46091823194495e-05, "epoch": 2.9170390229371463, "percentage": 29.17, "elapsed_time": "1:20:43", "remaining_time": "3:15:59", "throughput": 2330.93, "total_tokens": 11288904} {"current_steps": 19590, "total_steps": 67140, "loss": 0.7358, "lr": 4.460515044637043e-05, "epoch": 2.9177837354781055, "percentage": 29.18, "elapsed_time": "1:20:44", "remaining_time": "3:15:58", "throughput": 2330.96, "total_tokens": 11291688} {"current_steps": 19595, "total_steps": 67140, "loss": 0.6913, "lr": 4.460111724845501e-05, "epoch": 2.9185284480190647, "percentage": 29.19, "elapsed_time": "1:20:45", "remaining_time": "3:15:56", "throughput": 2331.06, "total_tokens": 11294888} {"current_steps": 19600, "total_steps": 67140, "loss": 0.6813, "lr": 4.4597082725975775e-05, "epoch": 2.919273160560024, "percentage": 29.19, "elapsed_time": "1:20:46", "remaining_time": "3:15:55", "throughput": 2331.1, "total_tokens": 11297704} {"current_steps": 19605, "total_steps": 67140, "loss": 0.6343, "lr": 4.459304687920536e-05, "epoch": 2.920017873100983, "percentage": 29.2, "elapsed_time": "1:20:47", "remaining_time": "3:15:53", "throughput": 2331.16, "total_tokens": 11300680} {"current_steps": 19610, "total_steps": 67140, "loss": 0.5573, "lr": 4.458900970841651e-05, "epoch": 2.9207625856419424, "percentage": 29.21, "elapsed_time": "1:20:48", "remaining_time": "3:15:52", "throughput": 2331.22, "total_tokens": 11303592} {"current_steps": 19615, "total_steps": 67140, "loss": 0.5805, "lr": 4.4584971213882014e-05, "epoch": 2.9215072981829016, "percentage": 29.22, "elapsed_time": "1:20:49", "remaining_time": "3:15:50", "throughput": 2331.23, "total_tokens": 11306216} {"current_steps": 19620, "total_steps": 67140, "loss": 0.6256, "lr": 4.458093139587479e-05, "epoch": 2.9222520107238603, "percentage": 29.22, "elapsed_time": "1:20:51", "remaining_time": "3:15:49", "throughput": 2331.27, "total_tokens": 11309064} {"current_steps": 19625, "total_steps": 67140, "loss": 0.7903, "lr": 4.4576890254667844e-05, "epoch": 2.92299672326482, "percentage": 29.23, "elapsed_time": "1:20:52", "remaining_time": "3:15:47", "throughput": 2331.31, "total_tokens": 11311848} {"current_steps": 19630, "total_steps": 67140, "loss": 0.6465, "lr": 4.457284779053423e-05, "epoch": 2.9237414358057787, "percentage": 29.24, "elapsed_time": "1:20:53", "remaining_time": "3:15:46", "throughput": 2331.37, "total_tokens": 11314792} {"current_steps": 19635, "total_steps": 67140, "loss": 0.7324, "lr": 4.4568804003747155e-05, "epoch": 2.9244861483467384, "percentage": 29.24, "elapsed_time": "1:20:54", "remaining_time": "3:15:44", "throughput": 2331.38, "total_tokens": 11317416} {"current_steps": 19640, "total_steps": 67140, "loss": 0.6521, "lr": 4.4564758894579863e-05, "epoch": 2.925230860887697, "percentage": 29.25, "elapsed_time": "1:20:55", "remaining_time": "3:15:43", "throughput": 2331.42, "total_tokens": 11320232} {"current_steps": 19645, "total_steps": 67140, "loss": 0.577, "lr": 4.456071246330571e-05, "epoch": 2.9259755734286568, "percentage": 29.26, "elapsed_time": "1:20:56", "remaining_time": "3:15:41", "throughput": 2331.5, "total_tokens": 11323304} {"current_steps": 19650, "total_steps": 67140, "loss": 0.6795, "lr": 4.455666471019814e-05, "epoch": 2.9267202859696155, "percentage": 29.27, "elapsed_time": "1:20:57", "remaining_time": "3:15:40", "throughput": 2331.55, "total_tokens": 11326216} {"current_steps": 19655, "total_steps": 67140, "loss": 0.6471, "lr": 4.455261563553067e-05, "epoch": 2.927464998510575, "percentage": 29.27, "elapsed_time": "1:20:58", "remaining_time": "3:15:38", "throughput": 2331.62, "total_tokens": 11329288} {"current_steps": 19660, "total_steps": 67140, "loss": 0.7028, "lr": 4.454856523957694e-05, "epoch": 2.928209711051534, "percentage": 29.28, "elapsed_time": "1:21:00", "remaining_time": "3:15:37", "throughput": 2331.66, "total_tokens": 11332136} {"current_steps": 19665, "total_steps": 67140, "loss": 0.7237, "lr": 4.4544513522610644e-05, "epoch": 2.928954423592493, "percentage": 29.29, "elapsed_time": "1:21:01", "remaining_time": "3:15:35", "throughput": 2331.71, "total_tokens": 11334952} {"current_steps": 19670, "total_steps": 67140, "loss": 0.5897, "lr": 4.454046048490559e-05, "epoch": 2.9296991361334523, "percentage": 29.3, "elapsed_time": "1:21:02", "remaining_time": "3:15:34", "throughput": 2331.74, "total_tokens": 11337736} {"current_steps": 19675, "total_steps": 67140, "loss": 0.7176, "lr": 4.4536406126735664e-05, "epoch": 2.9304438486744115, "percentage": 29.3, "elapsed_time": "1:21:03", "remaining_time": "3:15:32", "throughput": 2331.78, "total_tokens": 11340552} {"current_steps": 19680, "total_steps": 67140, "loss": 0.6776, "lr": 4.4532350448374835e-05, "epoch": 2.9311885612153707, "percentage": 29.31, "elapsed_time": "1:21:04", "remaining_time": "3:15:31", "throughput": 2331.83, "total_tokens": 11343464} {"current_steps": 19685, "total_steps": 67140, "loss": 0.7148, "lr": 4.452829345009718e-05, "epoch": 2.93193327375633, "percentage": 29.32, "elapsed_time": "1:21:05", "remaining_time": "3:15:29", "throughput": 2331.88, "total_tokens": 11346312} {"current_steps": 19690, "total_steps": 67140, "loss": 0.6864, "lr": 4.452423513217685e-05, "epoch": 2.932677986297289, "percentage": 29.33, "elapsed_time": "1:21:06", "remaining_time": "3:15:28", "throughput": 2331.93, "total_tokens": 11349192} {"current_steps": 19695, "total_steps": 67140, "loss": 0.6214, "lr": 4.4520175494888086e-05, "epoch": 2.9334226988382484, "percentage": 29.33, "elapsed_time": "1:21:07", "remaining_time": "3:15:26", "throughput": 2331.97, "total_tokens": 11352008} {"current_steps": 19700, "total_steps": 67140, "loss": 0.6006, "lr": 4.4516114538505225e-05, "epoch": 2.9341674113792076, "percentage": 29.34, "elapsed_time": "1:21:09", "remaining_time": "3:15:25", "throughput": 2332.03, "total_tokens": 11354984} {"current_steps": 19705, "total_steps": 67140, "loss": 0.6244, "lr": 4.45120522633027e-05, "epoch": 2.9349121239201668, "percentage": 29.35, "elapsed_time": "1:21:10", "remaining_time": "3:15:24", "throughput": 2332.08, "total_tokens": 11357864} {"current_steps": 19710, "total_steps": 67140, "loss": 0.8144, "lr": 4.4507988669555e-05, "epoch": 2.935656836461126, "percentage": 29.36, "elapsed_time": "1:21:11", "remaining_time": "3:15:22", "throughput": 2332.1, "total_tokens": 11360552} {"current_steps": 19715, "total_steps": 67140, "loss": 0.6137, "lr": 4.450392375753675e-05, "epoch": 2.936401549002085, "percentage": 29.36, "elapsed_time": "1:21:12", "remaining_time": "3:15:20", "throughput": 2332.12, "total_tokens": 11363208} {"current_steps": 19720, "total_steps": 67140, "loss": 0.8258, "lr": 4.449985752752261e-05, "epoch": 2.9371462615430444, "percentage": 29.37, "elapsed_time": "1:21:13", "remaining_time": "3:15:19", "throughput": 2332.18, "total_tokens": 11366152} {"current_steps": 19725, "total_steps": 67140, "loss": 0.734, "lr": 4.44957899797874e-05, "epoch": 2.9378909740840036, "percentage": 29.38, "elapsed_time": "1:21:14", "remaining_time": "3:15:17", "throughput": 2332.22, "total_tokens": 11369000} {"current_steps": 19730, "total_steps": 67140, "loss": 0.69, "lr": 4.449172111460597e-05, "epoch": 2.9386356866249628, "percentage": 29.39, "elapsed_time": "1:21:15", "remaining_time": "3:15:16", "throughput": 2332.26, "total_tokens": 11371784} {"current_steps": 19735, "total_steps": 67140, "loss": 0.7051, "lr": 4.448765093225326e-05, "epoch": 2.939380399165922, "percentage": 29.39, "elapsed_time": "1:21:17", "remaining_time": "3:15:15", "throughput": 2332.33, "total_tokens": 11374856} {"current_steps": 19740, "total_steps": 67140, "loss": 0.6556, "lr": 4.448357943300434e-05, "epoch": 2.940125111706881, "percentage": 29.4, "elapsed_time": "1:21:18", "remaining_time": "3:15:13", "throughput": 2332.39, "total_tokens": 11377800} {"current_steps": 19745, "total_steps": 67140, "loss": 0.594, "lr": 4.4479506617134324e-05, "epoch": 2.9408698242478404, "percentage": 29.41, "elapsed_time": "1:21:19", "remaining_time": "3:15:11", "throughput": 2332.39, "total_tokens": 11380360} {"current_steps": 19750, "total_steps": 67140, "loss": 0.6536, "lr": 4.447543248491846e-05, "epoch": 2.9416145367887996, "percentage": 29.42, "elapsed_time": "1:21:20", "remaining_time": "3:15:10", "throughput": 2332.49, "total_tokens": 11383624} {"current_steps": 19755, "total_steps": 67140, "loss": 0.7118, "lr": 4.447135703663205e-05, "epoch": 2.942359249329759, "percentage": 29.42, "elapsed_time": "1:21:21", "remaining_time": "3:15:09", "throughput": 2332.54, "total_tokens": 11386568} {"current_steps": 19760, "total_steps": 67140, "loss": 0.6514, "lr": 4.4467280272550495e-05, "epoch": 2.943103961870718, "percentage": 29.43, "elapsed_time": "1:21:22", "remaining_time": "3:15:07", "throughput": 2332.61, "total_tokens": 11389608} {"current_steps": 19765, "total_steps": 67140, "loss": 0.6279, "lr": 4.4463202192949284e-05, "epoch": 2.943848674411677, "percentage": 29.44, "elapsed_time": "1:21:24", "remaining_time": "3:15:06", "throughput": 2332.8, "total_tokens": 11393768} {"current_steps": 19770, "total_steps": 67140, "loss": 0.6903, "lr": 4.4459122798104004e-05, "epoch": 2.9445933869526364, "percentage": 29.45, "elapsed_time": "1:21:25", "remaining_time": "3:15:05", "throughput": 2332.88, "total_tokens": 11396840} {"current_steps": 19775, "total_steps": 67140, "loss": 0.7113, "lr": 4.445504208829032e-05, "epoch": 2.9453380994935956, "percentage": 29.45, "elapsed_time": "1:21:26", "remaining_time": "3:15:04", "throughput": 2332.94, "total_tokens": 11399848} {"current_steps": 19780, "total_steps": 67140, "loss": 0.7173, "lr": 4.445096006378399e-05, "epoch": 2.946082812034555, "percentage": 29.46, "elapsed_time": "1:21:27", "remaining_time": "3:15:02", "throughput": 2333.02, "total_tokens": 11403016} {"current_steps": 19785, "total_steps": 67140, "loss": 0.7427, "lr": 4.4446876724860856e-05, "epoch": 2.946827524575514, "percentage": 29.47, "elapsed_time": "1:21:28", "remaining_time": "3:15:01", "throughput": 2333.07, "total_tokens": 11405960} {"current_steps": 19790, "total_steps": 67140, "loss": 0.6333, "lr": 4.444279207179687e-05, "epoch": 2.947572237116473, "percentage": 29.48, "elapsed_time": "1:21:29", "remaining_time": "3:14:59", "throughput": 2333.11, "total_tokens": 11408776} {"current_steps": 19795, "total_steps": 67140, "loss": 0.5618, "lr": 4.443870610486803e-05, "epoch": 2.948316949657432, "percentage": 29.48, "elapsed_time": "1:21:31", "remaining_time": "3:14:58", "throughput": 2333.18, "total_tokens": 11411784} {"current_steps": 19800, "total_steps": 67140, "loss": 0.7268, "lr": 4.4434618824350475e-05, "epoch": 2.9490616621983916, "percentage": 29.49, "elapsed_time": "1:21:32", "remaining_time": "3:14:56", "throughput": 2333.16, "total_tokens": 11414248} {"current_steps": 19805, "total_steps": 67140, "loss": 0.5883, "lr": 4.4430530230520386e-05, "epoch": 2.9498063747393504, "percentage": 29.5, "elapsed_time": "1:21:33", "remaining_time": "3:14:55", "throughput": 2333.2, "total_tokens": 11417032} {"current_steps": 19810, "total_steps": 67140, "loss": 0.8058, "lr": 4.442644032365407e-05, "epoch": 2.95055108728031, "percentage": 29.51, "elapsed_time": "1:21:34", "remaining_time": "3:14:53", "throughput": 2333.23, "total_tokens": 11419784} {"current_steps": 19815, "total_steps": 67140, "loss": 0.6455, "lr": 4.4422349104027895e-05, "epoch": 2.9512957998212688, "percentage": 29.51, "elapsed_time": "1:21:35", "remaining_time": "3:14:52", "throughput": 2333.29, "total_tokens": 11422792} {"current_steps": 19820, "total_steps": 67140, "loss": 0.549, "lr": 4.4418256571918334e-05, "epoch": 2.9520405123622284, "percentage": 29.52, "elapsed_time": "1:21:36", "remaining_time": "3:14:50", "throughput": 2333.34, "total_tokens": 11425736} {"current_steps": 19825, "total_steps": 67140, "loss": 0.6279, "lr": 4.441416272760194e-05, "epoch": 2.952785224903187, "percentage": 29.53, "elapsed_time": "1:21:37", "remaining_time": "3:14:49", "throughput": 2333.36, "total_tokens": 11428360} {"current_steps": 19830, "total_steps": 67140, "loss": 0.6964, "lr": 4.441006757135536e-05, "epoch": 2.953529937444147, "percentage": 29.54, "elapsed_time": "1:21:38", "remaining_time": "3:14:47", "throughput": 2333.4, "total_tokens": 11431176} {"current_steps": 19835, "total_steps": 67140, "loss": 0.6761, "lr": 4.440597110345533e-05, "epoch": 2.9542746499851056, "percentage": 29.54, "elapsed_time": "1:21:40", "remaining_time": "3:14:46", "throughput": 2333.46, "total_tokens": 11434184} {"current_steps": 19840, "total_steps": 67140, "loss": 0.5807, "lr": 4.4401873324178684e-05, "epoch": 2.955019362526065, "percentage": 29.55, "elapsed_time": "1:21:41", "remaining_time": "3:14:44", "throughput": 2333.53, "total_tokens": 11437224} {"current_steps": 19845, "total_steps": 67140, "loss": 0.6306, "lr": 4.439777423380231e-05, "epoch": 2.955764075067024, "percentage": 29.56, "elapsed_time": "1:21:42", "remaining_time": "3:14:43", "throughput": 2333.54, "total_tokens": 11439816} {"current_steps": 19850, "total_steps": 67140, "loss": 0.6448, "lr": 4.439367383260322e-05, "epoch": 2.956508787607983, "percentage": 29.57, "elapsed_time": "1:21:43", "remaining_time": "3:14:41", "throughput": 2333.57, "total_tokens": 11442536} {"current_steps": 19855, "total_steps": 67140, "loss": 0.6099, "lr": 4.4389572120858506e-05, "epoch": 2.9572535001489424, "percentage": 29.57, "elapsed_time": "1:21:44", "remaining_time": "3:14:40", "throughput": 2333.66, "total_tokens": 11445800} {"current_steps": 19860, "total_steps": 67140, "loss": 0.6671, "lr": 4.4385469098845335e-05, "epoch": 2.9579982126899016, "percentage": 29.58, "elapsed_time": "1:21:45", "remaining_time": "3:14:38", "throughput": 2333.67, "total_tokens": 11448424} {"current_steps": 19865, "total_steps": 67140, "loss": 0.4793, "lr": 4.438136476684098e-05, "epoch": 2.958742925230861, "percentage": 29.59, "elapsed_time": "1:21:46", "remaining_time": "3:14:37", "throughput": 2333.71, "total_tokens": 11451240} {"current_steps": 19870, "total_steps": 67140, "loss": 0.7508, "lr": 4.4377259125122786e-05, "epoch": 2.95948763777182, "percentage": 29.59, "elapsed_time": "1:21:48", "remaining_time": "3:14:35", "throughput": 2333.77, "total_tokens": 11454184} {"current_steps": 19875, "total_steps": 67140, "loss": 0.7261, "lr": 4.4373152173968214e-05, "epoch": 2.960232350312779, "percentage": 29.6, "elapsed_time": "1:21:49", "remaining_time": "3:14:34", "throughput": 2333.77, "total_tokens": 11456712} {"current_steps": 19880, "total_steps": 67140, "loss": 0.5706, "lr": 4.436904391365477e-05, "epoch": 2.9609770628537384, "percentage": 29.61, "elapsed_time": "1:21:50", "remaining_time": "3:14:32", "throughput": 2333.83, "total_tokens": 11459656} {"current_steps": 19885, "total_steps": 67140, "loss": 0.6007, "lr": 4.43649343444601e-05, "epoch": 2.9617217753946976, "percentage": 29.62, "elapsed_time": "1:21:51", "remaining_time": "3:14:31", "throughput": 2333.86, "total_tokens": 11462440} {"current_steps": 19890, "total_steps": 67140, "loss": 0.6708, "lr": 4.436082346666189e-05, "epoch": 2.962466487935657, "percentage": 29.62, "elapsed_time": "1:21:52", "remaining_time": "3:14:29", "throughput": 2333.9, "total_tokens": 11465288} {"current_steps": 19895, "total_steps": 67140, "loss": 0.6956, "lr": 4.4356711280537954e-05, "epoch": 2.963211200476616, "percentage": 29.63, "elapsed_time": "1:21:53", "remaining_time": "3:14:28", "throughput": 2333.98, "total_tokens": 11468392} {"current_steps": 19900, "total_steps": 67140, "loss": 0.8374, "lr": 4.435259778636617e-05, "epoch": 2.963955913017575, "percentage": 29.64, "elapsed_time": "1:21:54", "remaining_time": "3:14:27", "throughput": 2334.03, "total_tokens": 11471272} {"current_steps": 19905, "total_steps": 67140, "loss": 0.5705, "lr": 4.43484829844245e-05, "epoch": 2.9647006255585344, "percentage": 29.65, "elapsed_time": "1:21:55", "remaining_time": "3:14:25", "throughput": 2334.09, "total_tokens": 11474216} {"current_steps": 19910, "total_steps": 67140, "loss": 0.5447, "lr": 4.434436687499102e-05, "epoch": 2.9654453380994936, "percentage": 29.65, "elapsed_time": "1:21:56", "remaining_time": "3:14:23", "throughput": 2334.1, "total_tokens": 11476776} {"current_steps": 19915, "total_steps": 67140, "loss": 0.6428, "lr": 4.434024945834387e-05, "epoch": 2.966190050640453, "percentage": 29.66, "elapsed_time": "1:21:58", "remaining_time": "3:14:22", "throughput": 2334.14, "total_tokens": 11479592} {"current_steps": 19920, "total_steps": 67140, "loss": 0.5973, "lr": 4.43361307347613e-05, "epoch": 2.966934763181412, "percentage": 29.67, "elapsed_time": "1:21:59", "remaining_time": "3:14:21", "throughput": 2334.21, "total_tokens": 11482632} {"current_steps": 19925, "total_steps": 67140, "loss": 0.6443, "lr": 4.433201070452163e-05, "epoch": 2.9676794757223712, "percentage": 29.68, "elapsed_time": "1:22:00", "remaining_time": "3:14:19", "throughput": 2334.28, "total_tokens": 11485736} {"current_steps": 19930, "total_steps": 67140, "loss": 0.6972, "lr": 4.432788936790327e-05, "epoch": 2.9684241882633304, "percentage": 29.68, "elapsed_time": "1:22:01", "remaining_time": "3:14:18", "throughput": 2334.31, "total_tokens": 11488456} {"current_steps": 19935, "total_steps": 67140, "loss": 0.7438, "lr": 4.432376672518473e-05, "epoch": 2.9691689008042896, "percentage": 29.69, "elapsed_time": "1:22:02", "remaining_time": "3:14:16", "throughput": 2334.38, "total_tokens": 11491528} {"current_steps": 19940, "total_steps": 67140, "loss": 0.7622, "lr": 4.43196427766446e-05, "epoch": 2.969913613345249, "percentage": 29.7, "elapsed_time": "1:22:03", "remaining_time": "3:14:15", "throughput": 2334.42, "total_tokens": 11494408} {"current_steps": 19945, "total_steps": 67140, "loss": 0.5537, "lr": 4.431551752256155e-05, "epoch": 2.970658325886208, "percentage": 29.71, "elapsed_time": "1:22:04", "remaining_time": "3:14:13", "throughput": 2334.45, "total_tokens": 11497128} {"current_steps": 19950, "total_steps": 67140, "loss": 0.5347, "lr": 4.4311390963214375e-05, "epoch": 2.9714030384271672, "percentage": 29.71, "elapsed_time": "1:22:06", "remaining_time": "3:14:12", "throughput": 2334.49, "total_tokens": 11499912} {"current_steps": 19955, "total_steps": 67140, "loss": 0.7375, "lr": 4.43072630988819e-05, "epoch": 2.9721477509681264, "percentage": 29.72, "elapsed_time": "1:22:07", "remaining_time": "3:14:10", "throughput": 2334.52, "total_tokens": 11502696} {"current_steps": 19960, "total_steps": 67140, "loss": 0.7807, "lr": 4.4303133929843086e-05, "epoch": 2.9728924635090856, "percentage": 29.73, "elapsed_time": "1:22:08", "remaining_time": "3:14:09", "throughput": 2334.56, "total_tokens": 11505512} {"current_steps": 19965, "total_steps": 67140, "loss": 0.6424, "lr": 4.4299003456376966e-05, "epoch": 2.973637176050045, "percentage": 29.74, "elapsed_time": "1:22:09", "remaining_time": "3:14:07", "throughput": 2334.63, "total_tokens": 11508616} {"current_steps": 19970, "total_steps": 67140, "loss": 0.8237, "lr": 4.429487167876265e-05, "epoch": 2.9743818885910036, "percentage": 29.74, "elapsed_time": "1:22:10", "remaining_time": "3:14:06", "throughput": 2334.66, "total_tokens": 11511368} {"current_steps": 19975, "total_steps": 67140, "loss": 0.5745, "lr": 4.429073859727936e-05, "epoch": 2.9751266011319633, "percentage": 29.75, "elapsed_time": "1:22:11", "remaining_time": "3:14:05", "throughput": 2334.74, "total_tokens": 11514504} {"current_steps": 19980, "total_steps": 67140, "loss": 0.6397, "lr": 4.428660421220638e-05, "epoch": 2.975871313672922, "percentage": 29.76, "elapsed_time": "1:22:12", "remaining_time": "3:14:03", "throughput": 2334.77, "total_tokens": 11517320} {"current_steps": 19985, "total_steps": 67140, "loss": 0.6882, "lr": 4.42824685238231e-05, "epoch": 2.9766160262138817, "percentage": 29.77, "elapsed_time": "1:22:14", "remaining_time": "3:14:02", "throughput": 2334.83, "total_tokens": 11520296} {"current_steps": 19990, "total_steps": 67140, "loss": 0.6924, "lr": 4.4278331532409e-05, "epoch": 2.9773607387548404, "percentage": 29.77, "elapsed_time": "1:22:15", "remaining_time": "3:14:00", "throughput": 2334.88, "total_tokens": 11523208} {"current_steps": 19995, "total_steps": 67140, "loss": 0.6134, "lr": 4.427419323824363e-05, "epoch": 2.9781054512958, "percentage": 29.78, "elapsed_time": "1:22:16", "remaining_time": "3:13:59", "throughput": 2334.95, "total_tokens": 11526280} {"current_steps": 20000, "total_steps": 67140, "loss": 0.5648, "lr": 4.427005364160665e-05, "epoch": 2.978850163836759, "percentage": 29.79, "elapsed_time": "1:22:17", "remaining_time": "3:13:57", "throughput": 2334.96, "total_tokens": 11528840} {"current_steps": 20005, "total_steps": 67140, "loss": 0.6555, "lr": 4.426591274277778e-05, "epoch": 2.9795948763777185, "percentage": 29.8, "elapsed_time": "1:22:18", "remaining_time": "3:13:56", "throughput": 2334.99, "total_tokens": 11531624} {"current_steps": 20010, "total_steps": 67140, "loss": 0.7797, "lr": 4.426177054203686e-05, "epoch": 2.9803395889186772, "percentage": 29.8, "elapsed_time": "1:22:19", "remaining_time": "3:13:54", "throughput": 2335.04, "total_tokens": 11534504} {"current_steps": 20015, "total_steps": 67140, "loss": 0.747, "lr": 4.425762703966381e-05, "epoch": 2.9810843014596364, "percentage": 29.81, "elapsed_time": "1:22:20", "remaining_time": "3:13:53", "throughput": 2335.1, "total_tokens": 11537448} {"current_steps": 20020, "total_steps": 67140, "loss": 0.5733, "lr": 4.425348223593861e-05, "epoch": 2.9818290140005956, "percentage": 29.82, "elapsed_time": "1:22:22", "remaining_time": "3:13:51", "throughput": 2335.14, "total_tokens": 11540360} {"current_steps": 20025, "total_steps": 67140, "loss": 0.5518, "lr": 4.424933613114136e-05, "epoch": 2.982573726541555, "percentage": 29.83, "elapsed_time": "1:22:23", "remaining_time": "3:13:50", "throughput": 2335.2, "total_tokens": 11543304} {"current_steps": 20030, "total_steps": 67140, "loss": 0.4888, "lr": 4.424518872555224e-05, "epoch": 2.983318439082514, "percentage": 29.83, "elapsed_time": "1:22:24", "remaining_time": "3:13:48", "throughput": 2335.28, "total_tokens": 11546376} {"current_steps": 20035, "total_steps": 67140, "loss": 0.664, "lr": 4.424104001945151e-05, "epoch": 2.9840631516234732, "percentage": 29.84, "elapsed_time": "1:22:25", "remaining_time": "3:13:47", "throughput": 2335.32, "total_tokens": 11549224} {"current_steps": 20040, "total_steps": 67140, "loss": 0.5323, "lr": 4.4236890013119527e-05, "epoch": 2.9848078641644324, "percentage": 29.85, "elapsed_time": "1:22:26", "remaining_time": "3:13:45", "throughput": 2335.35, "total_tokens": 11552008} {"current_steps": 20045, "total_steps": 67140, "loss": 0.6559, "lr": 4.423273870683672e-05, "epoch": 2.9855525767053916, "percentage": 29.86, "elapsed_time": "1:22:27", "remaining_time": "3:13:44", "throughput": 2335.39, "total_tokens": 11554792} {"current_steps": 20050, "total_steps": 67140, "loss": 0.7565, "lr": 4.422858610088364e-05, "epoch": 2.986297289246351, "percentage": 29.86, "elapsed_time": "1:22:28", "remaining_time": "3:13:43", "throughput": 2335.44, "total_tokens": 11557736} {"current_steps": 20055, "total_steps": 67140, "loss": 0.5579, "lr": 4.422443219554088e-05, "epoch": 2.98704200178731, "percentage": 29.87, "elapsed_time": "1:22:29", "remaining_time": "3:13:41", "throughput": 2335.47, "total_tokens": 11560392} {"current_steps": 20060, "total_steps": 67140, "loss": 0.7114, "lr": 4.422027699108915e-05, "epoch": 2.9877867143282693, "percentage": 29.88, "elapsed_time": "1:22:31", "remaining_time": "3:13:40", "throughput": 2335.57, "total_tokens": 11563720} {"current_steps": 20065, "total_steps": 67140, "loss": 0.5326, "lr": 4.421612048780925e-05, "epoch": 2.9885314268692285, "percentage": 29.89, "elapsed_time": "1:22:32", "remaining_time": "3:13:38", "throughput": 2335.63, "total_tokens": 11566696} {"current_steps": 20070, "total_steps": 67140, "loss": 0.7154, "lr": 4.421196268598205e-05, "epoch": 2.9892761394101877, "percentage": 29.89, "elapsed_time": "1:22:33", "remaining_time": "3:13:37", "throughput": 2335.66, "total_tokens": 11569448} {"current_steps": 20075, "total_steps": 67140, "loss": 0.5672, "lr": 4.4207803585888524e-05, "epoch": 2.990020851951147, "percentage": 29.9, "elapsed_time": "1:22:34", "remaining_time": "3:13:35", "throughput": 2335.71, "total_tokens": 11572328} {"current_steps": 20080, "total_steps": 67140, "loss": 0.6141, "lr": 4.420364318780973e-05, "epoch": 2.990765564492106, "percentage": 29.91, "elapsed_time": "1:22:35", "remaining_time": "3:13:34", "throughput": 2335.76, "total_tokens": 11575304} {"current_steps": 20085, "total_steps": 67140, "loss": 0.5715, "lr": 4.419948149202679e-05, "epoch": 2.9915102770330653, "percentage": 29.92, "elapsed_time": "1:22:36", "remaining_time": "3:13:32", "throughput": 2335.77, "total_tokens": 11577960} {"current_steps": 20090, "total_steps": 67140, "loss": 0.7696, "lr": 4.419531849882097e-05, "epoch": 2.9922549895740245, "percentage": 29.92, "elapsed_time": "1:22:37", "remaining_time": "3:13:31", "throughput": 2335.8, "total_tokens": 11580680} {"current_steps": 20095, "total_steps": 67140, "loss": 0.5549, "lr": 4.419115420847356e-05, "epoch": 2.9929997021149837, "percentage": 29.93, "elapsed_time": "1:22:39", "remaining_time": "3:13:29", "throughput": 2335.83, "total_tokens": 11583464} {"current_steps": 20100, "total_steps": 67140, "loss": 0.5329, "lr": 4.418698862126597e-05, "epoch": 2.993744414655943, "percentage": 29.94, "elapsed_time": "1:22:40", "remaining_time": "3:13:28", "throughput": 2335.88, "total_tokens": 11586376} {"current_steps": 20105, "total_steps": 67140, "loss": 0.5955, "lr": 4.418282173747971e-05, "epoch": 2.994489127196902, "percentage": 29.94, "elapsed_time": "1:22:41", "remaining_time": "3:13:26", "throughput": 2335.96, "total_tokens": 11589480} {"current_steps": 20110, "total_steps": 67140, "loss": 0.7076, "lr": 4.4178653557396335e-05, "epoch": 2.9952338397378613, "percentage": 29.95, "elapsed_time": "1:22:42", "remaining_time": "3:13:25", "throughput": 2336.07, "total_tokens": 11592840} {"current_steps": 20115, "total_steps": 67140, "loss": 0.9499, "lr": 4.417448408129753e-05, "epoch": 2.9959785522788205, "percentage": 29.96, "elapsed_time": "1:22:43", "remaining_time": "3:13:24", "throughput": 2336.12, "total_tokens": 11595688} {"current_steps": 20120, "total_steps": 67140, "loss": 0.7651, "lr": 4.417031330946505e-05, "epoch": 2.9967232648197797, "percentage": 29.97, "elapsed_time": "1:22:44", "remaining_time": "3:13:22", "throughput": 2336.22, "total_tokens": 11598920} {"current_steps": 20125, "total_steps": 67140, "loss": 0.568, "lr": 4.4166141242180736e-05, "epoch": 2.997467977360739, "percentage": 29.97, "elapsed_time": "1:22:45", "remaining_time": "3:13:21", "throughput": 2336.25, "total_tokens": 11601672} {"current_steps": 20130, "total_steps": 67140, "loss": 0.6955, "lr": 4.4161967879726526e-05, "epoch": 2.998212689901698, "percentage": 29.98, "elapsed_time": "1:22:47", "remaining_time": "3:13:19", "throughput": 2336.31, "total_tokens": 11604680} {"current_steps": 20135, "total_steps": 67140, "loss": 0.6529, "lr": 4.415779322238443e-05, "epoch": 2.9989574024426573, "percentage": 29.99, "elapsed_time": "1:22:48", "remaining_time": "3:13:18", "throughput": 2336.37, "total_tokens": 11607688} {"current_steps": 20140, "total_steps": 67140, "loss": 0.6193, "lr": 4.4153617270436556e-05, "epoch": 2.9997021149836165, "percentage": 30.0, "elapsed_time": "1:22:49", "remaining_time": "3:13:16", "throughput": 2336.4, "total_tokens": 11610440} {"current_steps": 20142, "total_steps": 67140, "eval_loss": 0.6564539074897766, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "1:24:03", "remaining_time": "3:16:09", "throughput": 2301.97, "total_tokens": 11611120} {"current_steps": 20145, "total_steps": 67140, "loss": 0.5165, "lr": 4.414944002416511e-05, "epoch": 3.0004468275245757, "percentage": 30.0, "elapsed_time": "1:24:06", "remaining_time": "3:16:12", "throughput": 2301.26, "total_tokens": 11612848} {"current_steps": 20150, "total_steps": 67140, "loss": 0.6088, "lr": 4.414526148385235e-05, "epoch": 3.001191540065535, "percentage": 30.01, "elapsed_time": "1:24:07", "remaining_time": "3:16:10", "throughput": 2301.3, "total_tokens": 11615664} {"current_steps": 20155, "total_steps": 67140, "loss": 0.7137, "lr": 4.414108164978067e-05, "epoch": 3.001936252606494, "percentage": 30.02, "elapsed_time": "1:24:08", "remaining_time": "3:16:09", "throughput": 2301.35, "total_tokens": 11618480} {"current_steps": 20160, "total_steps": 67140, "loss": 0.7797, "lr": 4.4136900522232506e-05, "epoch": 3.002680965147453, "percentage": 30.03, "elapsed_time": "1:24:09", "remaining_time": "3:16:07", "throughput": 2301.38, "total_tokens": 11621168} {"current_steps": 20165, "total_steps": 67140, "loss": 0.7357, "lr": 4.413271810149041e-05, "epoch": 3.003425677688412, "percentage": 30.03, "elapsed_time": "1:24:10", "remaining_time": "3:16:06", "throughput": 2301.46, "total_tokens": 11624240} {"current_steps": 20170, "total_steps": 67140, "loss": 0.5393, "lr": 4.412853438783701e-05, "epoch": 3.0041703902293713, "percentage": 30.04, "elapsed_time": "1:24:11", "remaining_time": "3:16:04", "throughput": 2301.54, "total_tokens": 11627312} {"current_steps": 20175, "total_steps": 67140, "loss": 0.6779, "lr": 4.412434938155503e-05, "epoch": 3.0049151027703305, "percentage": 30.05, "elapsed_time": "1:24:13", "remaining_time": "3:16:03", "throughput": 2301.6, "total_tokens": 11630256} {"current_steps": 20180, "total_steps": 67140, "loss": 0.7829, "lr": 4.4120163082927274e-05, "epoch": 3.0056598153112897, "percentage": 30.06, "elapsed_time": "1:24:14", "remaining_time": "3:16:01", "throughput": 2301.62, "total_tokens": 11632880} {"current_steps": 20185, "total_steps": 67140, "loss": 0.7058, "lr": 4.411597549223663e-05, "epoch": 3.006404527852249, "percentage": 30.06, "elapsed_time": "1:24:15", "remaining_time": "3:15:59", "throughput": 2301.67, "total_tokens": 11635696} {"current_steps": 20190, "total_steps": 67140, "loss": 0.6478, "lr": 4.411178660976609e-05, "epoch": 3.007149240393208, "percentage": 30.07, "elapsed_time": "1:24:16", "remaining_time": "3:15:58", "throughput": 2301.73, "total_tokens": 11638576} {"current_steps": 20195, "total_steps": 67140, "loss": 0.6786, "lr": 4.410759643579871e-05, "epoch": 3.0078939529341673, "percentage": 30.08, "elapsed_time": "1:24:17", "remaining_time": "3:15:56", "throughput": 2301.83, "total_tokens": 11641840} {"current_steps": 20200, "total_steps": 67140, "loss": 0.7621, "lr": 4.410340497061764e-05, "epoch": 3.0086386654751265, "percentage": 30.09, "elapsed_time": "1:24:18", "remaining_time": "3:15:55", "throughput": 2301.84, "total_tokens": 11644432} {"current_steps": 20205, "total_steps": 67140, "loss": 0.5672, "lr": 4.4099212214506146e-05, "epoch": 3.0093833780160857, "percentage": 30.09, "elapsed_time": "1:24:19", "remaining_time": "3:15:53", "throughput": 2301.88, "total_tokens": 11647248} {"current_steps": 20210, "total_steps": 67140, "loss": 0.5889, "lr": 4.4095018167747536e-05, "epoch": 3.010128090557045, "percentage": 30.1, "elapsed_time": "1:24:21", "remaining_time": "3:15:52", "throughput": 2301.95, "total_tokens": 11650256} {"current_steps": 20215, "total_steps": 67140, "loss": 0.5863, "lr": 4.4090822830625236e-05, "epoch": 3.010872803098004, "percentage": 30.11, "elapsed_time": "1:24:22", "remaining_time": "3:15:50", "throughput": 2302.0, "total_tokens": 11653104} {"current_steps": 20220, "total_steps": 67140, "loss": 0.6282, "lr": 4.408662620342274e-05, "epoch": 3.0116175156389633, "percentage": 30.12, "elapsed_time": "1:24:23", "remaining_time": "3:15:49", "throughput": 2302.05, "total_tokens": 11655952} {"current_steps": 20225, "total_steps": 67140, "loss": 0.3887, "lr": 4.408242828642365e-05, "epoch": 3.0123622281799225, "percentage": 30.12, "elapsed_time": "1:24:24", "remaining_time": "3:15:47", "throughput": 2302.12, "total_tokens": 11658960} {"current_steps": 20230, "total_steps": 67140, "loss": 0.7563, "lr": 4.4078229079911636e-05, "epoch": 3.0131069407208817, "percentage": 30.13, "elapsed_time": "1:24:25", "remaining_time": "3:15:46", "throughput": 2302.17, "total_tokens": 11661840} {"current_steps": 20235, "total_steps": 67140, "loss": 0.6348, "lr": 4.407402858417047e-05, "epoch": 3.013851653261841, "percentage": 30.14, "elapsed_time": "1:24:26", "remaining_time": "3:15:44", "throughput": 2302.24, "total_tokens": 11664848} {"current_steps": 20240, "total_steps": 67140, "loss": 0.6483, "lr": 4.4069826799484e-05, "epoch": 3.0145963658028, "percentage": 30.15, "elapsed_time": "1:24:27", "remaining_time": "3:15:43", "throughput": 2302.27, "total_tokens": 11667632} {"current_steps": 20245, "total_steps": 67140, "loss": 0.5859, "lr": 4.406562372613617e-05, "epoch": 3.0153410783437593, "percentage": 30.15, "elapsed_time": "1:24:29", "remaining_time": "3:15:41", "throughput": 2302.33, "total_tokens": 11670544} {"current_steps": 20250, "total_steps": 67140, "loss": 0.6997, "lr": 4.406141936441099e-05, "epoch": 3.0160857908847185, "percentage": 30.16, "elapsed_time": "1:24:30", "remaining_time": "3:15:40", "throughput": 2302.37, "total_tokens": 11673392} {"current_steps": 20255, "total_steps": 67140, "loss": 0.6209, "lr": 4.40572137145926e-05, "epoch": 3.0168305034256777, "percentage": 30.17, "elapsed_time": "1:24:31", "remaining_time": "3:15:38", "throughput": 2302.45, "total_tokens": 11676464} {"current_steps": 20260, "total_steps": 67140, "loss": 0.5279, "lr": 4.405300677696519e-05, "epoch": 3.017575215966637, "percentage": 30.18, "elapsed_time": "1:24:32", "remaining_time": "3:15:37", "throughput": 2302.49, "total_tokens": 11679248} {"current_steps": 20265, "total_steps": 67140, "loss": 0.6477, "lr": 4.4048798551813056e-05, "epoch": 3.018319928507596, "percentage": 30.18, "elapsed_time": "1:24:33", "remaining_time": "3:15:35", "throughput": 2302.53, "total_tokens": 11682032} {"current_steps": 20270, "total_steps": 67140, "loss": 0.443, "lr": 4.4044589039420546e-05, "epoch": 3.0190646410485553, "percentage": 30.19, "elapsed_time": "1:24:34", "remaining_time": "3:15:34", "throughput": 2302.56, "total_tokens": 11684752} {"current_steps": 20275, "total_steps": 67140, "loss": 0.5204, "lr": 4.404037824007214e-05, "epoch": 3.0198093535895145, "percentage": 30.2, "elapsed_time": "1:24:35", "remaining_time": "3:15:32", "throughput": 2302.6, "total_tokens": 11687536} {"current_steps": 20280, "total_steps": 67140, "loss": 0.754, "lr": 4.4036166154052387e-05, "epoch": 3.0205540661304737, "percentage": 30.21, "elapsed_time": "1:24:36", "remaining_time": "3:15:31", "throughput": 2302.7, "total_tokens": 11690736} {"current_steps": 20285, "total_steps": 67140, "loss": 0.7208, "lr": 4.4031952781645924e-05, "epoch": 3.021298778671433, "percentage": 30.21, "elapsed_time": "1:24:38", "remaining_time": "3:15:29", "throughput": 2302.79, "total_tokens": 11693904} {"current_steps": 20290, "total_steps": 67140, "loss": 0.453, "lr": 4.4027738123137465e-05, "epoch": 3.022043491212392, "percentage": 30.22, "elapsed_time": "1:24:39", "remaining_time": "3:15:28", "throughput": 2302.86, "total_tokens": 11696912} {"current_steps": 20295, "total_steps": 67140, "loss": 0.5804, "lr": 4.402352217881183e-05, "epoch": 3.0227882037533513, "percentage": 30.23, "elapsed_time": "1:24:40", "remaining_time": "3:15:26", "throughput": 2302.93, "total_tokens": 11699920} {"current_steps": 20300, "total_steps": 67140, "loss": 0.6071, "lr": 4.4019304948953906e-05, "epoch": 3.0235329162943105, "percentage": 30.24, "elapsed_time": "1:24:41", "remaining_time": "3:15:25", "throughput": 2303.01, "total_tokens": 11702960} {"current_steps": 20305, "total_steps": 67140, "loss": 0.4365, "lr": 4.401508643384868e-05, "epoch": 3.0242776288352697, "percentage": 30.24, "elapsed_time": "1:24:42", "remaining_time": "3:15:23", "throughput": 2303.09, "total_tokens": 11706000} {"current_steps": 20310, "total_steps": 67140, "loss": 0.4829, "lr": 4.4010866633781225e-05, "epoch": 3.025022341376229, "percentage": 30.25, "elapsed_time": "1:24:43", "remaining_time": "3:15:22", "throughput": 2303.14, "total_tokens": 11708880} {"current_steps": 20315, "total_steps": 67140, "loss": 0.5543, "lr": 4.4006645549036697e-05, "epoch": 3.025767053917188, "percentage": 30.26, "elapsed_time": "1:24:45", "remaining_time": "3:15:21", "throughput": 2303.27, "total_tokens": 11712560} {"current_steps": 20320, "total_steps": 67140, "loss": 0.6742, "lr": 4.400242317990033e-05, "epoch": 3.0265117664581473, "percentage": 30.27, "elapsed_time": "1:24:46", "remaining_time": "3:15:19", "throughput": 2303.37, "total_tokens": 11715856} {"current_steps": 20325, "total_steps": 67140, "loss": 0.6104, "lr": 4.399819952665747e-05, "epoch": 3.0272564789991065, "percentage": 30.27, "elapsed_time": "1:24:47", "remaining_time": "3:15:18", "throughput": 2303.44, "total_tokens": 11718832} {"current_steps": 20330, "total_steps": 67140, "loss": 0.7787, "lr": 4.399397458959353e-05, "epoch": 3.0280011915400658, "percentage": 30.28, "elapsed_time": "1:24:48", "remaining_time": "3:15:16", "throughput": 2303.46, "total_tokens": 11721456} {"current_steps": 20335, "total_steps": 67140, "loss": 0.5266, "lr": 4.398974836899401e-05, "epoch": 3.0287459040810245, "percentage": 30.29, "elapsed_time": "1:24:49", "remaining_time": "3:15:15", "throughput": 2303.48, "total_tokens": 11724144} {"current_steps": 20340, "total_steps": 67140, "loss": 0.8965, "lr": 4.398552086514449e-05, "epoch": 3.0294906166219837, "percentage": 30.29, "elapsed_time": "1:24:50", "remaining_time": "3:15:13", "throughput": 2303.52, "total_tokens": 11726928} {"current_steps": 20345, "total_steps": 67140, "loss": 0.5926, "lr": 4.398129207833067e-05, "epoch": 3.030235329162943, "percentage": 30.3, "elapsed_time": "1:24:51", "remaining_time": "3:15:11", "throughput": 2303.55, "total_tokens": 11729648} {"current_steps": 20350, "total_steps": 67140, "loss": 0.6682, "lr": 4.3977062008838307e-05, "epoch": 3.030980041703902, "percentage": 30.31, "elapsed_time": "1:24:53", "remaining_time": "3:15:10", "throughput": 2303.58, "total_tokens": 11732336} {"current_steps": 20355, "total_steps": 67140, "loss": 0.6109, "lr": 4.397283065695325e-05, "epoch": 3.0317247542448613, "percentage": 30.32, "elapsed_time": "1:24:54", "remaining_time": "3:15:08", "throughput": 2303.63, "total_tokens": 11735280} {"current_steps": 20360, "total_steps": 67140, "loss": 0.6259, "lr": 4.396859802296142e-05, "epoch": 3.0324694667858205, "percentage": 30.32, "elapsed_time": "1:24:55", "remaining_time": "3:15:07", "throughput": 2303.68, "total_tokens": 11738192} {"current_steps": 20365, "total_steps": 67140, "loss": 0.9053, "lr": 4.396436410714887e-05, "epoch": 3.0332141793267797, "percentage": 30.33, "elapsed_time": "1:24:56", "remaining_time": "3:15:05", "throughput": 2303.75, "total_tokens": 11741232} {"current_steps": 20370, "total_steps": 67140, "loss": 0.8447, "lr": 4.396012890980169e-05, "epoch": 3.033958891867739, "percentage": 30.34, "elapsed_time": "1:24:57", "remaining_time": "3:15:04", "throughput": 2303.86, "total_tokens": 11744592} {"current_steps": 20375, "total_steps": 67140, "loss": 0.7441, "lr": 4.3955892431206085e-05, "epoch": 3.034703604408698, "percentage": 30.35, "elapsed_time": "1:24:58", "remaining_time": "3:15:03", "throughput": 2303.9, "total_tokens": 11747344} {"current_steps": 20380, "total_steps": 67140, "loss": 0.5991, "lr": 4.395165467164834e-05, "epoch": 3.0354483169496573, "percentage": 30.35, "elapsed_time": "1:25:00", "remaining_time": "3:15:01", "throughput": 2303.93, "total_tokens": 11750064} {"current_steps": 20385, "total_steps": 67140, "loss": 0.6762, "lr": 4.394741563141482e-05, "epoch": 3.0361930294906165, "percentage": 30.36, "elapsed_time": "1:25:01", "remaining_time": "3:15:00", "throughput": 2304.01, "total_tokens": 11753104} {"current_steps": 20390, "total_steps": 67140, "loss": 0.5063, "lr": 4.3943175310791995e-05, "epoch": 3.0369377420315757, "percentage": 30.37, "elapsed_time": "1:25:02", "remaining_time": "3:14:58", "throughput": 2304.04, "total_tokens": 11755792} {"current_steps": 20395, "total_steps": 67140, "loss": 0.7055, "lr": 4.3938933710066396e-05, "epoch": 3.037682454572535, "percentage": 30.38, "elapsed_time": "1:25:03", "remaining_time": "3:14:56", "throughput": 2304.1, "total_tokens": 11758768} {"current_steps": 20400, "total_steps": 67140, "loss": 0.6931, "lr": 4.393469082952466e-05, "epoch": 3.038427167113494, "percentage": 30.38, "elapsed_time": "1:25:04", "remaining_time": "3:14:55", "throughput": 2304.15, "total_tokens": 11761648} {"current_steps": 20405, "total_steps": 67140, "loss": 0.6137, "lr": 4.3930446669453494e-05, "epoch": 3.0391718796544533, "percentage": 30.39, "elapsed_time": "1:25:05", "remaining_time": "3:14:53", "throughput": 2304.21, "total_tokens": 11764656} {"current_steps": 20410, "total_steps": 67140, "loss": 0.5095, "lr": 4.392620123013971e-05, "epoch": 3.0399165921954125, "percentage": 30.4, "elapsed_time": "1:25:06", "remaining_time": "3:14:52", "throughput": 2304.25, "total_tokens": 11767440} {"current_steps": 20415, "total_steps": 67140, "loss": 0.7222, "lr": 4.3921954511870194e-05, "epoch": 3.0406613047363718, "percentage": 30.41, "elapsed_time": "1:25:08", "remaining_time": "3:14:51", "throughput": 2304.35, "total_tokens": 11770704} {"current_steps": 20420, "total_steps": 67140, "loss": 0.6066, "lr": 4.3917706514931926e-05, "epoch": 3.041406017277331, "percentage": 30.41, "elapsed_time": "1:25:09", "remaining_time": "3:14:49", "throughput": 2304.4, "total_tokens": 11773552} {"current_steps": 20425, "total_steps": 67140, "loss": 0.5749, "lr": 4.391345723961197e-05, "epoch": 3.04215072981829, "percentage": 30.42, "elapsed_time": "1:25:10", "remaining_time": "3:14:48", "throughput": 2304.44, "total_tokens": 11776400} {"current_steps": 20430, "total_steps": 67140, "loss": 0.6029, "lr": 4.3909206686197456e-05, "epoch": 3.0428954423592494, "percentage": 30.43, "elapsed_time": "1:25:11", "remaining_time": "3:14:46", "throughput": 2304.49, "total_tokens": 11779280} {"current_steps": 20435, "total_steps": 67140, "loss": 0.6881, "lr": 4.3904954854975644e-05, "epoch": 3.0436401549002086, "percentage": 30.44, "elapsed_time": "1:25:12", "remaining_time": "3:14:45", "throughput": 2304.58, "total_tokens": 11782416} {"current_steps": 20440, "total_steps": 67140, "loss": 0.6163, "lr": 4.390070174623384e-05, "epoch": 3.0443848674411678, "percentage": 30.44, "elapsed_time": "1:25:13", "remaining_time": "3:14:43", "throughput": 2304.63, "total_tokens": 11785296} {"current_steps": 20445, "total_steps": 67140, "loss": 0.6047, "lr": 4.389644736025946e-05, "epoch": 3.045129579982127, "percentage": 30.45, "elapsed_time": "1:25:14", "remaining_time": "3:14:41", "throughput": 2304.66, "total_tokens": 11788016} {"current_steps": 20450, "total_steps": 67140, "loss": 0.6519, "lr": 4.389219169734e-05, "epoch": 3.045874292523086, "percentage": 30.46, "elapsed_time": "1:25:15", "remaining_time": "3:14:40", "throughput": 2304.71, "total_tokens": 11790832} {"current_steps": 20455, "total_steps": 67140, "loss": 0.5167, "lr": 4.388793475776303e-05, "epoch": 3.0466190050640454, "percentage": 30.47, "elapsed_time": "1:25:17", "remaining_time": "3:14:38", "throughput": 2304.77, "total_tokens": 11793776} {"current_steps": 20460, "total_steps": 67140, "loss": 0.5263, "lr": 4.388367654181622e-05, "epoch": 3.0473637176050046, "percentage": 30.47, "elapsed_time": "1:25:18", "remaining_time": "3:14:37", "throughput": 2304.83, "total_tokens": 11796720} {"current_steps": 20465, "total_steps": 67140, "loss": 0.6554, "lr": 4.387941704978733e-05, "epoch": 3.0481084301459638, "percentage": 30.48, "elapsed_time": "1:25:19", "remaining_time": "3:14:36", "throughput": 2304.99, "total_tokens": 11800528} {"current_steps": 20470, "total_steps": 67140, "loss": 0.7112, "lr": 4.3875156281964186e-05, "epoch": 3.048853142686923, "percentage": 30.49, "elapsed_time": "1:25:20", "remaining_time": "3:14:34", "throughput": 2305.01, "total_tokens": 11803184} {"current_steps": 20475, "total_steps": 67140, "loss": 0.5613, "lr": 4.3870894238634725e-05, "epoch": 3.049597855227882, "percentage": 30.5, "elapsed_time": "1:25:21", "remaining_time": "3:14:33", "throughput": 2305.01, "total_tokens": 11805680} {"current_steps": 20480, "total_steps": 67140, "loss": 0.6749, "lr": 4.386663092008696e-05, "epoch": 3.0503425677688414, "percentage": 30.5, "elapsed_time": "1:25:22", "remaining_time": "3:14:31", "throughput": 2305.04, "total_tokens": 11808400} {"current_steps": 20485, "total_steps": 67140, "loss": 0.6949, "lr": 4.3862366326608975e-05, "epoch": 3.0510872803098006, "percentage": 30.51, "elapsed_time": "1:25:24", "remaining_time": "3:14:30", "throughput": 2305.11, "total_tokens": 11811376} {"current_steps": 20490, "total_steps": 67140, "loss": 0.7168, "lr": 4.385810045848896e-05, "epoch": 3.05183199285076, "percentage": 30.52, "elapsed_time": "1:25:25", "remaining_time": "3:14:28", "throughput": 2305.14, "total_tokens": 11814096} {"current_steps": 20495, "total_steps": 67140, "loss": 0.7053, "lr": 4.38538333160152e-05, "epoch": 3.052576705391719, "percentage": 30.53, "elapsed_time": "1:25:26", "remaining_time": "3:14:26", "throughput": 2305.17, "total_tokens": 11816848} {"current_steps": 20500, "total_steps": 67140, "loss": 0.6177, "lr": 4.3849564899476026e-05, "epoch": 3.053321417932678, "percentage": 30.53, "elapsed_time": "1:25:27", "remaining_time": "3:14:25", "throughput": 2305.2, "total_tokens": 11819568} {"current_steps": 20505, "total_steps": 67140, "loss": 0.6202, "lr": 4.38452952091599e-05, "epoch": 3.054066130473637, "percentage": 30.54, "elapsed_time": "1:25:28", "remaining_time": "3:14:23", "throughput": 2305.29, "total_tokens": 11822768} {"current_steps": 20510, "total_steps": 67140, "loss": 0.576, "lr": 4.3841024245355346e-05, "epoch": 3.054810843014596, "percentage": 30.55, "elapsed_time": "1:25:29", "remaining_time": "3:14:22", "throughput": 2305.36, "total_tokens": 11825808} {"current_steps": 20515, "total_steps": 67140, "loss": 0.6069, "lr": 4.383675200835097e-05, "epoch": 3.0555555555555554, "percentage": 30.56, "elapsed_time": "1:25:30", "remaining_time": "3:14:21", "throughput": 2305.41, "total_tokens": 11828720} {"current_steps": 20520, "total_steps": 67140, "loss": 0.5711, "lr": 4.383247849843548e-05, "epoch": 3.0563002680965146, "percentage": 30.56, "elapsed_time": "1:25:31", "remaining_time": "3:14:19", "throughput": 2305.46, "total_tokens": 11831568} {"current_steps": 20525, "total_steps": 67140, "loss": 0.6874, "lr": 4.382820371589766e-05, "epoch": 3.0570449806374738, "percentage": 30.57, "elapsed_time": "1:25:33", "remaining_time": "3:14:17", "throughput": 2305.48, "total_tokens": 11834192} {"current_steps": 20530, "total_steps": 67140, "loss": 0.5172, "lr": 4.382392766102638e-05, "epoch": 3.057789693178433, "percentage": 30.58, "elapsed_time": "1:25:34", "remaining_time": "3:14:16", "throughput": 2305.52, "total_tokens": 11837040} {"current_steps": 20535, "total_steps": 67140, "loss": 0.6526, "lr": 4.381965033411061e-05, "epoch": 3.058534405719392, "percentage": 30.59, "elapsed_time": "1:25:35", "remaining_time": "3:14:14", "throughput": 2305.57, "total_tokens": 11839888} {"current_steps": 20540, "total_steps": 67140, "loss": 0.5817, "lr": 4.381537173543937e-05, "epoch": 3.0592791182603514, "percentage": 30.59, "elapsed_time": "1:25:36", "remaining_time": "3:14:13", "throughput": 2305.66, "total_tokens": 11843024} {"current_steps": 20545, "total_steps": 67140, "loss": 0.8025, "lr": 4.381109186530182e-05, "epoch": 3.0600238308013106, "percentage": 30.6, "elapsed_time": "1:25:37", "remaining_time": "3:14:11", "throughput": 2305.68, "total_tokens": 11845744} {"current_steps": 20550, "total_steps": 67140, "loss": 0.6478, "lr": 4.380681072398716e-05, "epoch": 3.0607685433422698, "percentage": 30.61, "elapsed_time": "1:25:38", "remaining_time": "3:14:10", "throughput": 2305.71, "total_tokens": 11848432} {"current_steps": 20555, "total_steps": 67140, "loss": 0.5359, "lr": 4.3802528311784686e-05, "epoch": 3.061513255883229, "percentage": 30.62, "elapsed_time": "1:25:39", "remaining_time": "3:14:08", "throughput": 2305.81, "total_tokens": 11851728} {"current_steps": 20560, "total_steps": 67140, "loss": 0.5075, "lr": 4.37982446289838e-05, "epoch": 3.062257968424188, "percentage": 30.62, "elapsed_time": "1:25:41", "remaining_time": "3:14:07", "throughput": 2305.85, "total_tokens": 11854544} {"current_steps": 20565, "total_steps": 67140, "loss": 0.6533, "lr": 4.379395967587398e-05, "epoch": 3.0630026809651474, "percentage": 30.63, "elapsed_time": "1:25:42", "remaining_time": "3:14:06", "throughput": 2305.96, "total_tokens": 11857840} {"current_steps": 20570, "total_steps": 67140, "loss": 0.7568, "lr": 4.378967345274476e-05, "epoch": 3.0637473935061066, "percentage": 30.64, "elapsed_time": "1:25:43", "remaining_time": "3:14:04", "throughput": 2306.01, "total_tokens": 11860784} {"current_steps": 20575, "total_steps": 67140, "loss": 0.616, "lr": 4.3785385959885805e-05, "epoch": 3.064492106047066, "percentage": 30.64, "elapsed_time": "1:25:44", "remaining_time": "3:14:03", "throughput": 2306.09, "total_tokens": 11863824} {"current_steps": 20580, "total_steps": 67140, "loss": 0.7681, "lr": 4.3781097197586845e-05, "epoch": 3.065236818588025, "percentage": 30.65, "elapsed_time": "1:25:45", "remaining_time": "3:14:01", "throughput": 2306.09, "total_tokens": 11866352} {"current_steps": 20585, "total_steps": 67140, "loss": 0.5722, "lr": 4.377680716613769e-05, "epoch": 3.065981531128984, "percentage": 30.66, "elapsed_time": "1:25:46", "remaining_time": "3:13:59", "throughput": 2306.14, "total_tokens": 11869200} {"current_steps": 20590, "total_steps": 67140, "loss": 0.5786, "lr": 4.377251586582826e-05, "epoch": 3.0667262436699434, "percentage": 30.67, "elapsed_time": "1:25:47", "remaining_time": "3:13:58", "throughput": 2306.18, "total_tokens": 11871984} {"current_steps": 20595, "total_steps": 67140, "loss": 0.7502, "lr": 4.3768223296948516e-05, "epoch": 3.0674709562109026, "percentage": 30.67, "elapsed_time": "1:25:49", "remaining_time": "3:13:56", "throughput": 2306.24, "total_tokens": 11874928} {"current_steps": 20600, "total_steps": 67140, "loss": 0.573, "lr": 4.3763929459788554e-05, "epoch": 3.068215668751862, "percentage": 30.68, "elapsed_time": "1:25:50", "remaining_time": "3:13:55", "throughput": 2306.27, "total_tokens": 11877680} {"current_steps": 20605, "total_steps": 67140, "loss": 0.6874, "lr": 4.375963435463853e-05, "epoch": 3.068960381292821, "percentage": 30.69, "elapsed_time": "1:25:51", "remaining_time": "3:13:53", "throughput": 2306.3, "total_tokens": 11880336} {"current_steps": 20610, "total_steps": 67140, "loss": 0.6723, "lr": 4.375533798178869e-05, "epoch": 3.06970509383378, "percentage": 30.7, "elapsed_time": "1:25:52", "remaining_time": "3:13:52", "throughput": 2306.34, "total_tokens": 11883152} {"current_steps": 20615, "total_steps": 67140, "loss": 0.5061, "lr": 4.375104034152936e-05, "epoch": 3.0704498063747394, "percentage": 30.7, "elapsed_time": "1:25:53", "remaining_time": "3:13:50", "throughput": 2306.39, "total_tokens": 11886032} {"current_steps": 20620, "total_steps": 67140, "loss": 0.5146, "lr": 4.374674143415096e-05, "epoch": 3.0711945189156986, "percentage": 30.71, "elapsed_time": "1:25:54", "remaining_time": "3:13:49", "throughput": 2306.46, "total_tokens": 11889072} {"current_steps": 20625, "total_steps": 67140, "loss": 0.6195, "lr": 4.374244125994399e-05, "epoch": 3.071939231456658, "percentage": 30.72, "elapsed_time": "1:25:55", "remaining_time": "3:13:47", "throughput": 2306.57, "total_tokens": 11892336} {"current_steps": 20630, "total_steps": 67140, "loss": 0.7263, "lr": 4.3738139819199045e-05, "epoch": 3.072683943997617, "percentage": 30.73, "elapsed_time": "1:25:57", "remaining_time": "3:13:46", "throughput": 2306.64, "total_tokens": 11895408} {"current_steps": 20635, "total_steps": 67140, "loss": 0.6292, "lr": 4.3733837112206786e-05, "epoch": 3.073428656538576, "percentage": 30.73, "elapsed_time": "1:25:58", "remaining_time": "3:13:44", "throughput": 2306.71, "total_tokens": 11898448} {"current_steps": 20640, "total_steps": 67140, "loss": 0.7557, "lr": 4.372953313925798e-05, "epoch": 3.0741733690795354, "percentage": 30.74, "elapsed_time": "1:25:59", "remaining_time": "3:13:43", "throughput": 2306.78, "total_tokens": 11901424} {"current_steps": 20645, "total_steps": 67140, "loss": 0.6249, "lr": 4.3725227900643485e-05, "epoch": 3.0749180816204946, "percentage": 30.75, "elapsed_time": "1:26:00", "remaining_time": "3:13:42", "throughput": 2306.86, "total_tokens": 11904496} {"current_steps": 20650, "total_steps": 67140, "loss": 0.528, "lr": 4.372092139665422e-05, "epoch": 3.075662794161454, "percentage": 30.76, "elapsed_time": "1:26:01", "remaining_time": "3:13:40", "throughput": 2306.88, "total_tokens": 11907152} {"current_steps": 20655, "total_steps": 67140, "loss": 0.7451, "lr": 4.3716613627581195e-05, "epoch": 3.076407506702413, "percentage": 30.76, "elapsed_time": "1:26:02", "remaining_time": "3:13:38", "throughput": 2306.9, "total_tokens": 11909776} {"current_steps": 20660, "total_steps": 67140, "loss": 0.6245, "lr": 4.3712304593715516e-05, "epoch": 3.0771522192433722, "percentage": 30.77, "elapsed_time": "1:26:03", "remaining_time": "3:13:37", "throughput": 2306.95, "total_tokens": 11912624} {"current_steps": 20665, "total_steps": 67140, "loss": 0.7704, "lr": 4.3707994295348374e-05, "epoch": 3.0778969317843314, "percentage": 30.78, "elapsed_time": "1:26:04", "remaining_time": "3:13:35", "throughput": 2307.0, "total_tokens": 11915504} {"current_steps": 20670, "total_steps": 67140, "loss": 0.6113, "lr": 4.370368273277103e-05, "epoch": 3.0786416443252906, "percentage": 30.79, "elapsed_time": "1:26:06", "remaining_time": "3:13:34", "throughput": 2307.09, "total_tokens": 11918736} {"current_steps": 20675, "total_steps": 67140, "loss": 0.7572, "lr": 4.3699369906274864e-05, "epoch": 3.07938635686625, "percentage": 30.79, "elapsed_time": "1:26:07", "remaining_time": "3:13:32", "throughput": 2307.16, "total_tokens": 11921776} {"current_steps": 20680, "total_steps": 67140, "loss": 0.5653, "lr": 4.3695055816151296e-05, "epoch": 3.0801310694072086, "percentage": 30.8, "elapsed_time": "1:26:08", "remaining_time": "3:13:31", "throughput": 2307.23, "total_tokens": 11924784} {"current_steps": 20685, "total_steps": 67140, "loss": 0.8132, "lr": 4.369074046269187e-05, "epoch": 3.080875781948168, "percentage": 30.81, "elapsed_time": "1:26:09", "remaining_time": "3:13:29", "throughput": 2307.29, "total_tokens": 11927728} {"current_steps": 20690, "total_steps": 67140, "loss": 0.7135, "lr": 4.3686423846188196e-05, "epoch": 3.081620494489127, "percentage": 30.82, "elapsed_time": "1:26:10", "remaining_time": "3:13:28", "throughput": 2307.36, "total_tokens": 11930768} {"current_steps": 20695, "total_steps": 67140, "loss": 0.6018, "lr": 4.368210596693197e-05, "epoch": 3.082365207030086, "percentage": 30.82, "elapsed_time": "1:26:11", "remaining_time": "3:13:27", "throughput": 2307.42, "total_tokens": 11933744} {"current_steps": 20700, "total_steps": 67140, "loss": 0.7081, "lr": 4.367778682521498e-05, "epoch": 3.0831099195710454, "percentage": 30.83, "elapsed_time": "1:26:13", "remaining_time": "3:13:25", "throughput": 2307.47, "total_tokens": 11936560} {"current_steps": 20705, "total_steps": 67140, "loss": 0.6529, "lr": 4.367346642132909e-05, "epoch": 3.0838546321120046, "percentage": 30.84, "elapsed_time": "1:26:14", "remaining_time": "3:13:24", "throughput": 2307.56, "total_tokens": 11939760} {"current_steps": 20710, "total_steps": 67140, "loss": 0.6038, "lr": 4.366914475556626e-05, "epoch": 3.084599344652964, "percentage": 30.85, "elapsed_time": "1:26:15", "remaining_time": "3:13:22", "throughput": 2307.61, "total_tokens": 11942608} {"current_steps": 20715, "total_steps": 67140, "loss": 0.5943, "lr": 4.3664821828218536e-05, "epoch": 3.085344057193923, "percentage": 30.85, "elapsed_time": "1:26:16", "remaining_time": "3:13:21", "throughput": 2307.65, "total_tokens": 11945360} {"current_steps": 20720, "total_steps": 67140, "loss": 0.6459, "lr": 4.3660497639578036e-05, "epoch": 3.086088769734882, "percentage": 30.86, "elapsed_time": "1:26:17", "remaining_time": "3:13:19", "throughput": 2307.67, "total_tokens": 11948016} {"current_steps": 20725, "total_steps": 67140, "loss": 0.674, "lr": 4.3656172189936975e-05, "epoch": 3.0868334822758414, "percentage": 30.87, "elapsed_time": "1:26:18", "remaining_time": "3:13:18", "throughput": 2307.73, "total_tokens": 11951056} {"current_steps": 20730, "total_steps": 67140, "loss": 0.8094, "lr": 4.3651845479587647e-05, "epoch": 3.0875781948168006, "percentage": 30.88, "elapsed_time": "1:26:19", "remaining_time": "3:13:16", "throughput": 2307.79, "total_tokens": 11954000} {"current_steps": 20735, "total_steps": 67140, "loss": 0.605, "lr": 4.3647517508822434e-05, "epoch": 3.08832290735776, "percentage": 30.88, "elapsed_time": "1:26:20", "remaining_time": "3:13:14", "throughput": 2307.8, "total_tokens": 11956592} {"current_steps": 20740, "total_steps": 67140, "loss": 0.6449, "lr": 4.36431882779338e-05, "epoch": 3.089067619898719, "percentage": 30.89, "elapsed_time": "1:26:22", "remaining_time": "3:13:13", "throughput": 2307.84, "total_tokens": 11959376} {"current_steps": 20745, "total_steps": 67140, "loss": 0.6588, "lr": 4.3638857787214304e-05, "epoch": 3.0898123324396782, "percentage": 30.9, "elapsed_time": "1:26:23", "remaining_time": "3:13:11", "throughput": 2307.86, "total_tokens": 11962032} {"current_steps": 20750, "total_steps": 67140, "loss": 0.6372, "lr": 4.363452603695658e-05, "epoch": 3.0905570449806374, "percentage": 30.91, "elapsed_time": "1:26:24", "remaining_time": "3:13:10", "throughput": 2307.92, "total_tokens": 11965072} {"current_steps": 20755, "total_steps": 67140, "loss": 0.6245, "lr": 4.363019302745334e-05, "epoch": 3.0913017575215966, "percentage": 30.91, "elapsed_time": "1:26:25", "remaining_time": "3:13:09", "throughput": 2308.0, "total_tokens": 11968208} {"current_steps": 20760, "total_steps": 67140, "loss": 0.7172, "lr": 4.362585875899741e-05, "epoch": 3.092046470062556, "percentage": 30.92, "elapsed_time": "1:26:26", "remaining_time": "3:13:07", "throughput": 2308.05, "total_tokens": 11971088} {"current_steps": 20765, "total_steps": 67140, "loss": 0.6604, "lr": 4.3621523231881665e-05, "epoch": 3.092791182603515, "percentage": 30.93, "elapsed_time": "1:26:27", "remaining_time": "3:13:06", "throughput": 2308.12, "total_tokens": 11974128} {"current_steps": 20770, "total_steps": 67140, "loss": 0.6354, "lr": 4.36171864463991e-05, "epoch": 3.0935358951444742, "percentage": 30.94, "elapsed_time": "1:26:28", "remaining_time": "3:13:04", "throughput": 2308.17, "total_tokens": 11976976} {"current_steps": 20775, "total_steps": 67140, "loss": 0.5988, "lr": 4.361284840284275e-05, "epoch": 3.0942806076854334, "percentage": 30.94, "elapsed_time": "1:26:30", "remaining_time": "3:13:03", "throughput": 2308.2, "total_tokens": 11979728} {"current_steps": 20780, "total_steps": 67140, "loss": 0.8698, "lr": 4.36085091015058e-05, "epoch": 3.0950253202263927, "percentage": 30.95, "elapsed_time": "1:26:31", "remaining_time": "3:13:01", "throughput": 2308.26, "total_tokens": 11982672} {"current_steps": 20785, "total_steps": 67140, "loss": 0.5585, "lr": 4.3604168542681444e-05, "epoch": 3.095770032767352, "percentage": 30.96, "elapsed_time": "1:26:32", "remaining_time": "3:12:59", "throughput": 2308.29, "total_tokens": 11985360} {"current_steps": 20790, "total_steps": 67140, "loss": 0.6136, "lr": 4.3599826726663026e-05, "epoch": 3.096514745308311, "percentage": 30.97, "elapsed_time": "1:26:33", "remaining_time": "3:12:58", "throughput": 2308.33, "total_tokens": 11988208} {"current_steps": 20795, "total_steps": 67140, "loss": 0.7443, "lr": 4.359548365374394e-05, "epoch": 3.0972594578492703, "percentage": 30.97, "elapsed_time": "1:26:34", "remaining_time": "3:12:56", "throughput": 2308.38, "total_tokens": 11991120} {"current_steps": 20800, "total_steps": 67140, "loss": 0.6702, "lr": 4.3591139324217666e-05, "epoch": 3.0980041703902295, "percentage": 30.98, "elapsed_time": "1:26:35", "remaining_time": "3:12:55", "throughput": 2308.42, "total_tokens": 11993904} {"current_steps": 20805, "total_steps": 67140, "loss": 0.7111, "lr": 4.3586793738377785e-05, "epoch": 3.0987488829311887, "percentage": 30.99, "elapsed_time": "1:26:36", "remaining_time": "3:12:53", "throughput": 2308.48, "total_tokens": 11996848} {"current_steps": 20810, "total_steps": 67140, "loss": 0.7827, "lr": 4.358244689651795e-05, "epoch": 3.099493595472148, "percentage": 30.99, "elapsed_time": "1:26:37", "remaining_time": "3:12:52", "throughput": 2308.52, "total_tokens": 11999632} {"current_steps": 20815, "total_steps": 67140, "loss": 0.7555, "lr": 4.357809879893191e-05, "epoch": 3.100238308013107, "percentage": 31.0, "elapsed_time": "1:26:39", "remaining_time": "3:12:50", "throughput": 2308.53, "total_tokens": 12002224} {"current_steps": 20820, "total_steps": 67140, "loss": 0.5925, "lr": 4.357374944591348e-05, "epoch": 3.1009830205540663, "percentage": 31.01, "elapsed_time": "1:26:40", "remaining_time": "3:12:49", "throughput": 2308.58, "total_tokens": 12005072} {"current_steps": 20825, "total_steps": 67140, "loss": 0.7306, "lr": 4.3569398837756586e-05, "epoch": 3.1017277330950255, "percentage": 31.02, "elapsed_time": "1:26:41", "remaining_time": "3:12:47", "throughput": 2308.6, "total_tokens": 12007728} {"current_steps": 20830, "total_steps": 67140, "loss": 0.7715, "lr": 4.356504697475521e-05, "epoch": 3.1024724456359847, "percentage": 31.02, "elapsed_time": "1:26:42", "remaining_time": "3:12:46", "throughput": 2308.63, "total_tokens": 12010448} {"current_steps": 20835, "total_steps": 67140, "loss": 0.647, "lr": 4.356069385720344e-05, "epoch": 3.103217158176944, "percentage": 31.03, "elapsed_time": "1:26:43", "remaining_time": "3:12:44", "throughput": 2308.69, "total_tokens": 12013392} {"current_steps": 20840, "total_steps": 67140, "loss": 0.5705, "lr": 4.3556339485395444e-05, "epoch": 3.103961870717903, "percentage": 31.04, "elapsed_time": "1:26:44", "remaining_time": "3:12:43", "throughput": 2308.73, "total_tokens": 12016208} {"current_steps": 20845, "total_steps": 67140, "loss": 0.7651, "lr": 4.355198385962547e-05, "epoch": 3.1047065832588623, "percentage": 31.05, "elapsed_time": "1:26:45", "remaining_time": "3:12:41", "throughput": 2308.79, "total_tokens": 12019152} {"current_steps": 20850, "total_steps": 67140, "loss": 0.676, "lr": 4.354762698018785e-05, "epoch": 3.1054512957998215, "percentage": 31.05, "elapsed_time": "1:26:46", "remaining_time": "3:12:40", "throughput": 2308.83, "total_tokens": 12021936} {"current_steps": 20855, "total_steps": 67140, "loss": 0.6553, "lr": 4.3543268847377005e-05, "epoch": 3.1061960083407802, "percentage": 31.06, "elapsed_time": "1:26:48", "remaining_time": "3:12:38", "throughput": 2308.9, "total_tokens": 12024944} {"current_steps": 20860, "total_steps": 67140, "loss": 0.5602, "lr": 4.353890946148745e-05, "epoch": 3.1069407208817394, "percentage": 31.07, "elapsed_time": "1:26:49", "remaining_time": "3:12:37", "throughput": 2308.93, "total_tokens": 12027696} {"current_steps": 20865, "total_steps": 67140, "loss": 0.6932, "lr": 4.353454882281377e-05, "epoch": 3.1076854334226987, "percentage": 31.08, "elapsed_time": "1:26:50", "remaining_time": "3:12:35", "throughput": 2309.01, "total_tokens": 12030832} {"current_steps": 20870, "total_steps": 67140, "loss": 0.585, "lr": 4.353018693165063e-05, "epoch": 3.108430145963658, "percentage": 31.08, "elapsed_time": "1:26:51", "remaining_time": "3:12:34", "throughput": 2309.04, "total_tokens": 12033552} {"current_steps": 20875, "total_steps": 67140, "loss": 0.626, "lr": 4.35258237882928e-05, "epoch": 3.109174858504617, "percentage": 31.09, "elapsed_time": "1:26:52", "remaining_time": "3:12:32", "throughput": 2309.04, "total_tokens": 12036080} {"current_steps": 20880, "total_steps": 67140, "loss": 0.7564, "lr": 4.352145939303511e-05, "epoch": 3.1099195710455763, "percentage": 31.1, "elapsed_time": "1:26:53", "remaining_time": "3:12:31", "throughput": 2309.09, "total_tokens": 12038960} {"current_steps": 20885, "total_steps": 67140, "loss": 0.7341, "lr": 4.35170937461725e-05, "epoch": 3.1106642835865355, "percentage": 31.11, "elapsed_time": "1:26:54", "remaining_time": "3:12:29", "throughput": 2309.16, "total_tokens": 12042032} {"current_steps": 20890, "total_steps": 67140, "loss": 0.3906, "lr": 4.3512726847999987e-05, "epoch": 3.1114089961274947, "percentage": 31.11, "elapsed_time": "1:26:55", "remaining_time": "3:12:28", "throughput": 2309.18, "total_tokens": 12044688} {"current_steps": 20895, "total_steps": 67140, "loss": 0.5772, "lr": 4.3508358698812654e-05, "epoch": 3.112153708668454, "percentage": 31.12, "elapsed_time": "1:26:57", "remaining_time": "3:12:26", "throughput": 2309.2, "total_tokens": 12047344} {"current_steps": 20900, "total_steps": 67140, "loss": 0.6542, "lr": 4.350398929890569e-05, "epoch": 3.112898421209413, "percentage": 31.13, "elapsed_time": "1:26:58", "remaining_time": "3:12:25", "throughput": 2309.26, "total_tokens": 12050256} {"current_steps": 20905, "total_steps": 67140, "loss": 0.7147, "lr": 4.349961864857436e-05, "epoch": 3.1136431337503723, "percentage": 31.14, "elapsed_time": "1:26:59", "remaining_time": "3:12:23", "throughput": 2309.29, "total_tokens": 12053040} {"current_steps": 20910, "total_steps": 67140, "loss": 0.6841, "lr": 4.349524674811403e-05, "epoch": 3.1143878462913315, "percentage": 31.14, "elapsed_time": "1:27:00", "remaining_time": "3:12:22", "throughput": 2309.34, "total_tokens": 12055920} {"current_steps": 20915, "total_steps": 67140, "loss": 0.5664, "lr": 4.3490873597820106e-05, "epoch": 3.1151325588322907, "percentage": 31.15, "elapsed_time": "1:27:01", "remaining_time": "3:12:20", "throughput": 2309.44, "total_tokens": 12059216} {"current_steps": 20920, "total_steps": 67140, "loss": 0.6631, "lr": 4.3486499197988126e-05, "epoch": 3.11587727137325, "percentage": 31.16, "elapsed_time": "1:27:02", "remaining_time": "3:12:19", "throughput": 2309.5, "total_tokens": 12062160} {"current_steps": 20925, "total_steps": 67140, "loss": 0.6796, "lr": 4.348212354891369e-05, "epoch": 3.116621983914209, "percentage": 31.17, "elapsed_time": "1:27:03", "remaining_time": "3:12:17", "throughput": 2309.55, "total_tokens": 12065040} {"current_steps": 20930, "total_steps": 67140, "loss": 0.4925, "lr": 4.347774665089248e-05, "epoch": 3.1173666964551683, "percentage": 31.17, "elapsed_time": "1:27:05", "remaining_time": "3:12:16", "throughput": 2309.63, "total_tokens": 12068176} {"current_steps": 20935, "total_steps": 67140, "loss": 0.589, "lr": 4.347336850422029e-05, "epoch": 3.1181114089961275, "percentage": 31.18, "elapsed_time": "1:27:06", "remaining_time": "3:12:14", "throughput": 2309.66, "total_tokens": 12070928} {"current_steps": 20940, "total_steps": 67140, "loss": 0.6078, "lr": 4.346898910919296e-05, "epoch": 3.1188561215370867, "percentage": 31.19, "elapsed_time": "1:27:07", "remaining_time": "3:12:13", "throughput": 2309.71, "total_tokens": 12073776} {"current_steps": 20945, "total_steps": 67140, "loss": 0.728, "lr": 4.346460846610643e-05, "epoch": 3.119600834078046, "percentage": 31.2, "elapsed_time": "1:27:08", "remaining_time": "3:12:11", "throughput": 2309.75, "total_tokens": 12076624} {"current_steps": 20950, "total_steps": 67140, "loss": 0.641, "lr": 4.346022657525673e-05, "epoch": 3.120345546619005, "percentage": 31.2, "elapsed_time": "1:27:09", "remaining_time": "3:12:10", "throughput": 2309.83, "total_tokens": 12079728} {"current_steps": 20955, "total_steps": 67140, "loss": 0.5199, "lr": 4.345584343693998e-05, "epoch": 3.1210902591599643, "percentage": 31.21, "elapsed_time": "1:27:10", "remaining_time": "3:12:08", "throughput": 2309.88, "total_tokens": 12082672} {"current_steps": 20960, "total_steps": 67140, "loss": 0.6488, "lr": 4.345145905145237e-05, "epoch": 3.1218349717009235, "percentage": 31.22, "elapsed_time": "1:27:12", "remaining_time": "3:12:07", "throughput": 2309.94, "total_tokens": 12085680} {"current_steps": 20965, "total_steps": 67140, "loss": 0.6839, "lr": 4.344707341909017e-05, "epoch": 3.1225796842418827, "percentage": 31.23, "elapsed_time": "1:27:13", "remaining_time": "3:12:05", "throughput": 2309.98, "total_tokens": 12088432} {"current_steps": 20970, "total_steps": 67140, "loss": 0.76, "lr": 4.3442686540149744e-05, "epoch": 3.123324396782842, "percentage": 31.23, "elapsed_time": "1:27:14", "remaining_time": "3:12:04", "throughput": 2310.07, "total_tokens": 12091600} {"current_steps": 20975, "total_steps": 67140, "loss": 0.7111, "lr": 4.343829841492755e-05, "epoch": 3.124069109323801, "percentage": 31.24, "elapsed_time": "1:27:15", "remaining_time": "3:12:02", "throughput": 2310.12, "total_tokens": 12094416} {"current_steps": 20980, "total_steps": 67140, "loss": 0.5199, "lr": 4.343390904372011e-05, "epoch": 3.1248138218647603, "percentage": 31.25, "elapsed_time": "1:27:16", "remaining_time": "3:12:01", "throughput": 2310.19, "total_tokens": 12097488} {"current_steps": 20985, "total_steps": 67140, "loss": 0.5717, "lr": 4.3429518426824047e-05, "epoch": 3.1255585344057195, "percentage": 31.26, "elapsed_time": "1:27:17", "remaining_time": "3:12:00", "throughput": 2310.27, "total_tokens": 12100560} {"current_steps": 20990, "total_steps": 67140, "loss": 0.4965, "lr": 4.342512656453606e-05, "epoch": 3.1263032469466787, "percentage": 31.26, "elapsed_time": "1:27:18", "remaining_time": "3:11:58", "throughput": 2310.29, "total_tokens": 12103248} {"current_steps": 20995, "total_steps": 67140, "loss": 0.545, "lr": 4.342073345715292e-05, "epoch": 3.127047959487638, "percentage": 31.27, "elapsed_time": "1:27:19", "remaining_time": "3:11:56", "throughput": 2310.3, "total_tokens": 12105776} {"current_steps": 21000, "total_steps": 67140, "loss": 0.8327, "lr": 4.341633910497151e-05, "epoch": 3.127792672028597, "percentage": 31.28, "elapsed_time": "1:27:21", "remaining_time": "3:11:55", "throughput": 2310.35, "total_tokens": 12108656} {"current_steps": 21005, "total_steps": 67140, "loss": 0.8018, "lr": 4.3411943508288786e-05, "epoch": 3.1285373845695563, "percentage": 31.29, "elapsed_time": "1:27:22", "remaining_time": "3:11:53", "throughput": 2310.4, "total_tokens": 12111536} {"current_steps": 21010, "total_steps": 67140, "loss": 0.6177, "lr": 4.3407546667401776e-05, "epoch": 3.1292820971105155, "percentage": 31.29, "elapsed_time": "1:27:23", "remaining_time": "3:11:52", "throughput": 2310.48, "total_tokens": 12114704} {"current_steps": 21015, "total_steps": 67140, "loss": 0.6403, "lr": 4.34031485826076e-05, "epoch": 3.1300268096514747, "percentage": 31.3, "elapsed_time": "1:27:24", "remaining_time": "3:11:50", "throughput": 2310.52, "total_tokens": 12117488} {"current_steps": 21020, "total_steps": 67140, "loss": 0.7171, "lr": 4.339874925420347e-05, "epoch": 3.1307715221924335, "percentage": 31.31, "elapsed_time": "1:27:25", "remaining_time": "3:11:49", "throughput": 2310.56, "total_tokens": 12120304} {"current_steps": 21025, "total_steps": 67140, "loss": 0.5373, "lr": 4.339434868248665e-05, "epoch": 3.131516234733393, "percentage": 31.32, "elapsed_time": "1:27:26", "remaining_time": "3:11:47", "throughput": 2310.63, "total_tokens": 12123280} {"current_steps": 21030, "total_steps": 67140, "loss": 0.6247, "lr": 4.3389946867754546e-05, "epoch": 3.132260947274352, "percentage": 31.32, "elapsed_time": "1:27:27", "remaining_time": "3:11:46", "throughput": 2310.66, "total_tokens": 12125968} {"current_steps": 21035, "total_steps": 67140, "loss": 0.6108, "lr": 4.338554381030459e-05, "epoch": 3.133005659815311, "percentage": 31.33, "elapsed_time": "1:27:28", "remaining_time": "3:11:44", "throughput": 2310.69, "total_tokens": 12128784} {"current_steps": 21040, "total_steps": 67140, "loss": 0.6924, "lr": 4.338113951043436e-05, "epoch": 3.1337503723562703, "percentage": 31.34, "elapsed_time": "1:27:30", "remaining_time": "3:11:43", "throughput": 2310.73, "total_tokens": 12131632} {"current_steps": 21045, "total_steps": 67140, "loss": 0.7183, "lr": 4.337673396844143e-05, "epoch": 3.1344950848972295, "percentage": 31.34, "elapsed_time": "1:27:31", "remaining_time": "3:11:41", "throughput": 2310.78, "total_tokens": 12134512} {"current_steps": 21050, "total_steps": 67140, "loss": 0.7288, "lr": 4.337232718462354e-05, "epoch": 3.1352397974381887, "percentage": 31.35, "elapsed_time": "1:27:32", "remaining_time": "3:11:40", "throughput": 2310.87, "total_tokens": 12137744} {"current_steps": 21055, "total_steps": 67140, "loss": 0.5002, "lr": 4.336791915927847e-05, "epoch": 3.135984509979148, "percentage": 31.36, "elapsed_time": "1:27:33", "remaining_time": "3:11:38", "throughput": 2310.92, "total_tokens": 12140528} {"current_steps": 21060, "total_steps": 67140, "loss": 0.7549, "lr": 4.3363509892704114e-05, "epoch": 3.136729222520107, "percentage": 31.37, "elapsed_time": "1:27:34", "remaining_time": "3:11:37", "throughput": 2310.96, "total_tokens": 12143376} {"current_steps": 21065, "total_steps": 67140, "loss": 0.7128, "lr": 4.335909938519841e-05, "epoch": 3.1374739350610663, "percentage": 31.37, "elapsed_time": "1:27:35", "remaining_time": "3:11:35", "throughput": 2310.99, "total_tokens": 12146064} {"current_steps": 21070, "total_steps": 67140, "loss": 0.6231, "lr": 4.3354687637059414e-05, "epoch": 3.1382186476020255, "percentage": 31.38, "elapsed_time": "1:27:36", "remaining_time": "3:11:34", "throughput": 2311.08, "total_tokens": 12149328} {"current_steps": 21075, "total_steps": 67140, "loss": 0.7109, "lr": 4.335027464858526e-05, "epoch": 3.1389633601429847, "percentage": 31.39, "elapsed_time": "1:27:38", "remaining_time": "3:11:33", "throughput": 2311.1, "total_tokens": 12152048} {"current_steps": 21080, "total_steps": 67140, "loss": 0.4886, "lr": 4.334586042007414e-05, "epoch": 3.139708072683944, "percentage": 31.4, "elapsed_time": "1:27:39", "remaining_time": "3:11:31", "throughput": 2311.14, "total_tokens": 12154864} {"current_steps": 21085, "total_steps": 67140, "loss": 0.6294, "lr": 4.3341444951824365e-05, "epoch": 3.140452785224903, "percentage": 31.4, "elapsed_time": "1:27:40", "remaining_time": "3:11:30", "throughput": 2311.22, "total_tokens": 12158032} {"current_steps": 21090, "total_steps": 67140, "loss": 0.8125, "lr": 4.3337028244134315e-05, "epoch": 3.1411974977658623, "percentage": 31.41, "elapsed_time": "1:27:41", "remaining_time": "3:11:28", "throughput": 2311.24, "total_tokens": 12160656} {"current_steps": 21095, "total_steps": 67140, "loss": 0.6005, "lr": 4.3332610297302445e-05, "epoch": 3.1419422103068215, "percentage": 31.42, "elapsed_time": "1:27:42", "remaining_time": "3:11:26", "throughput": 2311.27, "total_tokens": 12163376} {"current_steps": 21100, "total_steps": 67140, "loss": 0.602, "lr": 4.3328191111627306e-05, "epoch": 3.1426869228477807, "percentage": 31.43, "elapsed_time": "1:27:43", "remaining_time": "3:11:25", "throughput": 2311.31, "total_tokens": 12166192} {"current_steps": 21105, "total_steps": 67140, "loss": 0.5194, "lr": 4.332377068740753e-05, "epoch": 3.14343163538874, "percentage": 31.43, "elapsed_time": "1:27:44", "remaining_time": "3:11:24", "throughput": 2311.4, "total_tokens": 12169360} {"current_steps": 21110, "total_steps": 67140, "loss": 0.6859, "lr": 4.331934902494184e-05, "epoch": 3.144176347929699, "percentage": 31.44, "elapsed_time": "1:27:46", "remaining_time": "3:11:22", "throughput": 2311.42, "total_tokens": 12171984} {"current_steps": 21115, "total_steps": 67140, "loss": 0.5591, "lr": 4.331492612452901e-05, "epoch": 3.1449210604706583, "percentage": 31.45, "elapsed_time": "1:27:47", "remaining_time": "3:11:20", "throughput": 2311.43, "total_tokens": 12174576} {"current_steps": 21120, "total_steps": 67140, "loss": 0.6655, "lr": 4.331050198646794e-05, "epoch": 3.1456657730116175, "percentage": 31.46, "elapsed_time": "1:27:48", "remaining_time": "3:11:19", "throughput": 2311.45, "total_tokens": 12177296} {"current_steps": 21125, "total_steps": 67140, "loss": 0.6941, "lr": 4.330607661105759e-05, "epoch": 3.1464104855525767, "percentage": 31.46, "elapsed_time": "1:27:49", "remaining_time": "3:11:17", "throughput": 2311.52, "total_tokens": 12180304} {"current_steps": 21130, "total_steps": 67140, "loss": 0.6464, "lr": 4.330164999859702e-05, "epoch": 3.147155198093536, "percentage": 31.47, "elapsed_time": "1:27:50", "remaining_time": "3:11:16", "throughput": 2311.59, "total_tokens": 12183408} {"current_steps": 21135, "total_steps": 67140, "loss": 0.7609, "lr": 4.3297222149385336e-05, "epoch": 3.147899910634495, "percentage": 31.48, "elapsed_time": "1:27:51", "remaining_time": "3:11:15", "throughput": 2311.63, "total_tokens": 12186192} {"current_steps": 21140, "total_steps": 67140, "loss": 0.7504, "lr": 4.329279306372178e-05, "epoch": 3.1486446231754543, "percentage": 31.49, "elapsed_time": "1:27:52", "remaining_time": "3:11:13", "throughput": 2311.68, "total_tokens": 12189136} {"current_steps": 21145, "total_steps": 67140, "loss": 0.6324, "lr": 4.3288362741905635e-05, "epoch": 3.1493893357164136, "percentage": 31.49, "elapsed_time": "1:27:54", "remaining_time": "3:11:12", "throughput": 2311.75, "total_tokens": 12192176} {"current_steps": 21150, "total_steps": 67140, "loss": 0.5897, "lr": 4.32839311842363e-05, "epoch": 3.1501340482573728, "percentage": 31.5, "elapsed_time": "1:27:55", "remaining_time": "3:11:10", "throughput": 2311.8, "total_tokens": 12195056} {"current_steps": 21155, "total_steps": 67140, "loss": 0.399, "lr": 4.327949839101323e-05, "epoch": 3.150878760798332, "percentage": 31.51, "elapsed_time": "1:27:56", "remaining_time": "3:11:09", "throughput": 2311.82, "total_tokens": 12197712} {"current_steps": 21160, "total_steps": 67140, "loss": 0.6521, "lr": 4.3275064362535966e-05, "epoch": 3.151623473339291, "percentage": 31.52, "elapsed_time": "1:27:57", "remaining_time": "3:11:07", "throughput": 2311.91, "total_tokens": 12200944} {"current_steps": 21165, "total_steps": 67140, "loss": 0.5447, "lr": 4.327062909910417e-05, "epoch": 3.1523681858802504, "percentage": 31.52, "elapsed_time": "1:27:58", "remaining_time": "3:11:06", "throughput": 2311.91, "total_tokens": 12203472} {"current_steps": 21170, "total_steps": 67140, "loss": 0.5308, "lr": 4.326619260101753e-05, "epoch": 3.1531128984212096, "percentage": 31.53, "elapsed_time": "1:27:59", "remaining_time": "3:11:04", "throughput": 2311.95, "total_tokens": 12206256} {"current_steps": 21175, "total_steps": 67140, "loss": 0.692, "lr": 4.326175486857587e-05, "epoch": 3.1538576109621688, "percentage": 31.54, "elapsed_time": "1:28:00", "remaining_time": "3:11:03", "throughput": 2312.0, "total_tokens": 12209200} {"current_steps": 21180, "total_steps": 67140, "loss": 0.8347, "lr": 4.3257315902079055e-05, "epoch": 3.154602323503128, "percentage": 31.55, "elapsed_time": "1:28:01", "remaining_time": "3:11:01", "throughput": 2312.03, "total_tokens": 12211888} {"current_steps": 21185, "total_steps": 67140, "loss": 0.6439, "lr": 4.3252875701827064e-05, "epoch": 3.155347036044087, "percentage": 31.55, "elapsed_time": "1:28:03", "remaining_time": "3:11:00", "throughput": 2312.08, "total_tokens": 12214800} {"current_steps": 21190, "total_steps": 67140, "loss": 0.7016, "lr": 4.324843426811994e-05, "epoch": 3.1560917485850464, "percentage": 31.56, "elapsed_time": "1:28:04", "remaining_time": "3:10:58", "throughput": 2312.17, "total_tokens": 12218032} {"current_steps": 21195, "total_steps": 67140, "loss": 0.5255, "lr": 4.324399160125782e-05, "epoch": 3.156836461126005, "percentage": 31.57, "elapsed_time": "1:28:05", "remaining_time": "3:10:57", "throughput": 2312.21, "total_tokens": 12220816} {"current_steps": 21200, "total_steps": 67140, "loss": 0.6889, "lr": 4.323954770154093e-05, "epoch": 3.157581173666965, "percentage": 31.58, "elapsed_time": "1:28:06", "remaining_time": "3:10:55", "throughput": 2312.27, "total_tokens": 12223824} {"current_steps": 21205, "total_steps": 67140, "loss": 0.567, "lr": 4.323510256926956e-05, "epoch": 3.1583258862079235, "percentage": 31.58, "elapsed_time": "1:28:07", "remaining_time": "3:10:54", "throughput": 2312.35, "total_tokens": 12226928} {"current_steps": 21210, "total_steps": 67140, "loss": 0.4709, "lr": 4.323065620474409e-05, "epoch": 3.1590705987488827, "percentage": 31.59, "elapsed_time": "1:28:08", "remaining_time": "3:10:52", "throughput": 2312.39, "total_tokens": 12229808} {"current_steps": 21215, "total_steps": 67140, "loss": 0.4851, "lr": 4.3226208608265e-05, "epoch": 3.159815311289842, "percentage": 31.6, "elapsed_time": "1:28:09", "remaining_time": "3:10:51", "throughput": 2312.4, "total_tokens": 12232400} {"current_steps": 21220, "total_steps": 67140, "loss": 0.6456, "lr": 4.322175978013283e-05, "epoch": 3.160560023830801, "percentage": 31.61, "elapsed_time": "1:28:11", "remaining_time": "3:10:49", "throughput": 2312.46, "total_tokens": 12235344} {"current_steps": 21225, "total_steps": 67140, "loss": 0.6154, "lr": 4.321730972064823e-05, "epoch": 3.1613047363717603, "percentage": 31.61, "elapsed_time": "1:28:12", "remaining_time": "3:10:48", "throughput": 2312.49, "total_tokens": 12238096} {"current_steps": 21230, "total_steps": 67140, "loss": 0.7059, "lr": 4.32128584301119e-05, "epoch": 3.1620494489127196, "percentage": 31.62, "elapsed_time": "1:28:13", "remaining_time": "3:10:46", "throughput": 2312.56, "total_tokens": 12241168} {"current_steps": 21235, "total_steps": 67140, "loss": 0.384, "lr": 4.320840590882464e-05, "epoch": 3.1627941614536788, "percentage": 31.63, "elapsed_time": "1:28:14", "remaining_time": "3:10:45", "throughput": 2312.62, "total_tokens": 12244112} {"current_steps": 21240, "total_steps": 67140, "loss": 0.8253, "lr": 4.320395215708734e-05, "epoch": 3.163538873994638, "percentage": 31.64, "elapsed_time": "1:28:15", "remaining_time": "3:10:44", "throughput": 2312.72, "total_tokens": 12247440} {"current_steps": 21245, "total_steps": 67140, "loss": 0.6139, "lr": 4.319949717520096e-05, "epoch": 3.164283586535597, "percentage": 31.64, "elapsed_time": "1:28:16", "remaining_time": "3:10:42", "throughput": 2312.76, "total_tokens": 12250256} {"current_steps": 21250, "total_steps": 67140, "loss": 0.69, "lr": 4.319504096346657e-05, "epoch": 3.1650282990765564, "percentage": 31.65, "elapsed_time": "1:28:17", "remaining_time": "3:10:40", "throughput": 2312.79, "total_tokens": 12252944} {"current_steps": 21255, "total_steps": 67140, "loss": 0.7443, "lr": 4.319058352218528e-05, "epoch": 3.1657730116175156, "percentage": 31.66, "elapsed_time": "1:28:19", "remaining_time": "3:10:39", "throughput": 2312.82, "total_tokens": 12255696} {"current_steps": 21260, "total_steps": 67140, "loss": 0.6291, "lr": 4.3186124851658305e-05, "epoch": 3.1665177241584748, "percentage": 31.67, "elapsed_time": "1:28:20", "remaining_time": "3:10:37", "throughput": 2312.86, "total_tokens": 12258544} {"current_steps": 21265, "total_steps": 67140, "loss": 0.7026, "lr": 4.318166495218696e-05, "epoch": 3.167262436699434, "percentage": 31.67, "elapsed_time": "1:28:21", "remaining_time": "3:10:36", "throughput": 2312.96, "total_tokens": 12261808} {"current_steps": 21270, "total_steps": 67140, "loss": 0.7023, "lr": 4.317720382407262e-05, "epoch": 3.168007149240393, "percentage": 31.68, "elapsed_time": "1:28:22", "remaining_time": "3:10:35", "throughput": 2313.0, "total_tokens": 12264592} {"current_steps": 21275, "total_steps": 67140, "loss": 0.5906, "lr": 4.317274146761674e-05, "epoch": 3.1687518617813524, "percentage": 31.69, "elapsed_time": "1:28:23", "remaining_time": "3:10:33", "throughput": 2313.05, "total_tokens": 12267440} {"current_steps": 21280, "total_steps": 67140, "loss": 0.7074, "lr": 4.316827788312089e-05, "epoch": 3.1694965743223116, "percentage": 31.69, "elapsed_time": "1:28:24", "remaining_time": "3:10:32", "throughput": 2313.11, "total_tokens": 12270416} {"current_steps": 21285, "total_steps": 67140, "loss": 0.5547, "lr": 4.316381307088668e-05, "epoch": 3.170241286863271, "percentage": 31.7, "elapsed_time": "1:28:25", "remaining_time": "3:10:30", "throughput": 2313.17, "total_tokens": 12273424} {"current_steps": 21290, "total_steps": 67140, "loss": 0.6956, "lr": 4.315934703121583e-05, "epoch": 3.17098599940423, "percentage": 31.71, "elapsed_time": "1:28:27", "remaining_time": "3:10:29", "throughput": 2313.19, "total_tokens": 12276080} {"current_steps": 21295, "total_steps": 67140, "loss": 0.5839, "lr": 4.315487976441014e-05, "epoch": 3.171730711945189, "percentage": 31.72, "elapsed_time": "1:28:28", "remaining_time": "3:10:27", "throughput": 2313.26, "total_tokens": 12279152} {"current_steps": 21300, "total_steps": 67140, "loss": 0.5938, "lr": 4.3150411270771486e-05, "epoch": 3.1724754244861484, "percentage": 31.72, "elapsed_time": "1:28:29", "remaining_time": "3:10:26", "throughput": 2313.34, "total_tokens": 12282352} {"current_steps": 21305, "total_steps": 67140, "loss": 0.7018, "lr": 4.3145941550601836e-05, "epoch": 3.1732201370271076, "percentage": 31.73, "elapsed_time": "1:28:30", "remaining_time": "3:10:24", "throughput": 2313.37, "total_tokens": 12285040} {"current_steps": 21310, "total_steps": 67140, "loss": 0.6305, "lr": 4.314147060420323e-05, "epoch": 3.173964849568067, "percentage": 31.74, "elapsed_time": "1:28:31", "remaining_time": "3:10:23", "throughput": 2313.43, "total_tokens": 12288016} {"current_steps": 21315, "total_steps": 67140, "loss": 0.7711, "lr": 4.31369984318778e-05, "epoch": 3.174709562109026, "percentage": 31.75, "elapsed_time": "1:28:32", "remaining_time": "3:10:21", "throughput": 2313.48, "total_tokens": 12290896} {"current_steps": 21320, "total_steps": 67140, "loss": 0.6977, "lr": 4.313252503392775e-05, "epoch": 3.175454274649985, "percentage": 31.75, "elapsed_time": "1:28:33", "remaining_time": "3:10:20", "throughput": 2313.55, "total_tokens": 12293904} {"current_steps": 21325, "total_steps": 67140, "loss": 0.6321, "lr": 4.3128050410655384e-05, "epoch": 3.1761989871909444, "percentage": 31.76, "elapsed_time": "1:28:35", "remaining_time": "3:10:18", "throughput": 2313.6, "total_tokens": 12296784} {"current_steps": 21330, "total_steps": 67140, "loss": 0.5445, "lr": 4.312357456236308e-05, "epoch": 3.1769436997319036, "percentage": 31.77, "elapsed_time": "1:28:36", "remaining_time": "3:10:17", "throughput": 2313.7, "total_tokens": 12300112} {"current_steps": 21335, "total_steps": 67140, "loss": 0.6752, "lr": 4.3119097489353285e-05, "epoch": 3.177688412272863, "percentage": 31.78, "elapsed_time": "1:28:37", "remaining_time": "3:10:16", "throughput": 2313.76, "total_tokens": 12303120} {"current_steps": 21340, "total_steps": 67140, "loss": 0.6823, "lr": 4.311461919192855e-05, "epoch": 3.178433124813822, "percentage": 31.78, "elapsed_time": "1:28:38", "remaining_time": "3:10:14", "throughput": 2313.82, "total_tokens": 12306064} {"current_steps": 21345, "total_steps": 67140, "loss": 0.6722, "lr": 4.31101396703915e-05, "epoch": 3.179177837354781, "percentage": 31.79, "elapsed_time": "1:28:39", "remaining_time": "3:10:13", "throughput": 2313.86, "total_tokens": 12308912} {"current_steps": 21350, "total_steps": 67140, "loss": 0.5198, "lr": 4.310565892504484e-05, "epoch": 3.1799225498957404, "percentage": 31.8, "elapsed_time": "1:28:40", "remaining_time": "3:10:11", "throughput": 2313.91, "total_tokens": 12311792} {"current_steps": 21355, "total_steps": 67140, "loss": 0.7182, "lr": 4.3101176956191365e-05, "epoch": 3.1806672624366996, "percentage": 31.81, "elapsed_time": "1:28:41", "remaining_time": "3:10:10", "throughput": 2313.94, "total_tokens": 12314544} {"current_steps": 21360, "total_steps": 67140, "loss": 0.5677, "lr": 4.309669376413394e-05, "epoch": 3.181411974977659, "percentage": 31.81, "elapsed_time": "1:28:43", "remaining_time": "3:10:08", "throughput": 2313.99, "total_tokens": 12317456} {"current_steps": 21365, "total_steps": 67140, "loss": 0.5628, "lr": 4.309220934917553e-05, "epoch": 3.182156687518618, "percentage": 31.82, "elapsed_time": "1:28:44", "remaining_time": "3:10:07", "throughput": 2314.04, "total_tokens": 12320400} {"current_steps": 21370, "total_steps": 67140, "loss": 0.7105, "lr": 4.3087723711619166e-05, "epoch": 3.182901400059577, "percentage": 31.83, "elapsed_time": "1:28:45", "remaining_time": "3:10:05", "throughput": 2314.06, "total_tokens": 12323120} {"current_steps": 21375, "total_steps": 67140, "loss": 0.6346, "lr": 4.3083236851767976e-05, "epoch": 3.1836461126005364, "percentage": 31.84, "elapsed_time": "1:28:46", "remaining_time": "3:10:04", "throughput": 2314.1, "total_tokens": 12325936} {"current_steps": 21380, "total_steps": 67140, "loss": 0.6293, "lr": 4.307874876992516e-05, "epoch": 3.184390825141495, "percentage": 31.84, "elapsed_time": "1:28:47", "remaining_time": "3:10:02", "throughput": 2314.14, "total_tokens": 12328816} {"current_steps": 21385, "total_steps": 67140, "loss": 0.7608, "lr": 4.307425946639401e-05, "epoch": 3.1851355376824544, "percentage": 31.85, "elapsed_time": "1:28:48", "remaining_time": "3:10:01", "throughput": 2314.21, "total_tokens": 12331856} {"current_steps": 21390, "total_steps": 67140, "loss": 0.683, "lr": 4.3069768941477885e-05, "epoch": 3.1858802502234136, "percentage": 31.86, "elapsed_time": "1:28:49", "remaining_time": "3:09:59", "throughput": 2314.27, "total_tokens": 12334864} {"current_steps": 21395, "total_steps": 67140, "loss": 0.5193, "lr": 4.3065277195480235e-05, "epoch": 3.186624962764373, "percentage": 31.87, "elapsed_time": "1:28:50", "remaining_time": "3:09:58", "throughput": 2314.27, "total_tokens": 12337328} {"current_steps": 21400, "total_steps": 67140, "loss": 0.7364, "lr": 4.306078422870461e-05, "epoch": 3.187369675305332, "percentage": 31.87, "elapsed_time": "1:28:52", "remaining_time": "3:09:56", "throughput": 2314.33, "total_tokens": 12340400} {"current_steps": 21405, "total_steps": 67140, "loss": 0.7411, "lr": 4.3056290041454615e-05, "epoch": 3.188114387846291, "percentage": 31.88, "elapsed_time": "1:28:53", "remaining_time": "3:09:55", "throughput": 2314.38, "total_tokens": 12343280} {"current_steps": 21410, "total_steps": 67140, "loss": 0.5558, "lr": 4.3051794634033946e-05, "epoch": 3.1888591003872504, "percentage": 31.89, "elapsed_time": "1:28:54", "remaining_time": "3:09:53", "throughput": 2314.4, "total_tokens": 12345936} {"current_steps": 21415, "total_steps": 67140, "loss": 0.686, "lr": 4.304729800674639e-05, "epoch": 3.1896038129282096, "percentage": 31.9, "elapsed_time": "1:28:55", "remaining_time": "3:09:52", "throughput": 2314.45, "total_tokens": 12348880} {"current_steps": 21420, "total_steps": 67140, "loss": 0.5175, "lr": 4.304280015989581e-05, "epoch": 3.190348525469169, "percentage": 31.9, "elapsed_time": "1:28:56", "remaining_time": "3:09:51", "throughput": 2314.52, "total_tokens": 12351984} {"current_steps": 21425, "total_steps": 67140, "loss": 0.6182, "lr": 4.303830109378616e-05, "epoch": 3.191093238010128, "percentage": 31.91, "elapsed_time": "1:28:57", "remaining_time": "3:09:49", "throughput": 2314.57, "total_tokens": 12354896} {"current_steps": 21430, "total_steps": 67140, "loss": 0.4923, "lr": 4.303380080872145e-05, "epoch": 3.191837950551087, "percentage": 31.92, "elapsed_time": "1:28:59", "remaining_time": "3:09:48", "throughput": 2314.6, "total_tokens": 12357680} {"current_steps": 21435, "total_steps": 67140, "loss": 0.6038, "lr": 4.302929930500581e-05, "epoch": 3.1925826630920464, "percentage": 31.93, "elapsed_time": "1:29:00", "remaining_time": "3:09:46", "throughput": 2314.65, "total_tokens": 12360592} {"current_steps": 21440, "total_steps": 67140, "loss": 0.6848, "lr": 4.302479658294341e-05, "epoch": 3.1933273756330056, "percentage": 31.93, "elapsed_time": "1:29:01", "remaining_time": "3:09:45", "throughput": 2314.68, "total_tokens": 12363344} {"current_steps": 21445, "total_steps": 67140, "loss": 0.668, "lr": 4.3020292642838556e-05, "epoch": 3.194072088173965, "percentage": 31.94, "elapsed_time": "1:29:02", "remaining_time": "3:09:43", "throughput": 2314.74, "total_tokens": 12366352} {"current_steps": 21450, "total_steps": 67140, "loss": 0.4355, "lr": 4.301578748499558e-05, "epoch": 3.194816800714924, "percentage": 31.95, "elapsed_time": "1:29:03", "remaining_time": "3:09:42", "throughput": 2314.79, "total_tokens": 12369200} {"current_steps": 21455, "total_steps": 67140, "loss": 0.6735, "lr": 4.301128110971895e-05, "epoch": 3.1955615132558832, "percentage": 31.96, "elapsed_time": "1:29:04", "remaining_time": "3:09:40", "throughput": 2314.85, "total_tokens": 12372208} {"current_steps": 21460, "total_steps": 67140, "loss": 0.5654, "lr": 4.300677351731315e-05, "epoch": 3.1963062257968424, "percentage": 31.96, "elapsed_time": "1:29:05", "remaining_time": "3:09:39", "throughput": 2314.9, "total_tokens": 12375152} {"current_steps": 21465, "total_steps": 67140, "loss": 0.8125, "lr": 4.300226470808282e-05, "epoch": 3.1970509383378016, "percentage": 31.97, "elapsed_time": "1:29:07", "remaining_time": "3:09:37", "throughput": 2314.96, "total_tokens": 12378096} {"current_steps": 21470, "total_steps": 67140, "loss": 0.5632, "lr": 4.2997754682332626e-05, "epoch": 3.197795650878761, "percentage": 31.98, "elapsed_time": "1:29:08", "remaining_time": "3:09:36", "throughput": 2315.03, "total_tokens": 12381200} {"current_steps": 21475, "total_steps": 67140, "loss": 0.5234, "lr": 4.2993243440367345e-05, "epoch": 3.19854036341972, "percentage": 31.99, "elapsed_time": "1:29:09", "remaining_time": "3:09:34", "throughput": 2315.06, "total_tokens": 12383952} {"current_steps": 21480, "total_steps": 67140, "loss": 0.5282, "lr": 4.2988730982491824e-05, "epoch": 3.1992850759606792, "percentage": 31.99, "elapsed_time": "1:29:10", "remaining_time": "3:09:33", "throughput": 2315.09, "total_tokens": 12386672} {"current_steps": 21485, "total_steps": 67140, "loss": 0.678, "lr": 4.2984217309011e-05, "epoch": 3.2000297885016384, "percentage": 32.0, "elapsed_time": "1:29:11", "remaining_time": "3:09:31", "throughput": 2315.14, "total_tokens": 12389520} {"current_steps": 21490, "total_steps": 67140, "loss": 0.6022, "lr": 4.2979702420229894e-05, "epoch": 3.2007745010425976, "percentage": 32.01, "elapsed_time": "1:29:12", "remaining_time": "3:09:30", "throughput": 2315.21, "total_tokens": 12392560} {"current_steps": 21495, "total_steps": 67140, "loss": 0.5673, "lr": 4.29751863164536e-05, "epoch": 3.201519213583557, "percentage": 32.02, "elapsed_time": "1:29:13", "remaining_time": "3:09:28", "throughput": 2315.22, "total_tokens": 12395184} {"current_steps": 21500, "total_steps": 67140, "loss": 0.6188, "lr": 4.2970668997987294e-05, "epoch": 3.202263926124516, "percentage": 32.02, "elapsed_time": "1:29:14", "remaining_time": "3:09:27", "throughput": 2315.27, "total_tokens": 12398032} {"current_steps": 21505, "total_steps": 67140, "loss": 0.6591, "lr": 4.296615046513624e-05, "epoch": 3.2030086386654752, "percentage": 32.03, "elapsed_time": "1:29:16", "remaining_time": "3:09:25", "throughput": 2315.35, "total_tokens": 12401168} {"current_steps": 21510, "total_steps": 67140, "loss": 0.5939, "lr": 4.296163071820578e-05, "epoch": 3.2037533512064345, "percentage": 32.04, "elapsed_time": "1:29:17", "remaining_time": "3:09:24", "throughput": 2315.41, "total_tokens": 12404144} {"current_steps": 21515, "total_steps": 67140, "loss": 0.721, "lr": 4.295710975750135e-05, "epoch": 3.2044980637473937, "percentage": 32.04, "elapsed_time": "1:29:18", "remaining_time": "3:09:23", "throughput": 2315.48, "total_tokens": 12407216} {"current_steps": 21520, "total_steps": 67140, "loss": 0.8653, "lr": 4.295258758332845e-05, "epoch": 3.205242776288353, "percentage": 32.05, "elapsed_time": "1:29:19", "remaining_time": "3:09:21", "throughput": 2315.5, "total_tokens": 12409904} {"current_steps": 21525, "total_steps": 67140, "loss": 0.5928, "lr": 4.294806419599267e-05, "epoch": 3.205987488829312, "percentage": 32.06, "elapsed_time": "1:29:20", "remaining_time": "3:09:20", "throughput": 2315.58, "total_tokens": 12413008} {"current_steps": 21530, "total_steps": 67140, "loss": 0.7647, "lr": 4.2943539595799675e-05, "epoch": 3.2067322013702713, "percentage": 32.07, "elapsed_time": "1:29:21", "remaining_time": "3:09:18", "throughput": 2315.62, "total_tokens": 12415888} {"current_steps": 21535, "total_steps": 67140, "loss": 0.6305, "lr": 4.293901378305523e-05, "epoch": 3.2074769139112305, "percentage": 32.07, "elapsed_time": "1:29:22", "remaining_time": "3:09:17", "throughput": 2315.67, "total_tokens": 12418800} {"current_steps": 21540, "total_steps": 67140, "loss": 0.6732, "lr": 4.2934486758065176e-05, "epoch": 3.2082216264521897, "percentage": 32.08, "elapsed_time": "1:29:24", "remaining_time": "3:09:15", "throughput": 2315.72, "total_tokens": 12421680} {"current_steps": 21545, "total_steps": 67140, "loss": 0.7111, "lr": 4.292995852113542e-05, "epoch": 3.2089663389931484, "percentage": 32.09, "elapsed_time": "1:29:25", "remaining_time": "3:09:14", "throughput": 2315.79, "total_tokens": 12424816} {"current_steps": 21550, "total_steps": 67140, "loss": 0.4836, "lr": 4.292542907257196e-05, "epoch": 3.2097110515341076, "percentage": 32.1, "elapsed_time": "1:29:26", "remaining_time": "3:09:12", "throughput": 2315.81, "total_tokens": 12427472} {"current_steps": 21555, "total_steps": 67140, "loss": 0.6532, "lr": 4.292089841268089e-05, "epoch": 3.210455764075067, "percentage": 32.1, "elapsed_time": "1:29:27", "remaining_time": "3:09:11", "throughput": 2315.88, "total_tokens": 12430480} {"current_steps": 21560, "total_steps": 67140, "loss": 0.6472, "lr": 4.291636654176836e-05, "epoch": 3.211200476616026, "percentage": 32.11, "elapsed_time": "1:29:28", "remaining_time": "3:09:09", "throughput": 2315.92, "total_tokens": 12433360} {"current_steps": 21565, "total_steps": 67140, "loss": 0.5084, "lr": 4.291183346014063e-05, "epoch": 3.2119451891569852, "percentage": 32.12, "elapsed_time": "1:29:29", "remaining_time": "3:09:08", "throughput": 2315.98, "total_tokens": 12436336} {"current_steps": 21570, "total_steps": 67140, "loss": 0.6348, "lr": 4.290729916810401e-05, "epoch": 3.2126899016979444, "percentage": 32.13, "elapsed_time": "1:29:30", "remaining_time": "3:09:06", "throughput": 2316.02, "total_tokens": 12439184} {"current_steps": 21575, "total_steps": 67140, "loss": 0.6525, "lr": 4.290276366596492e-05, "epoch": 3.2134346142389036, "percentage": 32.13, "elapsed_time": "1:29:32", "remaining_time": "3:09:05", "throughput": 2316.05, "total_tokens": 12442000} {"current_steps": 21580, "total_steps": 67140, "loss": 0.7474, "lr": 4.2898226954029844e-05, "epoch": 3.214179326779863, "percentage": 32.14, "elapsed_time": "1:29:33", "remaining_time": "3:09:03", "throughput": 2316.08, "total_tokens": 12444720} {"current_steps": 21585, "total_steps": 67140, "loss": 0.5047, "lr": 4.289368903260536e-05, "epoch": 3.214924039320822, "percentage": 32.15, "elapsed_time": "1:29:34", "remaining_time": "3:09:02", "throughput": 2316.11, "total_tokens": 12447440} {"current_steps": 21590, "total_steps": 67140, "loss": 0.7448, "lr": 4.288914990199814e-05, "epoch": 3.2156687518617812, "percentage": 32.16, "elapsed_time": "1:29:35", "remaining_time": "3:09:00", "throughput": 2316.15, "total_tokens": 12450256} {"current_steps": 21595, "total_steps": 67140, "loss": 0.663, "lr": 4.288460956251489e-05, "epoch": 3.2164134644027405, "percentage": 32.16, "elapsed_time": "1:29:36", "remaining_time": "3:08:59", "throughput": 2316.19, "total_tokens": 12453136} {"current_steps": 21600, "total_steps": 67140, "loss": 0.6654, "lr": 4.288006801446243e-05, "epoch": 3.2171581769436997, "percentage": 32.17, "elapsed_time": "1:29:37", "remaining_time": "3:08:58", "throughput": 2316.27, "total_tokens": 12456272} {"current_steps": 21605, "total_steps": 67140, "loss": 0.7383, "lr": 4.287552525814768e-05, "epoch": 3.217902889484659, "percentage": 32.18, "elapsed_time": "1:29:38", "remaining_time": "3:08:56", "throughput": 2316.29, "total_tokens": 12458992} {"current_steps": 21610, "total_steps": 67140, "loss": 0.7141, "lr": 4.2870981293877605e-05, "epoch": 3.218647602025618, "percentage": 32.19, "elapsed_time": "1:29:40", "remaining_time": "3:08:55", "throughput": 2316.34, "total_tokens": 12461936} {"current_steps": 21615, "total_steps": 67140, "loss": 0.5553, "lr": 4.286643612195927e-05, "epoch": 3.2193923145665773, "percentage": 32.19, "elapsed_time": "1:29:41", "remaining_time": "3:08:53", "throughput": 2316.37, "total_tokens": 12464656} {"current_steps": 21620, "total_steps": 67140, "loss": 0.4035, "lr": 4.286188974269983e-05, "epoch": 3.2201370271075365, "percentage": 32.2, "elapsed_time": "1:29:42", "remaining_time": "3:08:52", "throughput": 2316.41, "total_tokens": 12467600} {"current_steps": 21625, "total_steps": 67140, "loss": 0.784, "lr": 4.28573421564065e-05, "epoch": 3.2208817396484957, "percentage": 32.21, "elapsed_time": "1:29:43", "remaining_time": "3:08:50", "throughput": 2316.46, "total_tokens": 12470512} {"current_steps": 21630, "total_steps": 67140, "loss": 0.5835, "lr": 4.2852793363386585e-05, "epoch": 3.221626452189455, "percentage": 32.22, "elapsed_time": "1:29:44", "remaining_time": "3:08:49", "throughput": 2316.5, "total_tokens": 12473328} {"current_steps": 21635, "total_steps": 67140, "loss": 0.6938, "lr": 4.2848243363947484e-05, "epoch": 3.222371164730414, "percentage": 32.22, "elapsed_time": "1:29:45", "remaining_time": "3:08:47", "throughput": 2316.53, "total_tokens": 12476016} {"current_steps": 21640, "total_steps": 67140, "loss": 0.656, "lr": 4.2843692158396655e-05, "epoch": 3.2231158772713733, "percentage": 32.23, "elapsed_time": "1:29:46", "remaining_time": "3:08:46", "throughput": 2316.61, "total_tokens": 12479152} {"current_steps": 21645, "total_steps": 67140, "loss": 0.6826, "lr": 4.283913974704166e-05, "epoch": 3.2238605898123325, "percentage": 32.24, "elapsed_time": "1:29:47", "remaining_time": "3:08:44", "throughput": 2316.63, "total_tokens": 12481840} {"current_steps": 21650, "total_steps": 67140, "loss": 0.6625, "lr": 4.283458613019013e-05, "epoch": 3.2246053023532917, "percentage": 32.25, "elapsed_time": "1:29:49", "remaining_time": "3:08:43", "throughput": 2316.7, "total_tokens": 12484880} {"current_steps": 21655, "total_steps": 67140, "loss": 0.6579, "lr": 4.283003130814978e-05, "epoch": 3.225350014894251, "percentage": 32.25, "elapsed_time": "1:29:50", "remaining_time": "3:08:41", "throughput": 2316.72, "total_tokens": 12487536} {"current_steps": 21660, "total_steps": 67140, "loss": 0.6197, "lr": 4.2825475281228406e-05, "epoch": 3.22609472743521, "percentage": 32.26, "elapsed_time": "1:29:51", "remaining_time": "3:08:40", "throughput": 2316.76, "total_tokens": 12490320} {"current_steps": 21665, "total_steps": 67140, "loss": 0.7221, "lr": 4.282091804973388e-05, "epoch": 3.2268394399761693, "percentage": 32.27, "elapsed_time": "1:29:52", "remaining_time": "3:08:38", "throughput": 2316.8, "total_tokens": 12493200} {"current_steps": 21670, "total_steps": 67140, "loss": 0.5876, "lr": 4.2816359613974176e-05, "epoch": 3.2275841525171285, "percentage": 32.28, "elapsed_time": "1:29:53", "remaining_time": "3:08:37", "throughput": 2316.8, "total_tokens": 12495664} {"current_steps": 21675, "total_steps": 67140, "loss": 0.5871, "lr": 4.281179997425732e-05, "epoch": 3.2283288650580877, "percentage": 32.28, "elapsed_time": "1:29:54", "remaining_time": "3:08:35", "throughput": 2316.88, "total_tokens": 12498864} {"current_steps": 21680, "total_steps": 67140, "loss": 0.5802, "lr": 4.280723913089144e-05, "epoch": 3.229073577599047, "percentage": 32.29, "elapsed_time": "1:29:55", "remaining_time": "3:08:34", "throughput": 2316.91, "total_tokens": 12501648} {"current_steps": 21685, "total_steps": 67140, "loss": 0.533, "lr": 4.280267708418474e-05, "epoch": 3.229818290140006, "percentage": 32.3, "elapsed_time": "1:29:56", "remaining_time": "3:08:32", "throughput": 2316.95, "total_tokens": 12504464} {"current_steps": 21690, "total_steps": 67140, "loss": 0.6751, "lr": 4.279811383444551e-05, "epoch": 3.2305630026809653, "percentage": 32.31, "elapsed_time": "1:29:58", "remaining_time": "3:08:31", "throughput": 2317.04, "total_tokens": 12507664} {"current_steps": 21695, "total_steps": 67140, "loss": 0.5549, "lr": 4.2793549381982095e-05, "epoch": 3.2313077152219245, "percentage": 32.31, "elapsed_time": "1:29:59", "remaining_time": "3:08:29", "throughput": 2317.06, "total_tokens": 12510320} {"current_steps": 21700, "total_steps": 67140, "loss": 0.5537, "lr": 4.278898372710296e-05, "epoch": 3.2320524277628837, "percentage": 32.32, "elapsed_time": "1:30:00", "remaining_time": "3:08:28", "throughput": 2317.1, "total_tokens": 12513136} {"current_steps": 21705, "total_steps": 67140, "loss": 0.6049, "lr": 4.2784416870116635e-05, "epoch": 3.232797140303843, "percentage": 32.33, "elapsed_time": "1:30:01", "remaining_time": "3:08:26", "throughput": 2317.1, "total_tokens": 12515664} {"current_steps": 21710, "total_steps": 67140, "loss": 0.67, "lr": 4.2779848811331726e-05, "epoch": 3.233541852844802, "percentage": 32.34, "elapsed_time": "1:30:02", "remaining_time": "3:08:25", "throughput": 2317.14, "total_tokens": 12518512} {"current_steps": 21715, "total_steps": 67140, "loss": 0.6946, "lr": 4.2775279551056914e-05, "epoch": 3.2342865653857613, "percentage": 32.34, "elapsed_time": "1:30:03", "remaining_time": "3:08:23", "throughput": 2317.17, "total_tokens": 12521232} {"current_steps": 21720, "total_steps": 67140, "loss": 0.746, "lr": 4.277070908960098e-05, "epoch": 3.23503127792672, "percentage": 32.35, "elapsed_time": "1:30:04", "remaining_time": "3:08:22", "throughput": 2317.19, "total_tokens": 12523888} {"current_steps": 21725, "total_steps": 67140, "loss": 0.7889, "lr": 4.276613742727278e-05, "epoch": 3.2357759904676793, "percentage": 32.36, "elapsed_time": "1:30:05", "remaining_time": "3:08:20", "throughput": 2317.25, "total_tokens": 12526832} {"current_steps": 21730, "total_steps": 67140, "loss": 0.5858, "lr": 4.276156456438124e-05, "epoch": 3.2365207030086385, "percentage": 32.37, "elapsed_time": "1:30:07", "remaining_time": "3:08:19", "throughput": 2317.3, "total_tokens": 12529744} {"current_steps": 21735, "total_steps": 67140, "loss": 0.6806, "lr": 4.275699050123538e-05, "epoch": 3.2372654155495977, "percentage": 32.37, "elapsed_time": "1:30:08", "remaining_time": "3:08:17", "throughput": 2317.35, "total_tokens": 12532720} {"current_steps": 21740, "total_steps": 67140, "loss": 0.6459, "lr": 4.27524152381443e-05, "epoch": 3.238010128090557, "percentage": 32.38, "elapsed_time": "1:30:09", "remaining_time": "3:08:16", "throughput": 2317.39, "total_tokens": 12535504} {"current_steps": 21745, "total_steps": 67140, "loss": 0.6182, "lr": 4.2747838775417174e-05, "epoch": 3.238754840631516, "percentage": 32.39, "elapsed_time": "1:30:10", "remaining_time": "3:08:15", "throughput": 2317.48, "total_tokens": 12538768} {"current_steps": 21750, "total_steps": 67140, "loss": 0.8129, "lr": 4.2743261113363266e-05, "epoch": 3.2394995531724753, "percentage": 32.39, "elapsed_time": "1:30:11", "remaining_time": "3:08:13", "throughput": 2317.52, "total_tokens": 12541616} {"current_steps": 21755, "total_steps": 67140, "loss": 0.6863, "lr": 4.27386822522919e-05, "epoch": 3.2402442657134345, "percentage": 32.4, "elapsed_time": "1:30:12", "remaining_time": "3:08:12", "throughput": 2317.55, "total_tokens": 12544400} {"current_steps": 21760, "total_steps": 67140, "loss": 0.6453, "lr": 4.273410219251252e-05, "epoch": 3.2409889782543937, "percentage": 32.41, "elapsed_time": "1:30:13", "remaining_time": "3:08:10", "throughput": 2317.6, "total_tokens": 12547280} {"current_steps": 21765, "total_steps": 67140, "loss": 0.6469, "lr": 4.27295209343346e-05, "epoch": 3.241733690795353, "percentage": 32.42, "elapsed_time": "1:30:15", "remaining_time": "3:08:09", "throughput": 2317.65, "total_tokens": 12550224} {"current_steps": 21770, "total_steps": 67140, "loss": 0.7998, "lr": 4.2724938478067746e-05, "epoch": 3.242478403336312, "percentage": 32.42, "elapsed_time": "1:30:16", "remaining_time": "3:08:07", "throughput": 2317.7, "total_tokens": 12553072} {"current_steps": 21775, "total_steps": 67140, "loss": 0.6333, "lr": 4.2720354824021616e-05, "epoch": 3.2432231158772713, "percentage": 32.43, "elapsed_time": "1:30:17", "remaining_time": "3:08:06", "throughput": 2317.75, "total_tokens": 12556016} {"current_steps": 21780, "total_steps": 67140, "loss": 0.5724, "lr": 4.271576997250595e-05, "epoch": 3.2439678284182305, "percentage": 32.44, "elapsed_time": "1:30:18", "remaining_time": "3:08:04", "throughput": 2317.78, "total_tokens": 12558704} {"current_steps": 21785, "total_steps": 67140, "loss": 0.688, "lr": 4.271118392383058e-05, "epoch": 3.2447125409591897, "percentage": 32.45, "elapsed_time": "1:30:19", "remaining_time": "3:08:03", "throughput": 2317.85, "total_tokens": 12561808} {"current_steps": 21790, "total_steps": 67140, "loss": 0.6131, "lr": 4.2706596678305405e-05, "epoch": 3.245457253500149, "percentage": 32.45, "elapsed_time": "1:30:20", "remaining_time": "3:08:01", "throughput": 2317.92, "total_tokens": 12564912} {"current_steps": 21795, "total_steps": 67140, "loss": 0.5159, "lr": 4.2702008236240424e-05, "epoch": 3.246201966041108, "percentage": 32.46, "elapsed_time": "1:30:21", "remaining_time": "3:08:00", "throughput": 2317.96, "total_tokens": 12567760} {"current_steps": 21800, "total_steps": 67140, "loss": 0.626, "lr": 4.269741859794568e-05, "epoch": 3.2469466785820673, "percentage": 32.47, "elapsed_time": "1:30:23", "remaining_time": "3:07:58", "throughput": 2318.0, "total_tokens": 12570512} {"current_steps": 21805, "total_steps": 67140, "loss": 0.7033, "lr": 4.2692827763731356e-05, "epoch": 3.2476913911230265, "percentage": 32.48, "elapsed_time": "1:30:24", "remaining_time": "3:07:57", "throughput": 2318.04, "total_tokens": 12573360} {"current_steps": 21810, "total_steps": 67140, "loss": 0.6001, "lr": 4.268823573390766e-05, "epoch": 3.2484361036639857, "percentage": 32.48, "elapsed_time": "1:30:25", "remaining_time": "3:07:55", "throughput": 2318.05, "total_tokens": 12575984} {"current_steps": 21815, "total_steps": 67140, "loss": 0.7178, "lr": 4.26836425087849e-05, "epoch": 3.249180816204945, "percentage": 32.49, "elapsed_time": "1:30:26", "remaining_time": "3:07:54", "throughput": 2318.09, "total_tokens": 12578800} {"current_steps": 21820, "total_steps": 67140, "loss": 0.5227, "lr": 4.267904808867349e-05, "epoch": 3.249925528745904, "percentage": 32.5, "elapsed_time": "1:30:27", "remaining_time": "3:07:52", "throughput": 2318.1, "total_tokens": 12581424} {"current_steps": 21825, "total_steps": 67140, "loss": 0.6564, "lr": 4.267445247388389e-05, "epoch": 3.2506702412868633, "percentage": 32.51, "elapsed_time": "1:30:28", "remaining_time": "3:07:51", "throughput": 2318.17, "total_tokens": 12584464} {"current_steps": 21830, "total_steps": 67140, "loss": 0.6334, "lr": 4.2669855664726635e-05, "epoch": 3.2514149538278225, "percentage": 32.51, "elapsed_time": "1:30:29", "remaining_time": "3:07:49", "throughput": 2318.23, "total_tokens": 12587472} {"current_steps": 21835, "total_steps": 67140, "loss": 0.6821, "lr": 4.266525766151238e-05, "epoch": 3.2521596663687817, "percentage": 32.52, "elapsed_time": "1:30:30", "remaining_time": "3:07:48", "throughput": 2318.26, "total_tokens": 12590288} {"current_steps": 21840, "total_steps": 67140, "loss": 0.7353, "lr": 4.266065846455184e-05, "epoch": 3.252904378909741, "percentage": 32.53, "elapsed_time": "1:30:32", "remaining_time": "3:07:47", "throughput": 2318.32, "total_tokens": 12593296} {"current_steps": 21845, "total_steps": 67140, "loss": 0.6484, "lr": 4.26560580741558e-05, "epoch": 3.2536490914507, "percentage": 32.54, "elapsed_time": "1:30:33", "remaining_time": "3:07:45", "throughput": 2318.36, "total_tokens": 12596144} {"current_steps": 21850, "total_steps": 67140, "loss": 0.53, "lr": 4.2651456490635144e-05, "epoch": 3.2543938039916593, "percentage": 32.54, "elapsed_time": "1:30:34", "remaining_time": "3:07:44", "throughput": 2318.43, "total_tokens": 12599152} {"current_steps": 21855, "total_steps": 67140, "loss": 0.6845, "lr": 4.2646853714300816e-05, "epoch": 3.2551385165326185, "percentage": 32.55, "elapsed_time": "1:30:35", "remaining_time": "3:07:42", "throughput": 2318.46, "total_tokens": 12601904} {"current_steps": 21860, "total_steps": 67140, "loss": 0.5723, "lr": 4.264224974546387e-05, "epoch": 3.2558832290735777, "percentage": 32.56, "elapsed_time": "1:30:36", "remaining_time": "3:07:41", "throughput": 2318.52, "total_tokens": 12604880} {"current_steps": 21865, "total_steps": 67140, "loss": 0.7245, "lr": 4.263764458443541e-05, "epoch": 3.256627941614537, "percentage": 32.57, "elapsed_time": "1:30:37", "remaining_time": "3:07:39", "throughput": 2318.58, "total_tokens": 12607920} {"current_steps": 21870, "total_steps": 67140, "loss": 0.6624, "lr": 4.263303823152663e-05, "epoch": 3.257372654155496, "percentage": 32.57, "elapsed_time": "1:30:38", "remaining_time": "3:07:38", "throughput": 2318.64, "total_tokens": 12610960} {"current_steps": 21875, "total_steps": 67140, "loss": 0.7967, "lr": 4.262843068704883e-05, "epoch": 3.2581173666964554, "percentage": 32.58, "elapsed_time": "1:30:40", "remaining_time": "3:07:36", "throughput": 2318.68, "total_tokens": 12613840} {"current_steps": 21880, "total_steps": 67140, "loss": 0.6968, "lr": 4.262382195131335e-05, "epoch": 3.2588620792374146, "percentage": 32.59, "elapsed_time": "1:30:41", "remaining_time": "3:07:35", "throughput": 2318.72, "total_tokens": 12616688} {"current_steps": 21885, "total_steps": 67140, "loss": 0.6778, "lr": 4.2619212024631636e-05, "epoch": 3.2596067917783733, "percentage": 32.6, "elapsed_time": "1:30:42", "remaining_time": "3:07:33", "throughput": 2318.73, "total_tokens": 12619312} {"current_steps": 21890, "total_steps": 67140, "loss": 0.6229, "lr": 4.261460090731521e-05, "epoch": 3.260351504319333, "percentage": 32.6, "elapsed_time": "1:30:43", "remaining_time": "3:07:32", "throughput": 2318.78, "total_tokens": 12622192} {"current_steps": 21895, "total_steps": 67140, "loss": 0.7222, "lr": 4.2609988599675665e-05, "epoch": 3.2610962168602917, "percentage": 32.61, "elapsed_time": "1:30:44", "remaining_time": "3:07:30", "throughput": 2318.81, "total_tokens": 12624912} {"current_steps": 21900, "total_steps": 67140, "loss": 0.7248, "lr": 4.2605375102024694e-05, "epoch": 3.2618409294012514, "percentage": 32.62, "elapsed_time": "1:30:45", "remaining_time": "3:07:29", "throughput": 2318.94, "total_tokens": 12628592} {"current_steps": 21905, "total_steps": 67140, "loss": 0.6045, "lr": 4.2600760414674044e-05, "epoch": 3.26258564194221, "percentage": 32.63, "elapsed_time": "1:30:47", "remaining_time": "3:07:28", "throughput": 2319.0, "total_tokens": 12631632} {"current_steps": 21910, "total_steps": 67140, "loss": 0.8092, "lr": 4.259614453793557e-05, "epoch": 3.2633303544831693, "percentage": 32.63, "elapsed_time": "1:30:48", "remaining_time": "3:07:26", "throughput": 2319.06, "total_tokens": 12634672} {"current_steps": 21915, "total_steps": 67140, "loss": 0.6815, "lr": 4.25915274721212e-05, "epoch": 3.2640750670241285, "percentage": 32.64, "elapsed_time": "1:30:49", "remaining_time": "3:07:25", "throughput": 2319.1, "total_tokens": 12637520} {"current_steps": 21920, "total_steps": 67140, "loss": 0.6061, "lr": 4.258690921754291e-05, "epoch": 3.2648197795650877, "percentage": 32.65, "elapsed_time": "1:30:50", "remaining_time": "3:07:23", "throughput": 2319.11, "total_tokens": 12640144} {"current_steps": 21925, "total_steps": 67140, "loss": 0.6677, "lr": 4.25822897745128e-05, "epoch": 3.265564492106047, "percentage": 32.66, "elapsed_time": "1:30:51", "remaining_time": "3:07:22", "throughput": 2319.17, "total_tokens": 12643088} {"current_steps": 21930, "total_steps": 67140, "loss": 0.5959, "lr": 4.257766914334303e-05, "epoch": 3.266309204647006, "percentage": 32.66, "elapsed_time": "1:30:52", "remaining_time": "3:07:21", "throughput": 2319.2, "total_tokens": 12645904} {"current_steps": 21935, "total_steps": 67140, "loss": 0.6818, "lr": 4.257304732434585e-05, "epoch": 3.2670539171879653, "percentage": 32.67, "elapsed_time": "1:30:53", "remaining_time": "3:07:19", "throughput": 2319.24, "total_tokens": 12648784} {"current_steps": 21940, "total_steps": 67140, "loss": 0.6076, "lr": 4.256842431783358e-05, "epoch": 3.2677986297289245, "percentage": 32.68, "elapsed_time": "1:30:54", "remaining_time": "3:07:18", "throughput": 2319.28, "total_tokens": 12651632} {"current_steps": 21945, "total_steps": 67140, "loss": 0.5244, "lr": 4.256380012411862e-05, "epoch": 3.2685433422698837, "percentage": 32.69, "elapsed_time": "1:30:56", "remaining_time": "3:07:16", "throughput": 2319.33, "total_tokens": 12654544} {"current_steps": 21950, "total_steps": 67140, "loss": 0.7272, "lr": 4.255917474351345e-05, "epoch": 3.269288054810843, "percentage": 32.69, "elapsed_time": "1:30:57", "remaining_time": "3:07:15", "throughput": 2319.37, "total_tokens": 12657392} {"current_steps": 21955, "total_steps": 67140, "loss": 0.7261, "lr": 4.2554548176330655e-05, "epoch": 3.270032767351802, "percentage": 32.7, "elapsed_time": "1:30:58", "remaining_time": "3:07:13", "throughput": 2319.43, "total_tokens": 12660400} {"current_steps": 21960, "total_steps": 67140, "loss": 0.5965, "lr": 4.254992042288286e-05, "epoch": 3.2707774798927614, "percentage": 32.71, "elapsed_time": "1:30:59", "remaining_time": "3:07:12", "throughput": 2319.49, "total_tokens": 12663440} {"current_steps": 21965, "total_steps": 67140, "loss": 0.6538, "lr": 4.254529148348279e-05, "epoch": 3.2715221924337206, "percentage": 32.72, "elapsed_time": "1:31:00", "remaining_time": "3:07:10", "throughput": 2319.55, "total_tokens": 12666416} {"current_steps": 21970, "total_steps": 67140, "loss": 0.5986, "lr": 4.254066135844326e-05, "epoch": 3.2722669049746798, "percentage": 32.72, "elapsed_time": "1:31:01", "remaining_time": "3:07:09", "throughput": 2319.58, "total_tokens": 12669168} {"current_steps": 21975, "total_steps": 67140, "loss": 0.6021, "lr": 4.253603004807715e-05, "epoch": 3.273011617515639, "percentage": 32.73, "elapsed_time": "1:31:03", "remaining_time": "3:07:08", "throughput": 2319.66, "total_tokens": 12672368} {"current_steps": 21980, "total_steps": 67140, "loss": 0.6341, "lr": 4.253139755269743e-05, "epoch": 3.273756330056598, "percentage": 32.74, "elapsed_time": "1:31:04", "remaining_time": "3:07:06", "throughput": 2319.67, "total_tokens": 12674896} {"current_steps": 21985, "total_steps": 67140, "loss": 0.5273, "lr": 4.2526763872617137e-05, "epoch": 3.2745010425975574, "percentage": 32.75, "elapsed_time": "1:31:05", "remaining_time": "3:07:05", "throughput": 2319.74, "total_tokens": 12677968} {"current_steps": 21990, "total_steps": 67140, "loss": 0.6128, "lr": 4.2522129008149395e-05, "epoch": 3.2752457551385166, "percentage": 32.75, "elapsed_time": "1:31:06", "remaining_time": "3:07:03", "throughput": 2319.78, "total_tokens": 12680816} {"current_steps": 21995, "total_steps": 67140, "loss": 0.5147, "lr": 4.2517492959607426e-05, "epoch": 3.2759904676794758, "percentage": 32.76, "elapsed_time": "1:31:07", "remaining_time": "3:07:02", "throughput": 2319.82, "total_tokens": 12683664} {"current_steps": 22000, "total_steps": 67140, "loss": 0.5548, "lr": 4.251285572730449e-05, "epoch": 3.276735180220435, "percentage": 32.77, "elapsed_time": "1:31:08", "remaining_time": "3:07:00", "throughput": 2319.87, "total_tokens": 12686608} {"current_steps": 22005, "total_steps": 67140, "loss": 0.6129, "lr": 4.250821731155398e-05, "epoch": 3.277479892761394, "percentage": 32.77, "elapsed_time": "1:31:09", "remaining_time": "3:06:59", "throughput": 2319.91, "total_tokens": 12689392} {"current_steps": 22010, "total_steps": 67140, "loss": 0.7539, "lr": 4.250357771266932e-05, "epoch": 3.2782246053023534, "percentage": 32.78, "elapsed_time": "1:31:10", "remaining_time": "3:06:57", "throughput": 2319.95, "total_tokens": 12692240} {"current_steps": 22015, "total_steps": 67140, "loss": 0.5279, "lr": 4.249893693096404e-05, "epoch": 3.2789693178433126, "percentage": 32.79, "elapsed_time": "1:31:12", "remaining_time": "3:06:56", "throughput": 2320.01, "total_tokens": 12695344} {"current_steps": 22020, "total_steps": 67140, "loss": 0.7504, "lr": 4.249429496675175e-05, "epoch": 3.279714030384272, "percentage": 32.8, "elapsed_time": "1:31:13", "remaining_time": "3:06:54", "throughput": 2320.03, "total_tokens": 12697968} {"current_steps": 22025, "total_steps": 67140, "loss": 0.6132, "lr": 4.248965182034613e-05, "epoch": 3.280458742925231, "percentage": 32.8, "elapsed_time": "1:31:14", "remaining_time": "3:06:53", "throughput": 2320.11, "total_tokens": 12701200} {"current_steps": 22030, "total_steps": 67140, "loss": 0.5974, "lr": 4.248500749206096e-05, "epoch": 3.28120345546619, "percentage": 32.81, "elapsed_time": "1:31:15", "remaining_time": "3:06:52", "throughput": 2320.14, "total_tokens": 12704016} {"current_steps": 22035, "total_steps": 67140, "loss": 0.7065, "lr": 4.248036198221006e-05, "epoch": 3.2819481680071494, "percentage": 32.82, "elapsed_time": "1:31:16", "remaining_time": "3:06:50", "throughput": 2320.16, "total_tokens": 12706640} {"current_steps": 22040, "total_steps": 67140, "loss": 0.6839, "lr": 4.2475715291107374e-05, "epoch": 3.2826928805481086, "percentage": 32.83, "elapsed_time": "1:31:17", "remaining_time": "3:06:48", "throughput": 2320.19, "total_tokens": 12709392} {"current_steps": 22045, "total_steps": 67140, "loss": 0.5803, "lr": 4.24710674190669e-05, "epoch": 3.283437593089068, "percentage": 32.83, "elapsed_time": "1:31:18", "remaining_time": "3:06:47", "throughput": 2320.2, "total_tokens": 12711952} {"current_steps": 22050, "total_steps": 67140, "loss": 0.5041, "lr": 4.2466418366402715e-05, "epoch": 3.284182305630027, "percentage": 32.84, "elapsed_time": "1:31:19", "remaining_time": "3:06:45", "throughput": 2320.25, "total_tokens": 12714896} {"current_steps": 22055, "total_steps": 67140, "loss": 0.6409, "lr": 4.2461768133428993e-05, "epoch": 3.284927018170986, "percentage": 32.85, "elapsed_time": "1:31:21", "remaining_time": "3:06:44", "throughput": 2320.28, "total_tokens": 12717680} {"current_steps": 22060, "total_steps": 67140, "loss": 0.7414, "lr": 4.2457116720459975e-05, "epoch": 3.285671730711945, "percentage": 32.86, "elapsed_time": "1:31:22", "remaining_time": "3:06:43", "throughput": 2320.34, "total_tokens": 12720656} {"current_steps": 22065, "total_steps": 67140, "loss": 0.6332, "lr": 4.245246412780999e-05, "epoch": 3.2864164432529046, "percentage": 32.86, "elapsed_time": "1:31:23", "remaining_time": "3:06:41", "throughput": 2320.4, "total_tokens": 12723728} {"current_steps": 22070, "total_steps": 67140, "loss": 0.4434, "lr": 4.244781035579343e-05, "epoch": 3.2871611557938634, "percentage": 32.87, "elapsed_time": "1:31:24", "remaining_time": "3:06:40", "throughput": 2320.41, "total_tokens": 12726256} {"current_steps": 22075, "total_steps": 67140, "loss": 0.8371, "lr": 4.244315540472478e-05, "epoch": 3.2879058683348226, "percentage": 32.88, "elapsed_time": "1:31:25", "remaining_time": "3:06:38", "throughput": 2320.43, "total_tokens": 12728912} {"current_steps": 22080, "total_steps": 67140, "loss": 0.5718, "lr": 4.243849927491861e-05, "epoch": 3.2886505808757818, "percentage": 32.89, "elapsed_time": "1:31:26", "remaining_time": "3:06:37", "throughput": 2320.49, "total_tokens": 12731888} {"current_steps": 22085, "total_steps": 67140, "loss": 0.6594, "lr": 4.2433841966689564e-05, "epoch": 3.289395293416741, "percentage": 32.89, "elapsed_time": "1:31:27", "remaining_time": "3:06:35", "throughput": 2320.52, "total_tokens": 12734608} {"current_steps": 22090, "total_steps": 67140, "loss": 0.7304, "lr": 4.2429183480352354e-05, "epoch": 3.2901400059577, "percentage": 32.9, "elapsed_time": "1:31:28", "remaining_time": "3:06:34", "throughput": 2320.56, "total_tokens": 12737424} {"current_steps": 22095, "total_steps": 67140, "loss": 0.8623, "lr": 4.242452381622179e-05, "epoch": 3.2908847184986594, "percentage": 32.91, "elapsed_time": "1:31:30", "remaining_time": "3:06:32", "throughput": 2320.62, "total_tokens": 12740464} {"current_steps": 22100, "total_steps": 67140, "loss": 0.6853, "lr": 4.2419862974612744e-05, "epoch": 3.2916294310396186, "percentage": 32.92, "elapsed_time": "1:31:31", "remaining_time": "3:06:31", "throughput": 2320.67, "total_tokens": 12743408} {"current_steps": 22105, "total_steps": 67140, "loss": 0.6273, "lr": 4.2415200955840184e-05, "epoch": 3.292374143580578, "percentage": 32.92, "elapsed_time": "1:31:32", "remaining_time": "3:06:29", "throughput": 2320.69, "total_tokens": 12746000} {"current_steps": 22110, "total_steps": 67140, "loss": 0.6821, "lr": 4.241053776021915e-05, "epoch": 3.293118856121537, "percentage": 32.93, "elapsed_time": "1:31:33", "remaining_time": "3:06:28", "throughput": 2320.75, "total_tokens": 12749040} {"current_steps": 22115, "total_steps": 67140, "loss": 0.7408, "lr": 4.240587338806476e-05, "epoch": 3.293863568662496, "percentage": 32.94, "elapsed_time": "1:31:34", "remaining_time": "3:06:26", "throughput": 2320.8, "total_tokens": 12751920} {"current_steps": 22120, "total_steps": 67140, "loss": 0.6326, "lr": 4.2401207839692217e-05, "epoch": 3.2946082812034554, "percentage": 32.95, "elapsed_time": "1:31:35", "remaining_time": "3:06:25", "throughput": 2320.83, "total_tokens": 12754704} {"current_steps": 22125, "total_steps": 67140, "loss": 0.7631, "lr": 4.239654111541679e-05, "epoch": 3.2953529937444146, "percentage": 32.95, "elapsed_time": "1:31:36", "remaining_time": "3:06:23", "throughput": 2320.91, "total_tokens": 12757872} {"current_steps": 22130, "total_steps": 67140, "loss": 0.7011, "lr": 4.239187321555384e-05, "epoch": 3.296097706285374, "percentage": 32.96, "elapsed_time": "1:31:38", "remaining_time": "3:06:22", "throughput": 2320.99, "total_tokens": 12760976} {"current_steps": 22135, "total_steps": 67140, "loss": 0.742, "lr": 4.2387204140418815e-05, "epoch": 3.296842418826333, "percentage": 32.97, "elapsed_time": "1:31:39", "remaining_time": "3:06:21", "throughput": 2321.05, "total_tokens": 12763952} {"current_steps": 22140, "total_steps": 67140, "loss": 0.6405, "lr": 4.238253389032723e-05, "epoch": 3.297587131367292, "percentage": 32.98, "elapsed_time": "1:31:40", "remaining_time": "3:06:19", "throughput": 2321.12, "total_tokens": 12767056} {"current_steps": 22145, "total_steps": 67140, "loss": 0.8291, "lr": 4.237786246559467e-05, "epoch": 3.2983318439082514, "percentage": 32.98, "elapsed_time": "1:31:41", "remaining_time": "3:06:18", "throughput": 2321.15, "total_tokens": 12769744} {"current_steps": 22150, "total_steps": 67140, "loss": 0.6791, "lr": 4.2373189866536815e-05, "epoch": 3.2990765564492106, "percentage": 32.99, "elapsed_time": "1:31:42", "remaining_time": "3:06:16", "throughput": 2321.2, "total_tokens": 12772656} {"current_steps": 22155, "total_steps": 67140, "loss": 0.6777, "lr": 4.236851609346943e-05, "epoch": 3.29982126899017, "percentage": 33.0, "elapsed_time": "1:31:43", "remaining_time": "3:06:15", "throughput": 2321.23, "total_tokens": 12775472} {"current_steps": 22160, "total_steps": 67140, "loss": 0.6009, "lr": 4.236384114670834e-05, "epoch": 3.300565981531129, "percentage": 33.01, "elapsed_time": "1:31:44", "remaining_time": "3:06:13", "throughput": 2321.28, "total_tokens": 12778352} {"current_steps": 22165, "total_steps": 67140, "loss": 0.6497, "lr": 4.2359165026569455e-05, "epoch": 3.301310694072088, "percentage": 33.01, "elapsed_time": "1:31:46", "remaining_time": "3:06:12", "throughput": 2321.32, "total_tokens": 12781200} {"current_steps": 22170, "total_steps": 67140, "loss": 0.6207, "lr": 4.235448773336878e-05, "epoch": 3.3020554066130474, "percentage": 33.02, "elapsed_time": "1:31:47", "remaining_time": "3:06:10", "throughput": 2321.34, "total_tokens": 12783888} {"current_steps": 22175, "total_steps": 67140, "loss": 0.7777, "lr": 4.234980926742239e-05, "epoch": 3.3028001191540066, "percentage": 33.03, "elapsed_time": "1:31:48", "remaining_time": "3:06:09", "throughput": 2321.37, "total_tokens": 12786672} {"current_steps": 22180, "total_steps": 67140, "loss": 0.5983, "lr": 4.2345129629046425e-05, "epoch": 3.303544831694966, "percentage": 33.04, "elapsed_time": "1:31:49", "remaining_time": "3:06:07", "throughput": 2321.41, "total_tokens": 12789488} {"current_steps": 22185, "total_steps": 67140, "loss": 0.6495, "lr": 4.234044881855711e-05, "epoch": 3.304289544235925, "percentage": 33.04, "elapsed_time": "1:31:50", "remaining_time": "3:06:06", "throughput": 2321.43, "total_tokens": 12792240} {"current_steps": 22190, "total_steps": 67140, "loss": 0.6539, "lr": 4.233576683627078e-05, "epoch": 3.3050342567768842, "percentage": 33.05, "elapsed_time": "1:31:51", "remaining_time": "3:06:04", "throughput": 2321.44, "total_tokens": 12794864} {"current_steps": 22195, "total_steps": 67140, "loss": 0.666, "lr": 4.23310836825038e-05, "epoch": 3.3057789693178434, "percentage": 33.06, "elapsed_time": "1:31:52", "remaining_time": "3:06:03", "throughput": 2321.49, "total_tokens": 12797712} {"current_steps": 22200, "total_steps": 67140, "loss": 0.7044, "lr": 4.2326399357572654e-05, "epoch": 3.3065236818588026, "percentage": 33.07, "elapsed_time": "1:31:53", "remaining_time": "3:06:01", "throughput": 2321.55, "total_tokens": 12800784} {"current_steps": 22205, "total_steps": 67140, "loss": 0.4743, "lr": 4.232171386179388e-05, "epoch": 3.307268394399762, "percentage": 33.07, "elapsed_time": "1:31:55", "remaining_time": "3:06:00", "throughput": 2321.6, "total_tokens": 12803664} {"current_steps": 22210, "total_steps": 67140, "loss": 0.81, "lr": 4.231702719548411e-05, "epoch": 3.308013106940721, "percentage": 33.08, "elapsed_time": "1:31:56", "remaining_time": "3:05:58", "throughput": 2321.6, "total_tokens": 12806192} {"current_steps": 22215, "total_steps": 67140, "loss": 0.5593, "lr": 4.231233935896004e-05, "epoch": 3.3087578194816802, "percentage": 33.09, "elapsed_time": "1:31:57", "remaining_time": "3:05:57", "throughput": 2321.69, "total_tokens": 12809488} {"current_steps": 22220, "total_steps": 67140, "loss": 0.5861, "lr": 4.2307650352538465e-05, "epoch": 3.3095025320226394, "percentage": 33.1, "elapsed_time": "1:31:58", "remaining_time": "3:05:56", "throughput": 2321.71, "total_tokens": 12812176} {"current_steps": 22225, "total_steps": 67140, "loss": 0.6427, "lr": 4.230296017653625e-05, "epoch": 3.310247244563598, "percentage": 33.1, "elapsed_time": "1:31:59", "remaining_time": "3:05:54", "throughput": 2321.75, "total_tokens": 12815024} {"current_steps": 22230, "total_steps": 67140, "loss": 0.6526, "lr": 4.2298268831270335e-05, "epoch": 3.310991957104558, "percentage": 33.11, "elapsed_time": "1:32:00", "remaining_time": "3:05:53", "throughput": 2321.79, "total_tokens": 12817776} {"current_steps": 22235, "total_steps": 67140, "loss": 0.6368, "lr": 4.229357631705774e-05, "epoch": 3.3117366696455166, "percentage": 33.12, "elapsed_time": "1:32:01", "remaining_time": "3:05:51", "throughput": 2321.8, "total_tokens": 12820400} {"current_steps": 22240, "total_steps": 67140, "loss": 0.7007, "lr": 4.228888263421557e-05, "epoch": 3.3124813821864763, "percentage": 33.12, "elapsed_time": "1:32:02", "remaining_time": "3:05:50", "throughput": 2321.86, "total_tokens": 12823472} {"current_steps": 22245, "total_steps": 67140, "loss": 0.6123, "lr": 4.2284187783061e-05, "epoch": 3.313226094727435, "percentage": 33.13, "elapsed_time": "1:32:04", "remaining_time": "3:05:48", "throughput": 2321.87, "total_tokens": 12826032} {"current_steps": 22250, "total_steps": 67140, "loss": 0.6842, "lr": 4.22794917639113e-05, "epoch": 3.313970807268394, "percentage": 33.14, "elapsed_time": "1:32:05", "remaining_time": "3:05:47", "throughput": 2321.91, "total_tokens": 12828848} {"current_steps": 22255, "total_steps": 67140, "loss": 0.5993, "lr": 4.227479457708379e-05, "epoch": 3.3147155198093534, "percentage": 33.15, "elapsed_time": "1:32:06", "remaining_time": "3:05:45", "throughput": 2321.95, "total_tokens": 12831728} {"current_steps": 22260, "total_steps": 67140, "loss": 0.7398, "lr": 4.22700962228959e-05, "epoch": 3.3154602323503126, "percentage": 33.15, "elapsed_time": "1:32:07", "remaining_time": "3:05:44", "throughput": 2322.0, "total_tokens": 12834576} {"current_steps": 22265, "total_steps": 67140, "loss": 0.7411, "lr": 4.2265396701665125e-05, "epoch": 3.316204944891272, "percentage": 33.16, "elapsed_time": "1:32:08", "remaining_time": "3:05:42", "throughput": 2322.01, "total_tokens": 12837232} {"current_steps": 22270, "total_steps": 67140, "loss": 0.7225, "lr": 4.226069601370904e-05, "epoch": 3.316949657432231, "percentage": 33.17, "elapsed_time": "1:32:09", "remaining_time": "3:05:41", "throughput": 2322.05, "total_tokens": 12840016} {"current_steps": 22275, "total_steps": 67140, "loss": 0.7367, "lr": 4.225599415934529e-05, "epoch": 3.3176943699731902, "percentage": 33.18, "elapsed_time": "1:32:10", "remaining_time": "3:05:39", "throughput": 2322.11, "total_tokens": 12843024} {"current_steps": 22280, "total_steps": 67140, "loss": 0.5611, "lr": 4.225129113889161e-05, "epoch": 3.3184390825141494, "percentage": 33.18, "elapsed_time": "1:32:11", "remaining_time": "3:05:38", "throughput": 2322.14, "total_tokens": 12845872} {"current_steps": 22285, "total_steps": 67140, "loss": 0.4406, "lr": 4.224658695266582e-05, "epoch": 3.3191837950551086, "percentage": 33.19, "elapsed_time": "1:32:13", "remaining_time": "3:05:36", "throughput": 2322.19, "total_tokens": 12848720} {"current_steps": 22290, "total_steps": 67140, "loss": 0.5375, "lr": 4.22418816009858e-05, "epoch": 3.319928507596068, "percentage": 33.2, "elapsed_time": "1:32:14", "remaining_time": "3:05:35", "throughput": 2322.23, "total_tokens": 12851600} {"current_steps": 22295, "total_steps": 67140, "loss": 0.5227, "lr": 4.223717508416952e-05, "epoch": 3.320673220137027, "percentage": 33.21, "elapsed_time": "1:32:15", "remaining_time": "3:05:33", "throughput": 2322.24, "total_tokens": 12854224} {"current_steps": 22300, "total_steps": 67140, "loss": 0.639, "lr": 4.2232467402535036e-05, "epoch": 3.3214179326779862, "percentage": 33.21, "elapsed_time": "1:32:16", "remaining_time": "3:05:32", "throughput": 2322.3, "total_tokens": 12857232} {"current_steps": 22305, "total_steps": 67140, "loss": 0.7363, "lr": 4.222775855640047e-05, "epoch": 3.3221626452189454, "percentage": 33.22, "elapsed_time": "1:32:17", "remaining_time": "3:05:30", "throughput": 2322.33, "total_tokens": 12860016} {"current_steps": 22310, "total_steps": 67140, "loss": 0.746, "lr": 4.222304854608401e-05, "epoch": 3.3229073577599046, "percentage": 33.23, "elapsed_time": "1:32:18", "remaining_time": "3:05:29", "throughput": 2322.4, "total_tokens": 12863120} {"current_steps": 22315, "total_steps": 67140, "loss": 0.6181, "lr": 4.221833737190396e-05, "epoch": 3.323652070300864, "percentage": 33.24, "elapsed_time": "1:32:19", "remaining_time": "3:05:28", "throughput": 2322.42, "total_tokens": 12865808} {"current_steps": 22320, "total_steps": 67140, "loss": 0.5263, "lr": 4.2213625034178674e-05, "epoch": 3.324396782841823, "percentage": 33.24, "elapsed_time": "1:32:20", "remaining_time": "3:05:26", "throughput": 2322.49, "total_tokens": 12868848} {"current_steps": 22325, "total_steps": 67140, "loss": 0.6764, "lr": 4.220891153322659e-05, "epoch": 3.3251414953827823, "percentage": 33.25, "elapsed_time": "1:32:22", "remaining_time": "3:05:25", "throughput": 2322.49, "total_tokens": 12871312} {"current_steps": 22330, "total_steps": 67140, "loss": 0.7982, "lr": 4.220419686936623e-05, "epoch": 3.3258862079237415, "percentage": 33.26, "elapsed_time": "1:32:23", "remaining_time": "3:05:23", "throughput": 2322.56, "total_tokens": 12874384} {"current_steps": 22335, "total_steps": 67140, "loss": 0.7454, "lr": 4.21994810429162e-05, "epoch": 3.3266309204647007, "percentage": 33.27, "elapsed_time": "1:32:24", "remaining_time": "3:05:22", "throughput": 2322.57, "total_tokens": 12876976} {"current_steps": 22340, "total_steps": 67140, "loss": 0.6179, "lr": 4.2194764054195166e-05, "epoch": 3.32737563300566, "percentage": 33.27, "elapsed_time": "1:32:25", "remaining_time": "3:05:20", "throughput": 2322.59, "total_tokens": 12879600} {"current_steps": 22345, "total_steps": 67140, "loss": 0.7527, "lr": 4.219004590352189e-05, "epoch": 3.328120345546619, "percentage": 33.28, "elapsed_time": "1:32:26", "remaining_time": "3:05:19", "throughput": 2322.65, "total_tokens": 12882672} {"current_steps": 22350, "total_steps": 67140, "loss": 0.5696, "lr": 4.2185326591215196e-05, "epoch": 3.3288650580875783, "percentage": 33.29, "elapsed_time": "1:32:27", "remaining_time": "3:05:17", "throughput": 2322.67, "total_tokens": 12885392} {"current_steps": 22355, "total_steps": 67140, "loss": 0.6491, "lr": 4.2180606117594e-05, "epoch": 3.3296097706285375, "percentage": 33.3, "elapsed_time": "1:32:28", "remaining_time": "3:05:16", "throughput": 2322.71, "total_tokens": 12888240} {"current_steps": 22360, "total_steps": 67140, "loss": 0.6986, "lr": 4.21758844829773e-05, "epoch": 3.3303544831694967, "percentage": 33.3, "elapsed_time": "1:32:29", "remaining_time": "3:05:14", "throughput": 2322.73, "total_tokens": 12890896} {"current_steps": 22365, "total_steps": 67140, "loss": 0.5726, "lr": 4.2171161687684156e-05, "epoch": 3.331099195710456, "percentage": 33.31, "elapsed_time": "1:32:31", "remaining_time": "3:05:13", "throughput": 2322.78, "total_tokens": 12893840} {"current_steps": 22370, "total_steps": 67140, "loss": 0.6002, "lr": 4.216643773203372e-05, "epoch": 3.331843908251415, "percentage": 33.32, "elapsed_time": "1:32:32", "remaining_time": "3:05:11", "throughput": 2322.82, "total_tokens": 12896688} {"current_steps": 22375, "total_steps": 67140, "loss": 0.8097, "lr": 4.216171261634521e-05, "epoch": 3.3325886207923743, "percentage": 33.33, "elapsed_time": "1:32:33", "remaining_time": "3:05:10", "throughput": 2322.9, "total_tokens": 12899824} {"current_steps": 22380, "total_steps": 67140, "loss": 0.7782, "lr": 4.215698634093794e-05, "epoch": 3.3333333333333335, "percentage": 33.33, "elapsed_time": "1:32:34", "remaining_time": "3:05:08", "throughput": 2322.96, "total_tokens": 12902864} {"current_steps": 22385, "total_steps": 67140, "loss": 0.5549, "lr": 4.2152258906131295e-05, "epoch": 3.3340780458742927, "percentage": 33.34, "elapsed_time": "1:32:35", "remaining_time": "3:05:07", "throughput": 2322.99, "total_tokens": 12905616} {"current_steps": 22390, "total_steps": 67140, "loss": 0.6217, "lr": 4.214753031224472e-05, "epoch": 3.334822758415252, "percentage": 33.35, "elapsed_time": "1:32:36", "remaining_time": "3:05:06", "throughput": 2323.07, "total_tokens": 12908816} {"current_steps": 22395, "total_steps": 67140, "loss": 0.6124, "lr": 4.2142800559597764e-05, "epoch": 3.335567470956211, "percentage": 33.36, "elapsed_time": "1:32:37", "remaining_time": "3:05:04", "throughput": 2323.1, "total_tokens": 12911536} {"current_steps": 22400, "total_steps": 67140, "loss": 0.8452, "lr": 4.2138069648510045e-05, "epoch": 3.33631218349717, "percentage": 33.36, "elapsed_time": "1:32:39", "remaining_time": "3:05:03", "throughput": 2323.14, "total_tokens": 12914384} {"current_steps": 22405, "total_steps": 67140, "loss": 0.6655, "lr": 4.2133337579301255e-05, "epoch": 3.3370568960381295, "percentage": 33.37, "elapsed_time": "1:32:40", "remaining_time": "3:05:01", "throughput": 2323.17, "total_tokens": 12917136} {"current_steps": 22410, "total_steps": 67140, "loss": 0.7251, "lr": 4.212860435229117e-05, "epoch": 3.3378016085790883, "percentage": 33.38, "elapsed_time": "1:32:41", "remaining_time": "3:05:00", "throughput": 2323.2, "total_tokens": 12919824} {"current_steps": 22415, "total_steps": 67140, "loss": 0.7456, "lr": 4.212386996779965e-05, "epoch": 3.338546321120048, "percentage": 33.39, "elapsed_time": "1:32:42", "remaining_time": "3:04:58", "throughput": 2323.22, "total_tokens": 12922576} {"current_steps": 22420, "total_steps": 67140, "loss": 0.4686, "lr": 4.2119134426146614e-05, "epoch": 3.3392910336610067, "percentage": 33.39, "elapsed_time": "1:32:43", "remaining_time": "3:04:57", "throughput": 2323.29, "total_tokens": 12925648} {"current_steps": 22425, "total_steps": 67140, "loss": 0.8079, "lr": 4.211439772765208e-05, "epoch": 3.340035746201966, "percentage": 33.4, "elapsed_time": "1:32:44", "remaining_time": "3:04:55", "throughput": 2323.3, "total_tokens": 12928272} {"current_steps": 22430, "total_steps": 67140, "loss": 0.5926, "lr": 4.210965987263612e-05, "epoch": 3.340780458742925, "percentage": 33.41, "elapsed_time": "1:32:45", "remaining_time": "3:04:54", "throughput": 2323.32, "total_tokens": 12930960} {"current_steps": 22435, "total_steps": 67140, "loss": 0.695, "lr": 4.2104920861418906e-05, "epoch": 3.3415251712838843, "percentage": 33.42, "elapsed_time": "1:32:46", "remaining_time": "3:04:52", "throughput": 2323.36, "total_tokens": 12933808} {"current_steps": 22440, "total_steps": 67140, "loss": 0.7016, "lr": 4.21001806943207e-05, "epoch": 3.3422698838248435, "percentage": 33.42, "elapsed_time": "1:32:48", "remaining_time": "3:04:51", "throughput": 2323.41, "total_tokens": 12936816} {"current_steps": 22445, "total_steps": 67140, "loss": 0.5603, "lr": 4.209543937166179e-05, "epoch": 3.3430145963658027, "percentage": 33.43, "elapsed_time": "1:32:49", "remaining_time": "3:04:49", "throughput": 2323.46, "total_tokens": 12939728} {"current_steps": 22450, "total_steps": 67140, "loss": 0.5831, "lr": 4.2090696893762605e-05, "epoch": 3.343759308906762, "percentage": 33.44, "elapsed_time": "1:32:50", "remaining_time": "3:04:48", "throughput": 2323.5, "total_tokens": 12942544} {"current_steps": 22455, "total_steps": 67140, "loss": 0.5953, "lr": 4.20859532609436e-05, "epoch": 3.344504021447721, "percentage": 33.45, "elapsed_time": "1:32:51", "remaining_time": "3:04:46", "throughput": 2323.53, "total_tokens": 12945328} {"current_steps": 22460, "total_steps": 67140, "loss": 0.5826, "lr": 4.208120847352535e-05, "epoch": 3.3452487339886803, "percentage": 33.45, "elapsed_time": "1:32:52", "remaining_time": "3:04:45", "throughput": 2323.53, "total_tokens": 12947824} {"current_steps": 22465, "total_steps": 67140, "loss": 0.6923, "lr": 4.207646253182847e-05, "epoch": 3.3459934465296395, "percentage": 33.46, "elapsed_time": "1:32:53", "remaining_time": "3:04:44", "throughput": 2323.62, "total_tokens": 12951120} {"current_steps": 22470, "total_steps": 67140, "loss": 0.7501, "lr": 4.207171543617369e-05, "epoch": 3.3467381590705987, "percentage": 33.47, "elapsed_time": "1:32:54", "remaining_time": "3:04:42", "throughput": 2323.65, "total_tokens": 12953904} {"current_steps": 22475, "total_steps": 67140, "loss": 0.6259, "lr": 4.206696718688178e-05, "epoch": 3.347482871611558, "percentage": 33.47, "elapsed_time": "1:32:55", "remaining_time": "3:04:41", "throughput": 2323.7, "total_tokens": 12956752} {"current_steps": 22480, "total_steps": 67140, "loss": 0.5878, "lr": 4.206221778427362e-05, "epoch": 3.348227584152517, "percentage": 33.48, "elapsed_time": "1:32:57", "remaining_time": "3:04:39", "throughput": 2323.77, "total_tokens": 12959920} {"current_steps": 22485, "total_steps": 67140, "loss": 0.588, "lr": 4.205746722867014e-05, "epoch": 3.3489722966934763, "percentage": 33.49, "elapsed_time": "1:32:58", "remaining_time": "3:04:38", "throughput": 2323.81, "total_tokens": 12962704} {"current_steps": 22490, "total_steps": 67140, "loss": 0.7254, "lr": 4.2052715520392397e-05, "epoch": 3.3497170092344355, "percentage": 33.5, "elapsed_time": "1:32:59", "remaining_time": "3:04:36", "throughput": 2323.86, "total_tokens": 12965712} {"current_steps": 22495, "total_steps": 67140, "loss": 0.5348, "lr": 4.2047962659761454e-05, "epoch": 3.3504617217753947, "percentage": 33.5, "elapsed_time": "1:33:00", "remaining_time": "3:04:35", "throughput": 2323.91, "total_tokens": 12968592} {"current_steps": 22500, "total_steps": 67140, "loss": 0.4877, "lr": 4.204320864709852e-05, "epoch": 3.351206434316354, "percentage": 33.51, "elapsed_time": "1:33:01", "remaining_time": "3:04:34", "throughput": 2323.97, "total_tokens": 12971664} {"current_steps": 22505, "total_steps": 67140, "loss": 0.6584, "lr": 4.203845348272483e-05, "epoch": 3.351951146857313, "percentage": 33.52, "elapsed_time": "1:33:02", "remaining_time": "3:04:32", "throughput": 2324.0, "total_tokens": 12974448} {"current_steps": 22510, "total_steps": 67140, "loss": 0.7273, "lr": 4.2033697166961716e-05, "epoch": 3.3526958593982723, "percentage": 33.53, "elapsed_time": "1:33:03", "remaining_time": "3:04:31", "throughput": 2324.05, "total_tokens": 12977424} {"current_steps": 22515, "total_steps": 67140, "loss": 0.7408, "lr": 4.202893970013062e-05, "epoch": 3.3534405719392315, "percentage": 33.53, "elapsed_time": "1:33:05", "remaining_time": "3:04:29", "throughput": 2324.09, "total_tokens": 12980272} {"current_steps": 22520, "total_steps": 67140, "loss": 0.6392, "lr": 4.202418108255301e-05, "epoch": 3.3541852844801907, "percentage": 33.54, "elapsed_time": "1:33:06", "remaining_time": "3:04:28", "throughput": 2324.14, "total_tokens": 12983184} {"current_steps": 22525, "total_steps": 67140, "loss": 0.5959, "lr": 4.201942131455045e-05, "epoch": 3.35492999702115, "percentage": 33.55, "elapsed_time": "1:33:07", "remaining_time": "3:04:26", "throughput": 2324.19, "total_tokens": 12986096} {"current_steps": 22530, "total_steps": 67140, "loss": 0.6437, "lr": 4.2014660396444596e-05, "epoch": 3.355674709562109, "percentage": 33.56, "elapsed_time": "1:33:08", "remaining_time": "3:04:25", "throughput": 2324.24, "total_tokens": 12989072} {"current_steps": 22535, "total_steps": 67140, "loss": 0.758, "lr": 4.200989832855717e-05, "epoch": 3.3564194221030683, "percentage": 33.56, "elapsed_time": "1:33:09", "remaining_time": "3:04:23", "throughput": 2324.29, "total_tokens": 12991984} {"current_steps": 22540, "total_steps": 67140, "loss": 0.5508, "lr": 4.2005135111209976e-05, "epoch": 3.3571641346440275, "percentage": 33.57, "elapsed_time": "1:33:10", "remaining_time": "3:04:22", "throughput": 2324.32, "total_tokens": 12994704} {"current_steps": 22545, "total_steps": 67140, "loss": 0.5946, "lr": 4.200037074472488e-05, "epoch": 3.3579088471849867, "percentage": 33.58, "elapsed_time": "1:33:11", "remaining_time": "3:04:20", "throughput": 2324.37, "total_tokens": 12997616} {"current_steps": 22550, "total_steps": 67140, "loss": 0.7242, "lr": 4.1995605229423856e-05, "epoch": 3.358653559725946, "percentage": 33.59, "elapsed_time": "1:33:13", "remaining_time": "3:04:19", "throughput": 2324.39, "total_tokens": 13000336} {"current_steps": 22555, "total_steps": 67140, "loss": 0.8466, "lr": 4.199083856562893e-05, "epoch": 3.359398272266905, "percentage": 33.59, "elapsed_time": "1:33:14", "remaining_time": "3:04:17", "throughput": 2324.42, "total_tokens": 13003024} {"current_steps": 22560, "total_steps": 67140, "loss": 0.5911, "lr": 4.198607075366221e-05, "epoch": 3.3601429848078643, "percentage": 33.6, "elapsed_time": "1:33:15", "remaining_time": "3:04:16", "throughput": 2324.46, "total_tokens": 13005968} {"current_steps": 22565, "total_steps": 67140, "loss": 0.5896, "lr": 4.198130179384589e-05, "epoch": 3.3608876973488235, "percentage": 33.61, "elapsed_time": "1:33:16", "remaining_time": "3:04:15", "throughput": 2324.48, "total_tokens": 13008656} {"current_steps": 22570, "total_steps": 67140, "loss": 0.5126, "lr": 4.197653168650223e-05, "epoch": 3.3616324098897827, "percentage": 33.62, "elapsed_time": "1:33:17", "remaining_time": "3:04:13", "throughput": 2324.54, "total_tokens": 13011696} {"current_steps": 22575, "total_steps": 67140, "loss": 0.6833, "lr": 4.197176043195359e-05, "epoch": 3.3623771224307415, "percentage": 33.62, "elapsed_time": "1:33:18", "remaining_time": "3:04:12", "throughput": 2324.57, "total_tokens": 13014448} {"current_steps": 22580, "total_steps": 67140, "loss": 0.6151, "lr": 4.196698803052237e-05, "epoch": 3.363121834971701, "percentage": 33.63, "elapsed_time": "1:33:19", "remaining_time": "3:04:10", "throughput": 2324.64, "total_tokens": 13017552} {"current_steps": 22585, "total_steps": 67140, "loss": 0.7761, "lr": 4.196221448253109e-05, "epoch": 3.36386654751266, "percentage": 33.64, "elapsed_time": "1:33:20", "remaining_time": "3:04:09", "throughput": 2324.72, "total_tokens": 13020720} {"current_steps": 22590, "total_steps": 67140, "loss": 0.6243, "lr": 4.1957439788302325e-05, "epoch": 3.3646112600536195, "percentage": 33.65, "elapsed_time": "1:33:22", "remaining_time": "3:04:07", "throughput": 2324.73, "total_tokens": 13023344} {"current_steps": 22595, "total_steps": 67140, "loss": 0.5113, "lr": 4.195266394815871e-05, "epoch": 3.3653559725945783, "percentage": 33.65, "elapsed_time": "1:33:23", "remaining_time": "3:04:06", "throughput": 2324.81, "total_tokens": 13026672} {"current_steps": 22600, "total_steps": 67140, "loss": 0.6205, "lr": 4.1947886962423e-05, "epoch": 3.3661006851355375, "percentage": 33.66, "elapsed_time": "1:33:24", "remaining_time": "3:04:05", "throughput": 2324.87, "total_tokens": 13029744} {"current_steps": 22605, "total_steps": 67140, "loss": 0.7441, "lr": 4.1943108831417987e-05, "epoch": 3.3668453976764967, "percentage": 33.67, "elapsed_time": "1:33:25", "remaining_time": "3:04:03", "throughput": 2324.92, "total_tokens": 13032720} {"current_steps": 22610, "total_steps": 67140, "loss": 0.7565, "lr": 4.193832955546657e-05, "epoch": 3.367590110217456, "percentage": 33.68, "elapsed_time": "1:33:26", "remaining_time": "3:04:02", "throughput": 2325.02, "total_tokens": 13036080} {"current_steps": 22615, "total_steps": 67140, "loss": 0.7449, "lr": 4.1933549134891706e-05, "epoch": 3.368334822758415, "percentage": 33.68, "elapsed_time": "1:33:27", "remaining_time": "3:04:01", "throughput": 2325.05, "total_tokens": 13038832} {"current_steps": 22620, "total_steps": 67140, "loss": 0.7092, "lr": 4.192876757001643e-05, "epoch": 3.3690795352993743, "percentage": 33.69, "elapsed_time": "1:33:29", "remaining_time": "3:03:59", "throughput": 2325.08, "total_tokens": 13041616} {"current_steps": 22625, "total_steps": 67140, "loss": 0.6917, "lr": 4.1923984861163886e-05, "epoch": 3.3698242478403335, "percentage": 33.7, "elapsed_time": "1:33:30", "remaining_time": "3:03:58", "throughput": 2325.13, "total_tokens": 13044592} {"current_steps": 22630, "total_steps": 67140, "loss": 0.666, "lr": 4.191920100865724e-05, "epoch": 3.3705689603812927, "percentage": 33.71, "elapsed_time": "1:33:31", "remaining_time": "3:03:56", "throughput": 2325.15, "total_tokens": 13047248} {"current_steps": 22635, "total_steps": 67140, "loss": 0.6605, "lr": 4.191441601281978e-05, "epoch": 3.371313672922252, "percentage": 33.71, "elapsed_time": "1:33:32", "remaining_time": "3:03:55", "throughput": 2325.18, "total_tokens": 13050096} {"current_steps": 22640, "total_steps": 67140, "loss": 0.5666, "lr": 4.1909629873974865e-05, "epoch": 3.372058385463211, "percentage": 33.72, "elapsed_time": "1:33:33", "remaining_time": "3:03:53", "throughput": 2325.23, "total_tokens": 13053040} {"current_steps": 22645, "total_steps": 67140, "loss": 0.5649, "lr": 4.1904842592445906e-05, "epoch": 3.3728030980041703, "percentage": 33.73, "elapsed_time": "1:33:34", "remaining_time": "3:03:52", "throughput": 2325.28, "total_tokens": 13055920} {"current_steps": 22650, "total_steps": 67140, "loss": 0.6113, "lr": 4.190005416855641e-05, "epoch": 3.3735478105451295, "percentage": 33.74, "elapsed_time": "1:33:35", "remaining_time": "3:03:50", "throughput": 2325.31, "total_tokens": 13058672} {"current_steps": 22655, "total_steps": 67140, "loss": 0.6249, "lr": 4.1895264602629966e-05, "epoch": 3.3742925230860887, "percentage": 33.74, "elapsed_time": "1:33:37", "remaining_time": "3:03:49", "throughput": 2325.37, "total_tokens": 13061776} {"current_steps": 22660, "total_steps": 67140, "loss": 0.6699, "lr": 4.189047389499023e-05, "epoch": 3.375037235627048, "percentage": 33.75, "elapsed_time": "1:33:38", "remaining_time": "3:03:48", "throughput": 2325.46, "total_tokens": 13065040} {"current_steps": 22665, "total_steps": 67140, "loss": 0.6497, "lr": 4.1885682045960945e-05, "epoch": 3.375781948168007, "percentage": 33.76, "elapsed_time": "1:33:39", "remaining_time": "3:03:46", "throughput": 2325.51, "total_tokens": 13067984} {"current_steps": 22670, "total_steps": 67140, "loss": 0.8425, "lr": 4.188088905586591e-05, "epoch": 3.3765266607089663, "percentage": 33.77, "elapsed_time": "1:33:40", "remaining_time": "3:03:45", "throughput": 2325.55, "total_tokens": 13070800} {"current_steps": 22675, "total_steps": 67140, "loss": 0.6988, "lr": 4.1876094925029036e-05, "epoch": 3.3772713732499255, "percentage": 33.77, "elapsed_time": "1:33:41", "remaining_time": "3:03:43", "throughput": 2325.59, "total_tokens": 13073712} {"current_steps": 22680, "total_steps": 67140, "loss": 0.7065, "lr": 4.187129965377427e-05, "epoch": 3.3780160857908847, "percentage": 33.78, "elapsed_time": "1:33:42", "remaining_time": "3:03:42", "throughput": 2325.61, "total_tokens": 13076400} {"current_steps": 22685, "total_steps": 67140, "loss": 0.671, "lr": 4.186650324242568e-05, "epoch": 3.378760798331844, "percentage": 33.79, "elapsed_time": "1:33:43", "remaining_time": "3:03:41", "throughput": 2325.69, "total_tokens": 13079536} {"current_steps": 22690, "total_steps": 67140, "loss": 0.6252, "lr": 4.186170569130737e-05, "epoch": 3.379505510872803, "percentage": 33.8, "elapsed_time": "1:33:45", "remaining_time": "3:03:39", "throughput": 2325.74, "total_tokens": 13082416} {"current_steps": 22695, "total_steps": 67140, "loss": 0.7014, "lr": 4.185690700074354e-05, "epoch": 3.3802502234137624, "percentage": 33.8, "elapsed_time": "1:33:46", "remaining_time": "3:03:38", "throughput": 2325.74, "total_tokens": 13085008} {"current_steps": 22700, "total_steps": 67140, "loss": 0.6796, "lr": 4.185210717105848e-05, "epoch": 3.3809949359547216, "percentage": 33.81, "elapsed_time": "1:33:47", "remaining_time": "3:03:36", "throughput": 2325.78, "total_tokens": 13087824} {"current_steps": 22705, "total_steps": 67140, "loss": 0.8224, "lr": 4.184730620257652e-05, "epoch": 3.3817396484956808, "percentage": 33.82, "elapsed_time": "1:33:48", "remaining_time": "3:03:35", "throughput": 2325.79, "total_tokens": 13090416} {"current_steps": 22710, "total_steps": 67140, "loss": 0.6051, "lr": 4.18425040956221e-05, "epoch": 3.38248436103664, "percentage": 33.82, "elapsed_time": "1:33:49", "remaining_time": "3:03:33", "throughput": 2325.9, "total_tokens": 13093968} {"current_steps": 22715, "total_steps": 67140, "loss": 0.7402, "lr": 4.183770085051974e-05, "epoch": 3.383229073577599, "percentage": 33.83, "elapsed_time": "1:33:50", "remaining_time": "3:03:32", "throughput": 2325.93, "total_tokens": 13096752} {"current_steps": 22720, "total_steps": 67140, "loss": 0.908, "lr": 4.183289646759402e-05, "epoch": 3.3839737861185584, "percentage": 33.84, "elapsed_time": "1:33:51", "remaining_time": "3:03:30", "throughput": 2325.96, "total_tokens": 13099536} {"current_steps": 22725, "total_steps": 67140, "loss": 0.6313, "lr": 4.182809094716958e-05, "epoch": 3.3847184986595176, "percentage": 33.85, "elapsed_time": "1:33:52", "remaining_time": "3:03:29", "throughput": 2325.98, "total_tokens": 13102128} {"current_steps": 22730, "total_steps": 67140, "loss": 0.7439, "lr": 4.182328428957118e-05, "epoch": 3.3854632112004768, "percentage": 33.85, "elapsed_time": "1:33:54", "remaining_time": "3:03:27", "throughput": 2326.03, "total_tokens": 13105168} {"current_steps": 22735, "total_steps": 67140, "loss": 0.6428, "lr": 4.181847649512362e-05, "epoch": 3.386207923741436, "percentage": 33.86, "elapsed_time": "1:33:55", "remaining_time": "3:03:26", "throughput": 2326.1, "total_tokens": 13108272} {"current_steps": 22740, "total_steps": 67140, "loss": 0.6803, "lr": 4.181366756415181e-05, "epoch": 3.386952636282395, "percentage": 33.87, "elapsed_time": "1:33:56", "remaining_time": "3:03:25", "throughput": 2326.15, "total_tokens": 13111184} {"current_steps": 22745, "total_steps": 67140, "loss": 0.6126, "lr": 4.18088574969807e-05, "epoch": 3.3876973488233544, "percentage": 33.88, "elapsed_time": "1:33:57", "remaining_time": "3:03:23", "throughput": 2326.19, "total_tokens": 13114000} {"current_steps": 22750, "total_steps": 67140, "loss": 0.73, "lr": 4.1804046293935334e-05, "epoch": 3.388442061364313, "percentage": 33.88, "elapsed_time": "1:33:58", "remaining_time": "3:03:22", "throughput": 2326.24, "total_tokens": 13116944} {"current_steps": 22755, "total_steps": 67140, "loss": 0.7854, "lr": 4.179923395534084e-05, "epoch": 3.389186773905273, "percentage": 33.89, "elapsed_time": "1:33:59", "remaining_time": "3:03:20", "throughput": 2326.29, "total_tokens": 13119856} {"current_steps": 22760, "total_steps": 67140, "loss": 0.6932, "lr": 4.1794420481522424e-05, "epoch": 3.3899314864462315, "percentage": 33.9, "elapsed_time": "1:34:01", "remaining_time": "3:03:19", "throughput": 2326.36, "total_tokens": 13123056} {"current_steps": 22765, "total_steps": 67140, "loss": 0.742, "lr": 4.178960587280535e-05, "epoch": 3.390676198987191, "percentage": 33.91, "elapsed_time": "1:34:02", "remaining_time": "3:03:18", "throughput": 2326.42, "total_tokens": 13126032} {"current_steps": 22770, "total_steps": 67140, "loss": 0.6575, "lr": 4.178479012951497e-05, "epoch": 3.39142091152815, "percentage": 33.91, "elapsed_time": "1:34:03", "remaining_time": "3:03:16", "throughput": 2326.49, "total_tokens": 13129200} {"current_steps": 22775, "total_steps": 67140, "loss": 0.535, "lr": 4.177997325197671e-05, "epoch": 3.392165624069109, "percentage": 33.92, "elapsed_time": "1:34:04", "remaining_time": "3:03:15", "throughput": 2326.51, "total_tokens": 13131920} {"current_steps": 22780, "total_steps": 67140, "loss": 0.6147, "lr": 4.177515524051609e-05, "epoch": 3.3929103366100684, "percentage": 33.93, "elapsed_time": "1:34:05", "remaining_time": "3:03:13", "throughput": 2326.54, "total_tokens": 13134704} {"current_steps": 22785, "total_steps": 67140, "loss": 0.6416, "lr": 4.1770336095458676e-05, "epoch": 3.3936550491510276, "percentage": 33.94, "elapsed_time": "1:34:06", "remaining_time": "3:03:12", "throughput": 2326.56, "total_tokens": 13137424} {"current_steps": 22790, "total_steps": 67140, "loss": 0.5585, "lr": 4.176551581713013e-05, "epoch": 3.3943997616919868, "percentage": 33.94, "elapsed_time": "1:34:07", "remaining_time": "3:03:10", "throughput": 2326.61, "total_tokens": 13140336} {"current_steps": 22795, "total_steps": 67140, "loss": 0.5779, "lr": 4.1760694405856194e-05, "epoch": 3.395144474232946, "percentage": 33.95, "elapsed_time": "1:34:08", "remaining_time": "3:03:09", "throughput": 2326.62, "total_tokens": 13142960} {"current_steps": 22800, "total_steps": 67140, "loss": 0.5537, "lr": 4.1755871861962674e-05, "epoch": 3.395889186773905, "percentage": 33.96, "elapsed_time": "1:34:10", "remaining_time": "3:03:07", "throughput": 2326.67, "total_tokens": 13145872} {"current_steps": 22805, "total_steps": 67140, "loss": 0.6526, "lr": 4.175104818577545e-05, "epoch": 3.3966338993148644, "percentage": 33.97, "elapsed_time": "1:34:11", "remaining_time": "3:03:06", "throughput": 2326.72, "total_tokens": 13148880} {"current_steps": 22810, "total_steps": 67140, "loss": 0.6498, "lr": 4.174622337762051e-05, "epoch": 3.3973786118558236, "percentage": 33.97, "elapsed_time": "1:34:12", "remaining_time": "3:03:05", "throughput": 2326.78, "total_tokens": 13151856} {"current_steps": 22815, "total_steps": 67140, "loss": 0.5825, "lr": 4.174139743782387e-05, "epoch": 3.3981233243967828, "percentage": 33.98, "elapsed_time": "1:34:13", "remaining_time": "3:03:03", "throughput": 2326.87, "total_tokens": 13155088} {"current_steps": 22820, "total_steps": 67140, "loss": 0.5939, "lr": 4.173657036671166e-05, "epoch": 3.398868036937742, "percentage": 33.99, "elapsed_time": "1:34:14", "remaining_time": "3:03:02", "throughput": 2326.9, "total_tokens": 13157872} {"current_steps": 22825, "total_steps": 67140, "loss": 0.7326, "lr": 4.173174216461006e-05, "epoch": 3.399612749478701, "percentage": 34.0, "elapsed_time": "1:34:15", "remaining_time": "3:03:00", "throughput": 2326.97, "total_tokens": 13160912} {"current_steps": 22830, "total_steps": 67140, "loss": 0.5762, "lr": 4.172691283184536e-05, "epoch": 3.4003574620196604, "percentage": 34.0, "elapsed_time": "1:34:16", "remaining_time": "3:02:59", "throughput": 2327.02, "total_tokens": 13163888} {"current_steps": 22835, "total_steps": 67140, "loss": 0.5764, "lr": 4.172208236874389e-05, "epoch": 3.4011021745606196, "percentage": 34.01, "elapsed_time": "1:34:18", "remaining_time": "3:02:57", "throughput": 2327.05, "total_tokens": 13166608} {"current_steps": 22840, "total_steps": 67140, "loss": 0.7129, "lr": 4.1717250775632086e-05, "epoch": 3.401846887101579, "percentage": 34.02, "elapsed_time": "1:34:19", "remaining_time": "3:02:56", "throughput": 2327.08, "total_tokens": 13169424} {"current_steps": 22845, "total_steps": 67140, "loss": 0.6363, "lr": 4.1712418052836445e-05, "epoch": 3.402591599642538, "percentage": 34.03, "elapsed_time": "1:34:20", "remaining_time": "3:02:55", "throughput": 2327.13, "total_tokens": 13172336} {"current_steps": 22850, "total_steps": 67140, "loss": 0.5999, "lr": 4.1707584200683535e-05, "epoch": 3.403336312183497, "percentage": 34.03, "elapsed_time": "1:34:21", "remaining_time": "3:02:53", "throughput": 2327.2, "total_tokens": 13175440} {"current_steps": 22855, "total_steps": 67140, "loss": 0.6758, "lr": 4.170274921950001e-05, "epoch": 3.4040810247244564, "percentage": 34.04, "elapsed_time": "1:34:22", "remaining_time": "3:02:52", "throughput": 2327.24, "total_tokens": 13178352} {"current_steps": 22860, "total_steps": 67140, "loss": 0.6155, "lr": 4.169791310961261e-05, "epoch": 3.4048257372654156, "percentage": 34.05, "elapsed_time": "1:34:23", "remaining_time": "3:02:50", "throughput": 2327.3, "total_tokens": 13181456} {"current_steps": 22865, "total_steps": 67140, "loss": 0.6471, "lr": 4.169307587134813e-05, "epoch": 3.405570449806375, "percentage": 34.06, "elapsed_time": "1:34:24", "remaining_time": "3:02:49", "throughput": 2327.32, "total_tokens": 13184080} {"current_steps": 22870, "total_steps": 67140, "loss": 0.6122, "lr": 4.1688237505033454e-05, "epoch": 3.406315162347334, "percentage": 34.06, "elapsed_time": "1:34:26", "remaining_time": "3:02:47", "throughput": 2327.33, "total_tokens": 13186736} {"current_steps": 22875, "total_steps": 67140, "loss": 0.5917, "lr": 4.168339801099552e-05, "epoch": 3.407059874888293, "percentage": 34.07, "elapsed_time": "1:34:27", "remaining_time": "3:02:46", "throughput": 2327.41, "total_tokens": 13189872} {"current_steps": 22880, "total_steps": 67140, "loss": 0.5374, "lr": 4.167855738956139e-05, "epoch": 3.4078045874292524, "percentage": 34.08, "elapsed_time": "1:34:28", "remaining_time": "3:02:45", "throughput": 2327.45, "total_tokens": 13192720} {"current_steps": 22885, "total_steps": 67140, "loss": 0.6855, "lr": 4.1673715641058165e-05, "epoch": 3.4085492999702116, "percentage": 34.09, "elapsed_time": "1:34:29", "remaining_time": "3:02:43", "throughput": 2327.54, "total_tokens": 13196048} {"current_steps": 22890, "total_steps": 67140, "loss": 0.6609, "lr": 4.1668872765813025e-05, "epoch": 3.409294012511171, "percentage": 34.09, "elapsed_time": "1:34:30", "remaining_time": "3:02:42", "throughput": 2327.56, "total_tokens": 13198736} {"current_steps": 22895, "total_steps": 67140, "loss": 0.7209, "lr": 4.166402876415323e-05, "epoch": 3.41003872505213, "percentage": 34.1, "elapsed_time": "1:34:31", "remaining_time": "3:02:40", "throughput": 2327.62, "total_tokens": 13201776} {"current_steps": 22900, "total_steps": 67140, "loss": 0.7132, "lr": 4.1659183636406126e-05, "epoch": 3.410783437593089, "percentage": 34.11, "elapsed_time": "1:34:32", "remaining_time": "3:02:39", "throughput": 2327.66, "total_tokens": 13204624} {"current_steps": 22905, "total_steps": 67140, "loss": 0.506, "lr": 4.165433738289912e-05, "epoch": 3.4115281501340484, "percentage": 34.12, "elapsed_time": "1:34:34", "remaining_time": "3:02:37", "throughput": 2327.73, "total_tokens": 13207696} {"current_steps": 22910, "total_steps": 67140, "loss": 0.5187, "lr": 4.164949000395971e-05, "epoch": 3.4122728626750076, "percentage": 34.12, "elapsed_time": "1:34:35", "remaining_time": "3:02:36", "throughput": 2327.76, "total_tokens": 13210448} {"current_steps": 22915, "total_steps": 67140, "loss": 0.6074, "lr": 4.1644641499915454e-05, "epoch": 3.413017575215967, "percentage": 34.13, "elapsed_time": "1:34:36", "remaining_time": "3:02:35", "throughput": 2327.8, "total_tokens": 13213264} {"current_steps": 22920, "total_steps": 67140, "loss": 0.7483, "lr": 4.1639791871094e-05, "epoch": 3.413762287756926, "percentage": 34.14, "elapsed_time": "1:34:37", "remaining_time": "3:02:33", "throughput": 2327.82, "total_tokens": 13215952} {"current_steps": 22925, "total_steps": 67140, "loss": 0.7122, "lr": 4.1634941117823065e-05, "epoch": 3.414507000297885, "percentage": 34.15, "elapsed_time": "1:34:38", "remaining_time": "3:02:31", "throughput": 2327.82, "total_tokens": 13218512} {"current_steps": 22930, "total_steps": 67140, "loss": 0.6425, "lr": 4.1630089240430434e-05, "epoch": 3.4152517128388444, "percentage": 34.15, "elapsed_time": "1:34:39", "remaining_time": "3:02:30", "throughput": 2327.89, "total_tokens": 13221584} {"current_steps": 22935, "total_steps": 67140, "loss": 0.5415, "lr": 4.162523623924399e-05, "epoch": 3.415996425379803, "percentage": 34.16, "elapsed_time": "1:34:40", "remaining_time": "3:02:29", "throughput": 2327.92, "total_tokens": 13224368} {"current_steps": 22940, "total_steps": 67140, "loss": 0.7202, "lr": 4.162038211459167e-05, "epoch": 3.4167411379207624, "percentage": 34.17, "elapsed_time": "1:34:41", "remaining_time": "3:02:27", "throughput": 2327.92, "total_tokens": 13226928} {"current_steps": 22945, "total_steps": 67140, "loss": 0.6385, "lr": 4.161552686680151e-05, "epoch": 3.4174858504617216, "percentage": 34.17, "elapsed_time": "1:34:42", "remaining_time": "3:02:26", "throughput": 2327.97, "total_tokens": 13229776} {"current_steps": 22950, "total_steps": 67140, "loss": 0.5723, "lr": 4.161067049620159e-05, "epoch": 3.418230563002681, "percentage": 34.18, "elapsed_time": "1:34:44", "remaining_time": "3:02:24", "throughput": 2328.01, "total_tokens": 13232624} {"current_steps": 22955, "total_steps": 67140, "loss": 0.6149, "lr": 4.16058130031201e-05, "epoch": 3.41897527554364, "percentage": 34.19, "elapsed_time": "1:34:45", "remaining_time": "3:02:23", "throughput": 2328.03, "total_tokens": 13235312} {"current_steps": 22960, "total_steps": 67140, "loss": 0.7431, "lr": 4.160095438788527e-05, "epoch": 3.419719988084599, "percentage": 34.2, "elapsed_time": "1:34:46", "remaining_time": "3:02:21", "throughput": 2328.04, "total_tokens": 13238000} {"current_steps": 22965, "total_steps": 67140, "loss": 0.7064, "lr": 4.1596094650825446e-05, "epoch": 3.4204647006255584, "percentage": 34.2, "elapsed_time": "1:34:47", "remaining_time": "3:02:20", "throughput": 2328.09, "total_tokens": 13240912} {"current_steps": 22970, "total_steps": 67140, "loss": 0.5968, "lr": 4.159123379226902e-05, "epoch": 3.4212094131665176, "percentage": 34.21, "elapsed_time": "1:34:48", "remaining_time": "3:02:18", "throughput": 2328.12, "total_tokens": 13243696} {"current_steps": 22975, "total_steps": 67140, "loss": 0.6334, "lr": 4.158637181254447e-05, "epoch": 3.421954125707477, "percentage": 34.22, "elapsed_time": "1:34:49", "remaining_time": "3:02:17", "throughput": 2328.2, "total_tokens": 13246992} {"current_steps": 22980, "total_steps": 67140, "loss": 0.5047, "lr": 4.158150871198034e-05, "epoch": 3.422698838248436, "percentage": 34.23, "elapsed_time": "1:34:50", "remaining_time": "3:02:16", "throughput": 2328.24, "total_tokens": 13249808} {"current_steps": 22985, "total_steps": 67140, "loss": 0.8387, "lr": 4.157664449090527e-05, "epoch": 3.423443550789395, "percentage": 34.23, "elapsed_time": "1:34:52", "remaining_time": "3:02:14", "throughput": 2328.32, "total_tokens": 13253040} {"current_steps": 22990, "total_steps": 67140, "loss": 0.7859, "lr": 4.1571779149647964e-05, "epoch": 3.4241882633303544, "percentage": 34.24, "elapsed_time": "1:34:53", "remaining_time": "3:02:13", "throughput": 2328.39, "total_tokens": 13256240} {"current_steps": 22995, "total_steps": 67140, "loss": 0.6444, "lr": 4.1566912688537195e-05, "epoch": 3.4249329758713136, "percentage": 34.25, "elapsed_time": "1:34:54", "remaining_time": "3:02:11", "throughput": 2328.41, "total_tokens": 13258928} {"current_steps": 23000, "total_steps": 67140, "loss": 0.6664, "lr": 4.156204510790183e-05, "epoch": 3.425677688412273, "percentage": 34.26, "elapsed_time": "1:34:55", "remaining_time": "3:02:10", "throughput": 2328.44, "total_tokens": 13261712} {"current_steps": 23005, "total_steps": 67140, "loss": 0.5807, "lr": 4.1557176408070784e-05, "epoch": 3.426422400953232, "percentage": 34.26, "elapsed_time": "1:34:56", "remaining_time": "3:02:08", "throughput": 2328.46, "total_tokens": 13264400} {"current_steps": 23010, "total_steps": 67140, "loss": 0.7171, "lr": 4.155230658937308e-05, "epoch": 3.4271671134941912, "percentage": 34.27, "elapsed_time": "1:34:57", "remaining_time": "3:02:07", "throughput": 2328.52, "total_tokens": 13267440} {"current_steps": 23015, "total_steps": 67140, "loss": 0.6556, "lr": 4.154743565213779e-05, "epoch": 3.4279118260351504, "percentage": 34.28, "elapsed_time": "1:34:58", "remaining_time": "3:02:06", "throughput": 2328.58, "total_tokens": 13270544} {"current_steps": 23020, "total_steps": 67140, "loss": 0.7347, "lr": 4.154256359669408e-05, "epoch": 3.4286565385761096, "percentage": 34.29, "elapsed_time": "1:35:00", "remaining_time": "3:02:04", "throughput": 2328.63, "total_tokens": 13273456} {"current_steps": 23025, "total_steps": 67140, "loss": 0.6247, "lr": 4.153769042337118e-05, "epoch": 3.429401251117069, "percentage": 34.29, "elapsed_time": "1:35:01", "remaining_time": "3:02:03", "throughput": 2328.69, "total_tokens": 13276496} {"current_steps": 23030, "total_steps": 67140, "loss": 0.6701, "lr": 4.153281613249839e-05, "epoch": 3.430145963658028, "percentage": 34.3, "elapsed_time": "1:35:02", "remaining_time": "3:02:01", "throughput": 2328.71, "total_tokens": 13279152} {"current_steps": 23035, "total_steps": 67140, "loss": 0.5451, "lr": 4.152794072440511e-05, "epoch": 3.4308906761989872, "percentage": 34.31, "elapsed_time": "1:35:03", "remaining_time": "3:02:00", "throughput": 2328.77, "total_tokens": 13282192} {"current_steps": 23040, "total_steps": 67140, "loss": 0.7461, "lr": 4.1523064199420786e-05, "epoch": 3.4316353887399464, "percentage": 34.32, "elapsed_time": "1:35:04", "remaining_time": "3:01:59", "throughput": 2328.82, "total_tokens": 13285136} {"current_steps": 23045, "total_steps": 67140, "loss": 0.6499, "lr": 4.1518186557874974e-05, "epoch": 3.4323801012809056, "percentage": 34.32, "elapsed_time": "1:35:05", "remaining_time": "3:01:57", "throughput": 2328.88, "total_tokens": 13288176} {"current_steps": 23050, "total_steps": 67140, "loss": 0.6688, "lr": 4.151330780009726e-05, "epoch": 3.433124813821865, "percentage": 34.33, "elapsed_time": "1:35:06", "remaining_time": "3:01:56", "throughput": 2328.9, "total_tokens": 13290864} {"current_steps": 23055, "total_steps": 67140, "loss": 0.6294, "lr": 4.150842792641735e-05, "epoch": 3.433869526362824, "percentage": 34.34, "elapsed_time": "1:35:08", "remaining_time": "3:01:54", "throughput": 2328.97, "total_tokens": 13293968} {"current_steps": 23060, "total_steps": 67140, "loss": 0.8054, "lr": 4.1503546937165e-05, "epoch": 3.4346142389037833, "percentage": 34.35, "elapsed_time": "1:35:09", "remaining_time": "3:01:53", "throughput": 2328.98, "total_tokens": 13296592} {"current_steps": 23065, "total_steps": 67140, "loss": 0.5678, "lr": 4.1498664832670045e-05, "epoch": 3.4353589514447425, "percentage": 34.35, "elapsed_time": "1:35:10", "remaining_time": "3:01:51", "throughput": 2329.0, "total_tokens": 13299216} {"current_steps": 23070, "total_steps": 67140, "loss": 0.6508, "lr": 4.149378161326239e-05, "epoch": 3.4361036639857017, "percentage": 34.36, "elapsed_time": "1:35:11", "remaining_time": "3:01:50", "throughput": 2329.03, "total_tokens": 13302096} {"current_steps": 23075, "total_steps": 67140, "loss": 0.7005, "lr": 4.148889727927204e-05, "epoch": 3.436848376526661, "percentage": 34.37, "elapsed_time": "1:35:12", "remaining_time": "3:01:48", "throughput": 2329.06, "total_tokens": 13304880} {"current_steps": 23080, "total_steps": 67140, "loss": 0.7141, "lr": 4.1484011831029054e-05, "epoch": 3.43759308906762, "percentage": 34.38, "elapsed_time": "1:35:13", "remaining_time": "3:01:47", "throughput": 2329.09, "total_tokens": 13307696} {"current_steps": 23085, "total_steps": 67140, "loss": 0.6769, "lr": 4.147912526886356e-05, "epoch": 3.4383378016085793, "percentage": 34.38, "elapsed_time": "1:35:14", "remaining_time": "3:01:46", "throughput": 2329.15, "total_tokens": 13310704} {"current_steps": 23090, "total_steps": 67140, "loss": 0.6731, "lr": 4.147423759310579e-05, "epoch": 3.4390825141495385, "percentage": 34.39, "elapsed_time": "1:35:16", "remaining_time": "3:01:44", "throughput": 2329.22, "total_tokens": 13313808} {"current_steps": 23095, "total_steps": 67140, "loss": 0.6221, "lr": 4.1469348804086016e-05, "epoch": 3.4398272266904977, "percentage": 34.4, "elapsed_time": "1:35:17", "remaining_time": "3:01:43", "throughput": 2329.24, "total_tokens": 13316592} {"current_steps": 23100, "total_steps": 67140, "loss": 0.6822, "lr": 4.14644589021346e-05, "epoch": 3.4405719392314564, "percentage": 34.41, "elapsed_time": "1:35:18", "remaining_time": "3:01:41", "throughput": 2329.31, "total_tokens": 13319600} {"current_steps": 23105, "total_steps": 67140, "loss": 0.7264, "lr": 4.1459567887582015e-05, "epoch": 3.441316651772416, "percentage": 34.41, "elapsed_time": "1:35:19", "remaining_time": "3:01:40", "throughput": 2329.38, "total_tokens": 13322768} {"current_steps": 23110, "total_steps": 67140, "loss": 0.6822, "lr": 4.145467576075874e-05, "epoch": 3.442061364313375, "percentage": 34.42, "elapsed_time": "1:35:20", "remaining_time": "3:01:39", "throughput": 2329.44, "total_tokens": 13325872} {"current_steps": 23115, "total_steps": 67140, "loss": 0.5463, "lr": 4.144978252199537e-05, "epoch": 3.442806076854334, "percentage": 34.43, "elapsed_time": "1:35:21", "remaining_time": "3:01:37", "throughput": 2329.5, "total_tokens": 13328976} {"current_steps": 23120, "total_steps": 67140, "loss": 0.6886, "lr": 4.1444888171622584e-05, "epoch": 3.4435507893952932, "percentage": 34.44, "elapsed_time": "1:35:22", "remaining_time": "3:01:36", "throughput": 2329.51, "total_tokens": 13331568} {"current_steps": 23125, "total_steps": 67140, "loss": 0.6075, "lr": 4.143999270997111e-05, "epoch": 3.4442955019362524, "percentage": 34.44, "elapsed_time": "1:35:24", "remaining_time": "3:01:34", "throughput": 2329.54, "total_tokens": 13334288} {"current_steps": 23130, "total_steps": 67140, "loss": 0.4876, "lr": 4.143509613737178e-05, "epoch": 3.4450402144772116, "percentage": 34.45, "elapsed_time": "1:35:25", "remaining_time": "3:01:33", "throughput": 2329.54, "total_tokens": 13336816} {"current_steps": 23135, "total_steps": 67140, "loss": 0.6254, "lr": 4.143019845415546e-05, "epoch": 3.445784927018171, "percentage": 34.46, "elapsed_time": "1:35:26", "remaining_time": "3:01:31", "throughput": 2329.59, "total_tokens": 13339760} {"current_steps": 23140, "total_steps": 67140, "loss": 0.7086, "lr": 4.142529966065314e-05, "epoch": 3.44652963955913, "percentage": 34.47, "elapsed_time": "1:35:27", "remaining_time": "3:01:30", "throughput": 2329.64, "total_tokens": 13342736} {"current_steps": 23145, "total_steps": 67140, "loss": 0.6475, "lr": 4.1420399757195845e-05, "epoch": 3.4472743521000893, "percentage": 34.47, "elapsed_time": "1:35:28", "remaining_time": "3:01:29", "throughput": 2329.7, "total_tokens": 13345776} {"current_steps": 23150, "total_steps": 67140, "loss": 0.5579, "lr": 4.141549874411469e-05, "epoch": 3.4480190646410485, "percentage": 34.48, "elapsed_time": "1:35:29", "remaining_time": "3:01:27", "throughput": 2329.73, "total_tokens": 13348592} {"current_steps": 23155, "total_steps": 67140, "loss": 0.5913, "lr": 4.1410596621740874e-05, "epoch": 3.4487637771820077, "percentage": 34.49, "elapsed_time": "1:35:30", "remaining_time": "3:01:26", "throughput": 2329.78, "total_tokens": 13351504} {"current_steps": 23160, "total_steps": 67140, "loss": 0.8171, "lr": 4.140569339040566e-05, "epoch": 3.449508489722967, "percentage": 34.5, "elapsed_time": "1:35:31", "remaining_time": "3:01:24", "throughput": 2329.81, "total_tokens": 13354256} {"current_steps": 23165, "total_steps": 67140, "loss": 0.6925, "lr": 4.140078905044039e-05, "epoch": 3.450253202263926, "percentage": 34.5, "elapsed_time": "1:35:33", "remaining_time": "3:01:23", "throughput": 2329.83, "total_tokens": 13357040} {"current_steps": 23170, "total_steps": 67140, "loss": 0.632, "lr": 4.1395883602176466e-05, "epoch": 3.4509979148048853, "percentage": 34.51, "elapsed_time": "1:35:34", "remaining_time": "3:01:21", "throughput": 2329.9, "total_tokens": 13360176} {"current_steps": 23175, "total_steps": 67140, "loss": 0.5614, "lr": 4.13909770459454e-05, "epoch": 3.4517426273458445, "percentage": 34.52, "elapsed_time": "1:35:35", "remaining_time": "3:01:20", "throughput": 2329.96, "total_tokens": 13363152} {"current_steps": 23180, "total_steps": 67140, "loss": 0.5894, "lr": 4.138606938207874e-05, "epoch": 3.4524873398868037, "percentage": 34.52, "elapsed_time": "1:35:36", "remaining_time": "3:01:19", "throughput": 2330.0, "total_tokens": 13366064} {"current_steps": 23185, "total_steps": 67140, "loss": 0.5405, "lr": 4.1381160610908134e-05, "epoch": 3.453232052427763, "percentage": 34.53, "elapsed_time": "1:35:37", "remaining_time": "3:01:17", "throughput": 2330.03, "total_tokens": 13368784} {"current_steps": 23190, "total_steps": 67140, "loss": 0.524, "lr": 4.13762507327653e-05, "epoch": 3.453976764968722, "percentage": 34.54, "elapsed_time": "1:35:38", "remaining_time": "3:01:16", "throughput": 2330.08, "total_tokens": 13371792} {"current_steps": 23195, "total_steps": 67140, "loss": 0.6079, "lr": 4.137133974798202e-05, "epoch": 3.4547214775096813, "percentage": 34.55, "elapsed_time": "1:35:39", "remaining_time": "3:01:14", "throughput": 2330.15, "total_tokens": 13374864} {"current_steps": 23200, "total_steps": 67140, "loss": 0.6904, "lr": 4.1366427656890156e-05, "epoch": 3.4554661900506405, "percentage": 34.55, "elapsed_time": "1:35:41", "remaining_time": "3:01:13", "throughput": 2330.15, "total_tokens": 13377424} {"current_steps": 23205, "total_steps": 67140, "loss": 0.523, "lr": 4.136151445982165e-05, "epoch": 3.4562109025915997, "percentage": 34.56, "elapsed_time": "1:35:42", "remaining_time": "3:01:11", "throughput": 2330.17, "total_tokens": 13380080} {"current_steps": 23210, "total_steps": 67140, "loss": 0.7694, "lr": 4.135660015710853e-05, "epoch": 3.456955615132559, "percentage": 34.57, "elapsed_time": "1:35:43", "remaining_time": "3:01:10", "throughput": 2330.2, "total_tokens": 13382928} {"current_steps": 23215, "total_steps": 67140, "loss": 0.6004, "lr": 4.1351684749082866e-05, "epoch": 3.457700327673518, "percentage": 34.58, "elapsed_time": "1:35:44", "remaining_time": "3:01:08", "throughput": 2330.25, "total_tokens": 13385872} {"current_steps": 23220, "total_steps": 67140, "loss": 0.6032, "lr": 4.1346768236076825e-05, "epoch": 3.4584450402144773, "percentage": 34.58, "elapsed_time": "1:35:45", "remaining_time": "3:01:07", "throughput": 2330.3, "total_tokens": 13388880} {"current_steps": 23225, "total_steps": 67140, "loss": 0.5816, "lr": 4.134185061842265e-05, "epoch": 3.4591897527554365, "percentage": 34.59, "elapsed_time": "1:35:46", "remaining_time": "3:01:06", "throughput": 2330.35, "total_tokens": 13391792} {"current_steps": 23230, "total_steps": 67140, "loss": 0.5339, "lr": 4.133693189645265e-05, "epoch": 3.4599344652963957, "percentage": 34.6, "elapsed_time": "1:35:47", "remaining_time": "3:01:04", "throughput": 2330.4, "total_tokens": 13394672} {"current_steps": 23235, "total_steps": 67140, "loss": 0.5803, "lr": 4.133201207049921e-05, "epoch": 3.460679177837355, "percentage": 34.61, "elapsed_time": "1:35:48", "remaining_time": "3:01:03", "throughput": 2330.44, "total_tokens": 13397584} {"current_steps": 23240, "total_steps": 67140, "loss": 0.634, "lr": 4.1327091140894805e-05, "epoch": 3.461423890378314, "percentage": 34.61, "elapsed_time": "1:35:50", "remaining_time": "3:01:01", "throughput": 2330.47, "total_tokens": 13400400} {"current_steps": 23245, "total_steps": 67140, "loss": 0.8313, "lr": 4.132216910797195e-05, "epoch": 3.4621686029192733, "percentage": 34.62, "elapsed_time": "1:35:51", "remaining_time": "3:01:00", "throughput": 2330.5, "total_tokens": 13403152} {"current_steps": 23250, "total_steps": 67140, "loss": 0.4589, "lr": 4.131724597206328e-05, "epoch": 3.4629133154602325, "percentage": 34.63, "elapsed_time": "1:35:52", "remaining_time": "3:00:58", "throughput": 2330.51, "total_tokens": 13405776} {"current_steps": 23255, "total_steps": 67140, "loss": 0.7219, "lr": 4.131232173350146e-05, "epoch": 3.4636580280011917, "percentage": 34.64, "elapsed_time": "1:35:53", "remaining_time": "3:00:57", "throughput": 2330.54, "total_tokens": 13408592} {"current_steps": 23260, "total_steps": 67140, "loss": 0.7952, "lr": 4.130739639261926e-05, "epoch": 3.464402740542151, "percentage": 34.64, "elapsed_time": "1:35:54", "remaining_time": "3:00:55", "throughput": 2330.57, "total_tokens": 13411376} {"current_steps": 23265, "total_steps": 67140, "loss": 0.5894, "lr": 4.130246994974952e-05, "epoch": 3.4651474530831097, "percentage": 34.65, "elapsed_time": "1:35:55", "remaining_time": "3:00:54", "throughput": 2330.6, "total_tokens": 13414160} {"current_steps": 23270, "total_steps": 67140, "loss": 0.589, "lr": 4.129754240522513e-05, "epoch": 3.4658921656240693, "percentage": 34.66, "elapsed_time": "1:35:56", "remaining_time": "3:00:53", "throughput": 2330.65, "total_tokens": 13417104} {"current_steps": 23275, "total_steps": 67140, "loss": 0.6076, "lr": 4.12926137593791e-05, "epoch": 3.466636878165028, "percentage": 34.67, "elapsed_time": "1:35:57", "remaining_time": "3:00:51", "throughput": 2330.71, "total_tokens": 13420144} {"current_steps": 23280, "total_steps": 67140, "loss": 0.6558, "lr": 4.128768401254446e-05, "epoch": 3.4673815907059877, "percentage": 34.67, "elapsed_time": "1:35:59", "remaining_time": "3:00:50", "throughput": 2330.77, "total_tokens": 13423216} {"current_steps": 23285, "total_steps": 67140, "loss": 0.6101, "lr": 4.128275316505435e-05, "epoch": 3.4681263032469465, "percentage": 34.68, "elapsed_time": "1:36:00", "remaining_time": "3:00:48", "throughput": 2330.79, "total_tokens": 13425904} {"current_steps": 23290, "total_steps": 67140, "loss": 0.7758, "lr": 4.1277821217242e-05, "epoch": 3.4688710157879057, "percentage": 34.69, "elapsed_time": "1:36:01", "remaining_time": "3:00:47", "throughput": 2330.84, "total_tokens": 13428912} {"current_steps": 23295, "total_steps": 67140, "loss": 0.6989, "lr": 4.127288816944066e-05, "epoch": 3.469615728328865, "percentage": 34.7, "elapsed_time": "1:36:02", "remaining_time": "3:00:46", "throughput": 2330.9, "total_tokens": 13431920} {"current_steps": 23300, "total_steps": 67140, "loss": 0.6099, "lr": 4.12679540219837e-05, "epoch": 3.470360440869824, "percentage": 34.7, "elapsed_time": "1:36:03", "remaining_time": "3:00:44", "throughput": 2330.9, "total_tokens": 13434384} {"current_steps": 23305, "total_steps": 67140, "loss": 0.5735, "lr": 4.126301877520456e-05, "epoch": 3.4711051534107833, "percentage": 34.71, "elapsed_time": "1:36:04", "remaining_time": "3:00:43", "throughput": 2330.93, "total_tokens": 13437168} {"current_steps": 23310, "total_steps": 67140, "loss": 0.5439, "lr": 4.125808242943672e-05, "epoch": 3.4718498659517425, "percentage": 34.72, "elapsed_time": "1:36:05", "remaining_time": "3:00:41", "throughput": 2330.96, "total_tokens": 13439952} {"current_steps": 23315, "total_steps": 67140, "loss": 0.7287, "lr": 4.125314498501377e-05, "epoch": 3.4725945784927017, "percentage": 34.73, "elapsed_time": "1:36:06", "remaining_time": "3:00:40", "throughput": 2330.96, "total_tokens": 13442544} {"current_steps": 23320, "total_steps": 67140, "loss": 0.801, "lr": 4.124820644226936e-05, "epoch": 3.473339291033661, "percentage": 34.73, "elapsed_time": "1:36:08", "remaining_time": "3:00:38", "throughput": 2330.99, "total_tokens": 13445296} {"current_steps": 23325, "total_steps": 67140, "loss": 0.6231, "lr": 4.124326680153723e-05, "epoch": 3.47408400357462, "percentage": 34.74, "elapsed_time": "1:36:09", "remaining_time": "3:00:37", "throughput": 2331.03, "total_tokens": 13448112} {"current_steps": 23330, "total_steps": 67140, "loss": 0.6661, "lr": 4.1238326063151164e-05, "epoch": 3.4748287161155793, "percentage": 34.75, "elapsed_time": "1:36:10", "remaining_time": "3:00:35", "throughput": 2331.06, "total_tokens": 13450896} {"current_steps": 23335, "total_steps": 67140, "loss": 0.5264, "lr": 4.1233384227445036e-05, "epoch": 3.4755734286565385, "percentage": 34.76, "elapsed_time": "1:36:11", "remaining_time": "3:00:34", "throughput": 2331.12, "total_tokens": 13453968} {"current_steps": 23340, "total_steps": 67140, "loss": 0.6773, "lr": 4.122844129475281e-05, "epoch": 3.4763181411974977, "percentage": 34.76, "elapsed_time": "1:36:12", "remaining_time": "3:00:32", "throughput": 2331.19, "total_tokens": 13457136} {"current_steps": 23345, "total_steps": 67140, "loss": 0.7095, "lr": 4.1223497265408505e-05, "epoch": 3.477062853738457, "percentage": 34.77, "elapsed_time": "1:36:13", "remaining_time": "3:00:31", "throughput": 2331.22, "total_tokens": 13459984} {"current_steps": 23350, "total_steps": 67140, "loss": 0.6193, "lr": 4.12185521397462e-05, "epoch": 3.477807566279416, "percentage": 34.78, "elapsed_time": "1:36:14", "remaining_time": "3:00:30", "throughput": 2331.27, "total_tokens": 13462960} {"current_steps": 23355, "total_steps": 67140, "loss": 0.6426, "lr": 4.12136059181001e-05, "epoch": 3.4785522788203753, "percentage": 34.79, "elapsed_time": "1:36:16", "remaining_time": "3:00:28", "throughput": 2331.29, "total_tokens": 13465584} {"current_steps": 23360, "total_steps": 67140, "loss": 0.5674, "lr": 4.1208658600804416e-05, "epoch": 3.4792969913613345, "percentage": 34.79, "elapsed_time": "1:36:17", "remaining_time": "3:00:27", "throughput": 2331.32, "total_tokens": 13468336} {"current_steps": 23365, "total_steps": 67140, "loss": 0.6288, "lr": 4.120371018819349e-05, "epoch": 3.4800417039022937, "percentage": 34.8, "elapsed_time": "1:36:18", "remaining_time": "3:00:25", "throughput": 2331.35, "total_tokens": 13471120} {"current_steps": 23370, "total_steps": 67140, "loss": 0.6457, "lr": 4.1198760680601713e-05, "epoch": 3.480786416443253, "percentage": 34.81, "elapsed_time": "1:36:19", "remaining_time": "3:00:24", "throughput": 2331.39, "total_tokens": 13474064} {"current_steps": 23375, "total_steps": 67140, "loss": 0.7742, "lr": 4.1193810078363544e-05, "epoch": 3.481531128984212, "percentage": 34.82, "elapsed_time": "1:36:20", "remaining_time": "3:00:23", "throughput": 2331.45, "total_tokens": 13477168} {"current_steps": 23380, "total_steps": 67140, "loss": 0.5293, "lr": 4.1188858381813524e-05, "epoch": 3.4822758415251713, "percentage": 34.82, "elapsed_time": "1:36:21", "remaining_time": "3:00:21", "throughput": 2331.49, "total_tokens": 13480080} {"current_steps": 23385, "total_steps": 67140, "loss": 0.7198, "lr": 4.118390559128629e-05, "epoch": 3.4830205540661305, "percentage": 34.83, "elapsed_time": "1:36:22", "remaining_time": "3:00:20", "throughput": 2331.55, "total_tokens": 13483120} {"current_steps": 23390, "total_steps": 67140, "loss": 0.4929, "lr": 4.11789517071165e-05, "epoch": 3.4837652666070897, "percentage": 34.84, "elapsed_time": "1:36:24", "remaining_time": "3:00:18", "throughput": 2331.6, "total_tokens": 13486064} {"current_steps": 23395, "total_steps": 67140, "loss": 0.9195, "lr": 4.117399672963893e-05, "epoch": 3.484509979148049, "percentage": 34.85, "elapsed_time": "1:36:25", "remaining_time": "3:00:17", "throughput": 2331.66, "total_tokens": 13489136} {"current_steps": 23400, "total_steps": 67140, "loss": 0.6108, "lr": 4.116904065918843e-05, "epoch": 3.485254691689008, "percentage": 34.85, "elapsed_time": "1:36:26", "remaining_time": "3:00:16", "throughput": 2331.71, "total_tokens": 13492144} {"current_steps": 23405, "total_steps": 67140, "loss": 0.6275, "lr": 4.11640834960999e-05, "epoch": 3.4859994042299673, "percentage": 34.86, "elapsed_time": "1:36:27", "remaining_time": "3:00:14", "throughput": 2331.77, "total_tokens": 13495120} {"current_steps": 23410, "total_steps": 67140, "loss": 0.5564, "lr": 4.115912524070832e-05, "epoch": 3.4867441167709265, "percentage": 34.87, "elapsed_time": "1:36:28", "remaining_time": "3:00:13", "throughput": 2331.83, "total_tokens": 13498192} {"current_steps": 23415, "total_steps": 67140, "loss": 0.7891, "lr": 4.1154165893348754e-05, "epoch": 3.4874888293118858, "percentage": 34.87, "elapsed_time": "1:36:29", "remaining_time": "3:00:11", "throughput": 2331.84, "total_tokens": 13500784} {"current_steps": 23420, "total_steps": 67140, "loss": 0.6063, "lr": 4.114920545435634e-05, "epoch": 3.488233541852845, "percentage": 34.88, "elapsed_time": "1:36:30", "remaining_time": "3:00:10", "throughput": 2331.87, "total_tokens": 13503536} {"current_steps": 23425, "total_steps": 67140, "loss": 0.6575, "lr": 4.114424392406628e-05, "epoch": 3.488978254393804, "percentage": 34.89, "elapsed_time": "1:36:31", "remaining_time": "3:00:08", "throughput": 2331.91, "total_tokens": 13506384} {"current_steps": 23430, "total_steps": 67140, "loss": 0.6627, "lr": 4.113928130281385e-05, "epoch": 3.4897229669347634, "percentage": 34.9, "elapsed_time": "1:36:33", "remaining_time": "3:00:07", "throughput": 2331.94, "total_tokens": 13509168} {"current_steps": 23435, "total_steps": 67140, "loss": 0.6514, "lr": 4.113431759093441e-05, "epoch": 3.4904676794757226, "percentage": 34.9, "elapsed_time": "1:36:34", "remaining_time": "3:00:05", "throughput": 2331.98, "total_tokens": 13512080} {"current_steps": 23440, "total_steps": 67140, "loss": 0.614, "lr": 4.112935278876338e-05, "epoch": 3.4912123920166813, "percentage": 34.91, "elapsed_time": "1:36:35", "remaining_time": "3:00:04", "throughput": 2332.04, "total_tokens": 13515152} {"current_steps": 23445, "total_steps": 67140, "loss": 0.8013, "lr": 4.112438689663627e-05, "epoch": 3.491957104557641, "percentage": 34.92, "elapsed_time": "1:36:36", "remaining_time": "3:00:03", "throughput": 2332.1, "total_tokens": 13518192} {"current_steps": 23450, "total_steps": 67140, "loss": 0.6227, "lr": 4.1119419914888645e-05, "epoch": 3.4927018170985997, "percentage": 34.93, "elapsed_time": "1:36:37", "remaining_time": "3:00:01", "throughput": 2332.12, "total_tokens": 13520880} {"current_steps": 23455, "total_steps": 67140, "loss": 0.6554, "lr": 4.111445184385616e-05, "epoch": 3.4934465296395594, "percentage": 34.93, "elapsed_time": "1:36:38", "remaining_time": "3:00:00", "throughput": 2332.16, "total_tokens": 13523728} {"current_steps": 23460, "total_steps": 67140, "loss": 0.6191, "lr": 4.110948268387455e-05, "epoch": 3.494191242180518, "percentage": 34.94, "elapsed_time": "1:36:39", "remaining_time": "2:59:58", "throughput": 2332.21, "total_tokens": 13526736} {"current_steps": 23465, "total_steps": 67140, "loss": 0.6585, "lr": 4.110451243527957e-05, "epoch": 3.4949359547214773, "percentage": 34.95, "elapsed_time": "1:36:41", "remaining_time": "2:59:57", "throughput": 2332.29, "total_tokens": 13529872} {"current_steps": 23470, "total_steps": 67140, "loss": 0.6533, "lr": 4.109954109840714e-05, "epoch": 3.4956806672624365, "percentage": 34.96, "elapsed_time": "1:36:42", "remaining_time": "2:59:56", "throughput": 2332.33, "total_tokens": 13532752} {"current_steps": 23475, "total_steps": 67140, "loss": 0.7109, "lr": 4.109456867359317e-05, "epoch": 3.4964253798033957, "percentage": 34.96, "elapsed_time": "1:36:43", "remaining_time": "2:59:54", "throughput": 2332.41, "total_tokens": 13536016} {"current_steps": 23480, "total_steps": 67140, "loss": 0.6907, "lr": 4.108959516117368e-05, "epoch": 3.497170092344355, "percentage": 34.97, "elapsed_time": "1:36:44", "remaining_time": "2:59:53", "throughput": 2332.45, "total_tokens": 13538896} {"current_steps": 23485, "total_steps": 67140, "loss": 0.6377, "lr": 4.108462056148477e-05, "epoch": 3.497914804885314, "percentage": 34.98, "elapsed_time": "1:36:45", "remaining_time": "2:59:51", "throughput": 2332.5, "total_tokens": 13541840} {"current_steps": 23490, "total_steps": 67140, "loss": 0.5569, "lr": 4.10796448748626e-05, "epoch": 3.4986595174262733, "percentage": 34.99, "elapsed_time": "1:36:46", "remaining_time": "2:59:50", "throughput": 2332.55, "total_tokens": 13544784} {"current_steps": 23495, "total_steps": 67140, "loss": 0.707, "lr": 4.10746681016434e-05, "epoch": 3.4994042299672325, "percentage": 34.99, "elapsed_time": "1:36:48", "remaining_time": "2:59:49", "throughput": 2332.59, "total_tokens": 13547760} {"current_steps": 23499, "total_steps": 67140, "eval_loss": 0.6524342894554138, "epoch": 3.5, "percentage": 35.0, "elapsed_time": "1:38:03", "remaining_time": "3:02:05", "throughput": 2303.18, "total_tokens": 13550032} {"current_steps": 23500, "total_steps": 67140, "loss": 0.6032, "lr": 4.1069690242163484e-05, "epoch": 3.5001489425081918, "percentage": 35.0, "elapsed_time": "1:38:05", "remaining_time": "3:02:08", "throughput": 2302.55, "total_tokens": 13550544} {"current_steps": 23505, "total_steps": 67140, "loss": 0.6502, "lr": 4.106471129675924e-05, "epoch": 3.500893655049151, "percentage": 35.01, "elapsed_time": "1:38:06", "remaining_time": "3:02:07", "throughput": 2302.58, "total_tokens": 13553264} {"current_steps": 23510, "total_steps": 67140, "loss": 0.584, "lr": 4.105973126576712e-05, "epoch": 3.50163836759011, "percentage": 35.02, "elapsed_time": "1:38:07", "remaining_time": "3:02:05", "throughput": 2302.61, "total_tokens": 13555984} {"current_steps": 23515, "total_steps": 67140, "loss": 0.8713, "lr": 4.105475014952365e-05, "epoch": 3.5023830801310694, "percentage": 35.02, "elapsed_time": "1:38:08", "remaining_time": "3:02:04", "throughput": 2302.67, "total_tokens": 13559024} {"current_steps": 23520, "total_steps": 67140, "loss": 0.6551, "lr": 4.104976794836545e-05, "epoch": 3.5031277926720286, "percentage": 35.03, "elapsed_time": "1:38:09", "remaining_time": "3:02:02", "throughput": 2302.72, "total_tokens": 13561968} {"current_steps": 23525, "total_steps": 67140, "loss": 0.794, "lr": 4.104478466262917e-05, "epoch": 3.5038725052129878, "percentage": 35.04, "elapsed_time": "1:38:10", "remaining_time": "3:02:01", "throughput": 2302.77, "total_tokens": 13564944} {"current_steps": 23530, "total_steps": 67140, "loss": 0.5519, "lr": 4.1039800292651584e-05, "epoch": 3.504617217753947, "percentage": 35.05, "elapsed_time": "1:38:11", "remaining_time": "3:01:59", "throughput": 2302.79, "total_tokens": 13567632} {"current_steps": 23535, "total_steps": 67140, "loss": 0.802, "lr": 4.103481483876951e-05, "epoch": 3.505361930294906, "percentage": 35.05, "elapsed_time": "1:38:13", "remaining_time": "3:01:58", "throughput": 2302.9, "total_tokens": 13571088} {"current_steps": 23540, "total_steps": 67140, "loss": 0.6131, "lr": 4.1029828301319836e-05, "epoch": 3.5061066428358654, "percentage": 35.06, "elapsed_time": "1:38:14", "remaining_time": "3:01:56", "throughput": 2302.93, "total_tokens": 13573840} {"current_steps": 23545, "total_steps": 67140, "loss": 0.6614, "lr": 4.102484068063954e-05, "epoch": 3.5068513553768246, "percentage": 35.07, "elapsed_time": "1:38:15", "remaining_time": "3:01:55", "throughput": 2302.97, "total_tokens": 13576624} {"current_steps": 23550, "total_steps": 67140, "loss": 0.4512, "lr": 4.1019851977065674e-05, "epoch": 3.5075960679177838, "percentage": 35.08, "elapsed_time": "1:38:16", "remaining_time": "3:01:53", "throughput": 2303.01, "total_tokens": 13579472} {"current_steps": 23555, "total_steps": 67140, "loss": 0.5374, "lr": 4.101486219093533e-05, "epoch": 3.508340780458743, "percentage": 35.08, "elapsed_time": "1:38:17", "remaining_time": "3:01:52", "throughput": 2303.05, "total_tokens": 13582288} {"current_steps": 23560, "total_steps": 67140, "loss": 0.5099, "lr": 4.100987132258571e-05, "epoch": 3.509085492999702, "percentage": 35.09, "elapsed_time": "1:38:18", "remaining_time": "3:01:51", "throughput": 2303.1, "total_tokens": 13585200} {"current_steps": 23565, "total_steps": 67140, "loss": 0.5596, "lr": 4.1004879372354085e-05, "epoch": 3.5098302055406614, "percentage": 35.1, "elapsed_time": "1:38:19", "remaining_time": "3:01:49", "throughput": 2303.13, "total_tokens": 13587984} {"current_steps": 23570, "total_steps": 67140, "loss": 0.5732, "lr": 4.099988634057778e-05, "epoch": 3.5105749180816206, "percentage": 35.11, "elapsed_time": "1:38:20", "remaining_time": "3:01:48", "throughput": 2303.19, "total_tokens": 13591024} {"current_steps": 23575, "total_steps": 67140, "loss": 0.7244, "lr": 4.09948922275942e-05, "epoch": 3.51131963062258, "percentage": 35.11, "elapsed_time": "1:38:22", "remaining_time": "3:01:46", "throughput": 2303.24, "total_tokens": 13593904} {"current_steps": 23580, "total_steps": 67140, "loss": 0.6478, "lr": 4.098989703374084e-05, "epoch": 3.512064343163539, "percentage": 35.12, "elapsed_time": "1:38:23", "remaining_time": "3:01:45", "throughput": 2303.31, "total_tokens": 13597072} {"current_steps": 23585, "total_steps": 67140, "loss": 0.7017, "lr": 4.0984900759355254e-05, "epoch": 3.512809055704498, "percentage": 35.13, "elapsed_time": "1:38:24", "remaining_time": "3:01:43", "throughput": 2303.39, "total_tokens": 13600176} {"current_steps": 23590, "total_steps": 67140, "loss": 0.7001, "lr": 4.097990340477507e-05, "epoch": 3.5135537682454574, "percentage": 35.14, "elapsed_time": "1:38:25", "remaining_time": "3:01:42", "throughput": 2303.44, "total_tokens": 13603088} {"current_steps": 23595, "total_steps": 67140, "loss": 0.5307, "lr": 4.097490497033797e-05, "epoch": 3.5142984807864166, "percentage": 35.14, "elapsed_time": "1:38:26", "remaining_time": "3:01:40", "throughput": 2303.48, "total_tokens": 13605968} {"current_steps": 23600, "total_steps": 67140, "loss": 0.709, "lr": 4.096990545638174e-05, "epoch": 3.515043193327376, "percentage": 35.15, "elapsed_time": "1:38:27", "remaining_time": "3:01:39", "throughput": 2303.53, "total_tokens": 13608816} {"current_steps": 23605, "total_steps": 67140, "loss": 0.6647, "lr": 4.096490486324424e-05, "epoch": 3.5157879058683346, "percentage": 35.16, "elapsed_time": "1:38:28", "remaining_time": "3:01:37", "throughput": 2303.59, "total_tokens": 13611856} {"current_steps": 23610, "total_steps": 67140, "loss": 0.648, "lr": 4.095990319126337e-05, "epoch": 3.516532618409294, "percentage": 35.17, "elapsed_time": "1:38:30", "remaining_time": "3:01:36", "throughput": 2303.64, "total_tokens": 13614832} {"current_steps": 23615, "total_steps": 67140, "loss": 0.5258, "lr": 4.0954900440777125e-05, "epoch": 3.517277330950253, "percentage": 35.17, "elapsed_time": "1:38:31", "remaining_time": "3:01:35", "throughput": 2303.67, "total_tokens": 13617584} {"current_steps": 23620, "total_steps": 67140, "loss": 0.8297, "lr": 4.094989661212359e-05, "epoch": 3.5180220434912126, "percentage": 35.18, "elapsed_time": "1:38:32", "remaining_time": "3:01:33", "throughput": 2303.73, "total_tokens": 13620560} {"current_steps": 23625, "total_steps": 67140, "loss": 0.4968, "lr": 4.094489170564088e-05, "epoch": 3.5187667560321714, "percentage": 35.19, "elapsed_time": "1:38:33", "remaining_time": "3:01:32", "throughput": 2303.76, "total_tokens": 13623248} {"current_steps": 23630, "total_steps": 67140, "loss": 0.5606, "lr": 4.0939885721667216e-05, "epoch": 3.519511468573131, "percentage": 35.2, "elapsed_time": "1:38:34", "remaining_time": "3:01:30", "throughput": 2303.82, "total_tokens": 13626320} {"current_steps": 23635, "total_steps": 67140, "loss": 0.4394, "lr": 4.093487866054088e-05, "epoch": 3.5202561811140898, "percentage": 35.2, "elapsed_time": "1:38:35", "remaining_time": "3:01:29", "throughput": 2303.87, "total_tokens": 13629296} {"current_steps": 23640, "total_steps": 67140, "loss": 0.9005, "lr": 4.0929870522600233e-05, "epoch": 3.5210008936550494, "percentage": 35.21, "elapsed_time": "1:38:36", "remaining_time": "3:01:27", "throughput": 2303.9, "total_tokens": 13632112} {"current_steps": 23645, "total_steps": 67140, "loss": 0.7468, "lr": 4.092486130818371e-05, "epoch": 3.521745606196008, "percentage": 35.22, "elapsed_time": "1:38:38", "remaining_time": "3:01:26", "throughput": 2303.97, "total_tokens": 13635184} {"current_steps": 23650, "total_steps": 67140, "loss": 0.5825, "lr": 4.09198510176298e-05, "epoch": 3.5224903187369674, "percentage": 35.22, "elapsed_time": "1:38:39", "remaining_time": "3:01:24", "throughput": 2304.04, "total_tokens": 13638256} {"current_steps": 23655, "total_steps": 67140, "loss": 0.5839, "lr": 4.091483965127708e-05, "epoch": 3.5232350312779266, "percentage": 35.23, "elapsed_time": "1:38:40", "remaining_time": "3:01:23", "throughput": 2304.07, "total_tokens": 13641040} {"current_steps": 23660, "total_steps": 67140, "loss": 0.6428, "lr": 4.09098272094642e-05, "epoch": 3.523979743818886, "percentage": 35.24, "elapsed_time": "1:38:41", "remaining_time": "3:01:21", "throughput": 2304.09, "total_tokens": 13643664} {"current_steps": 23665, "total_steps": 67140, "loss": 0.697, "lr": 4.0904813692529886e-05, "epoch": 3.524724456359845, "percentage": 35.25, "elapsed_time": "1:38:42", "remaining_time": "3:01:20", "throughput": 2304.13, "total_tokens": 13646544} {"current_steps": 23670, "total_steps": 67140, "loss": 0.6837, "lr": 4.089979910081293e-05, "epoch": 3.525469168900804, "percentage": 35.25, "elapsed_time": "1:38:43", "remaining_time": "3:01:19", "throughput": 2304.2, "total_tokens": 13649616} {"current_steps": 23675, "total_steps": 67140, "loss": 0.6741, "lr": 4.089478343465219e-05, "epoch": 3.5262138814417634, "percentage": 35.26, "elapsed_time": "1:38:44", "remaining_time": "3:01:17", "throughput": 2304.24, "total_tokens": 13652432} {"current_steps": 23680, "total_steps": 67140, "loss": 0.6505, "lr": 4.088976669438661e-05, "epoch": 3.5269585939827226, "percentage": 35.27, "elapsed_time": "1:38:46", "remaining_time": "3:01:16", "throughput": 2304.23, "total_tokens": 13654928} {"current_steps": 23685, "total_steps": 67140, "loss": 0.6057, "lr": 4.088474888035519e-05, "epoch": 3.527703306523682, "percentage": 35.28, "elapsed_time": "1:38:47", "remaining_time": "3:01:14", "throughput": 2304.31, "total_tokens": 13658096} {"current_steps": 23690, "total_steps": 67140, "loss": 0.6164, "lr": 4.087972999289704e-05, "epoch": 3.528448019064641, "percentage": 35.28, "elapsed_time": "1:38:48", "remaining_time": "3:01:13", "throughput": 2304.36, "total_tokens": 13661008} {"current_steps": 23695, "total_steps": 67140, "loss": 0.7062, "lr": 4.0874710032351296e-05, "epoch": 3.5291927316056, "percentage": 35.29, "elapsed_time": "1:38:49", "remaining_time": "3:01:11", "throughput": 2304.39, "total_tokens": 13663792} {"current_steps": 23700, "total_steps": 67140, "loss": 0.5458, "lr": 4.086968899905719e-05, "epoch": 3.5299374441465594, "percentage": 35.3, "elapsed_time": "1:38:50", "remaining_time": "3:01:10", "throughput": 2304.43, "total_tokens": 13666576} {"current_steps": 23705, "total_steps": 67140, "loss": 0.7283, "lr": 4.086466689335402e-05, "epoch": 3.5306821566875186, "percentage": 35.31, "elapsed_time": "1:38:51", "remaining_time": "3:01:08", "throughput": 2304.46, "total_tokens": 13669360} {"current_steps": 23710, "total_steps": 67140, "loss": 0.5943, "lr": 4.085964371558116e-05, "epoch": 3.531426869228478, "percentage": 35.31, "elapsed_time": "1:38:52", "remaining_time": "3:01:07", "throughput": 2304.5, "total_tokens": 13672240} {"current_steps": 23715, "total_steps": 67140, "loss": 0.6151, "lr": 4.085461946607806e-05, "epoch": 3.532171581769437, "percentage": 35.32, "elapsed_time": "1:38:54", "remaining_time": "3:01:05", "throughput": 2304.59, "total_tokens": 13675472} {"current_steps": 23720, "total_steps": 67140, "loss": 0.6711, "lr": 4.084959414518423e-05, "epoch": 3.532916294310396, "percentage": 35.33, "elapsed_time": "1:38:55", "remaining_time": "3:01:04", "throughput": 2304.64, "total_tokens": 13678384} {"current_steps": 23725, "total_steps": 67140, "loss": 0.8216, "lr": 4.0844567753239276e-05, "epoch": 3.5336610068513554, "percentage": 35.34, "elapsed_time": "1:38:56", "remaining_time": "3:01:02", "throughput": 2304.64, "total_tokens": 13680848} {"current_steps": 23730, "total_steps": 67140, "loss": 0.5728, "lr": 4.0839540290582856e-05, "epoch": 3.5344057193923146, "percentage": 35.34, "elapsed_time": "1:38:57", "remaining_time": "3:01:01", "throughput": 2304.74, "total_tokens": 13684208} {"current_steps": 23735, "total_steps": 67140, "loss": 0.7141, "lr": 4.08345117575547e-05, "epoch": 3.535150431933274, "percentage": 35.35, "elapsed_time": "1:38:58", "remaining_time": "3:01:00", "throughput": 2304.78, "total_tokens": 13687120} {"current_steps": 23740, "total_steps": 67140, "loss": 0.7898, "lr": 4.082948215449461e-05, "epoch": 3.535895144474233, "percentage": 35.36, "elapsed_time": "1:38:59", "remaining_time": "3:00:58", "throughput": 2304.84, "total_tokens": 13690096} {"current_steps": 23745, "total_steps": 67140, "loss": 0.6066, "lr": 4.0824451481742475e-05, "epoch": 3.5366398570151922, "percentage": 35.37, "elapsed_time": "1:39:00", "remaining_time": "3:00:57", "throughput": 2304.93, "total_tokens": 13693360} {"current_steps": 23750, "total_steps": 67140, "loss": 0.9377, "lr": 4.081941973963825e-05, "epoch": 3.5373845695561514, "percentage": 35.37, "elapsed_time": "1:39:02", "remaining_time": "3:00:55", "throughput": 2304.99, "total_tokens": 13696464} {"current_steps": 23755, "total_steps": 67140, "loss": 0.5657, "lr": 4.0814386928521964e-05, "epoch": 3.5381292820971106, "percentage": 35.38, "elapsed_time": "1:39:03", "remaining_time": "3:00:54", "throughput": 2305.03, "total_tokens": 13699312} {"current_steps": 23760, "total_steps": 67140, "loss": 0.7693, "lr": 4.0809353048733696e-05, "epoch": 3.53887399463807, "percentage": 35.39, "elapsed_time": "1:39:04", "remaining_time": "3:00:52", "throughput": 2305.06, "total_tokens": 13702096} {"current_steps": 23765, "total_steps": 67140, "loss": 0.665, "lr": 4.0804318100613624e-05, "epoch": 3.539618707179029, "percentage": 35.4, "elapsed_time": "1:39:05", "remaining_time": "3:00:51", "throughput": 2305.11, "total_tokens": 13704976} {"current_steps": 23770, "total_steps": 67140, "loss": 0.5095, "lr": 4.0799282084502e-05, "epoch": 3.5403634197199882, "percentage": 35.4, "elapsed_time": "1:39:06", "remaining_time": "3:00:50", "throughput": 2305.17, "total_tokens": 13707984} {"current_steps": 23775, "total_steps": 67140, "loss": 0.7324, "lr": 4.079424500073912e-05, "epoch": 3.5411081322609474, "percentage": 35.41, "elapsed_time": "1:39:07", "remaining_time": "3:00:48", "throughput": 2305.21, "total_tokens": 13710864} {"current_steps": 23780, "total_steps": 67140, "loss": 0.6408, "lr": 4.078920684966538e-05, "epoch": 3.541852844801906, "percentage": 35.42, "elapsed_time": "1:39:08", "remaining_time": "3:00:47", "throughput": 2305.27, "total_tokens": 13713808} {"current_steps": 23785, "total_steps": 67140, "loss": 0.5614, "lr": 4.078416763162123e-05, "epoch": 3.542597557342866, "percentage": 35.43, "elapsed_time": "1:39:10", "remaining_time": "3:00:45", "throughput": 2305.29, "total_tokens": 13716496} {"current_steps": 23790, "total_steps": 67140, "loss": 0.6, "lr": 4.0779127346947214e-05, "epoch": 3.5433422698838246, "percentage": 35.43, "elapsed_time": "1:39:11", "remaining_time": "3:00:44", "throughput": 2305.3, "total_tokens": 13719088} {"current_steps": 23795, "total_steps": 67140, "loss": 0.7158, "lr": 4.077408599598392e-05, "epoch": 3.5440869824247843, "percentage": 35.44, "elapsed_time": "1:39:12", "remaining_time": "3:00:42", "throughput": 2305.36, "total_tokens": 13722128} {"current_steps": 23800, "total_steps": 67140, "loss": 0.6356, "lr": 4.076904357907203e-05, "epoch": 3.544831694965743, "percentage": 35.45, "elapsed_time": "1:39:13", "remaining_time": "3:00:41", "throughput": 2305.4, "total_tokens": 13725008} {"current_steps": 23805, "total_steps": 67140, "loss": 0.6402, "lr": 4.076400009655228e-05, "epoch": 3.5455764075067027, "percentage": 35.46, "elapsed_time": "1:39:14", "remaining_time": "3:00:39", "throughput": 2305.45, "total_tokens": 13727856} {"current_steps": 23810, "total_steps": 67140, "loss": 0.5472, "lr": 4.0758955548765505e-05, "epoch": 3.5463211200476614, "percentage": 35.46, "elapsed_time": "1:39:15", "remaining_time": "3:00:38", "throughput": 2305.5, "total_tokens": 13730736} {"current_steps": 23815, "total_steps": 67140, "loss": 0.7836, "lr": 4.075390993605258e-05, "epoch": 3.5470658325886206, "percentage": 35.47, "elapsed_time": "1:39:16", "remaining_time": "3:00:36", "throughput": 2305.53, "total_tokens": 13733520} {"current_steps": 23820, "total_steps": 67140, "loss": 0.7285, "lr": 4.074886325875447e-05, "epoch": 3.54781054512958, "percentage": 35.48, "elapsed_time": "1:39:17", "remaining_time": "3:00:35", "throughput": 2305.6, "total_tokens": 13736624} {"current_steps": 23825, "total_steps": 67140, "loss": 0.7416, "lr": 4.074381551721221e-05, "epoch": 3.548555257670539, "percentage": 35.49, "elapsed_time": "1:39:19", "remaining_time": "3:00:33", "throughput": 2305.64, "total_tokens": 13739440} {"current_steps": 23830, "total_steps": 67140, "loss": 0.7092, "lr": 4.073876671176692e-05, "epoch": 3.5492999702114982, "percentage": 35.49, "elapsed_time": "1:39:20", "remaining_time": "3:00:32", "throughput": 2305.69, "total_tokens": 13742352} {"current_steps": 23835, "total_steps": 67140, "loss": 0.5018, "lr": 4.073371684275976e-05, "epoch": 3.5500446827524574, "percentage": 35.5, "elapsed_time": "1:39:21", "remaining_time": "3:00:31", "throughput": 2305.77, "total_tokens": 13745616} {"current_steps": 23840, "total_steps": 67140, "loss": 0.7062, "lr": 4.072866591053197e-05, "epoch": 3.5507893952934166, "percentage": 35.51, "elapsed_time": "1:39:22", "remaining_time": "3:00:29", "throughput": 2305.82, "total_tokens": 13748560} {"current_steps": 23845, "total_steps": 67140, "loss": 0.6774, "lr": 4.0723613915424894e-05, "epoch": 3.551534107834376, "percentage": 35.52, "elapsed_time": "1:39:23", "remaining_time": "3:00:28", "throughput": 2305.9, "total_tokens": 13751696} {"current_steps": 23850, "total_steps": 67140, "loss": 0.5184, "lr": 4.071856085777993e-05, "epoch": 3.552278820375335, "percentage": 35.52, "elapsed_time": "1:39:24", "remaining_time": "3:00:26", "throughput": 2305.96, "total_tokens": 13754704} {"current_steps": 23855, "total_steps": 67140, "loss": 0.611, "lr": 4.071350673793852e-05, "epoch": 3.5530235329162942, "percentage": 35.53, "elapsed_time": "1:39:25", "remaining_time": "3:00:25", "throughput": 2306.0, "total_tokens": 13757520} {"current_steps": 23860, "total_steps": 67140, "loss": 0.7806, "lr": 4.070845155624221e-05, "epoch": 3.5537682454572534, "percentage": 35.54, "elapsed_time": "1:39:27", "remaining_time": "3:00:23", "throughput": 2306.05, "total_tokens": 13760528} {"current_steps": 23865, "total_steps": 67140, "loss": 0.4979, "lr": 4.070339531303261e-05, "epoch": 3.5545129579982127, "percentage": 35.55, "elapsed_time": "1:39:28", "remaining_time": "3:00:22", "throughput": 2306.08, "total_tokens": 13763248} {"current_steps": 23870, "total_steps": 67140, "loss": 0.6537, "lr": 4.0698338008651405e-05, "epoch": 3.555257670539172, "percentage": 35.55, "elapsed_time": "1:39:29", "remaining_time": "3:00:20", "throughput": 2306.11, "total_tokens": 13766000} {"current_steps": 23875, "total_steps": 67140, "loss": 0.6188, "lr": 4.0693279643440326e-05, "epoch": 3.556002383080131, "percentage": 35.56, "elapsed_time": "1:39:30", "remaining_time": "3:00:19", "throughput": 2306.16, "total_tokens": 13768944} {"current_steps": 23880, "total_steps": 67140, "loss": 0.5502, "lr": 4.068822021774123e-05, "epoch": 3.5567470956210903, "percentage": 35.57, "elapsed_time": "1:39:31", "remaining_time": "3:00:17", "throughput": 2306.21, "total_tokens": 13771824} {"current_steps": 23885, "total_steps": 67140, "loss": 0.4835, "lr": 4.0683159731895994e-05, "epoch": 3.5574918081620495, "percentage": 35.57, "elapsed_time": "1:39:32", "remaining_time": "3:00:16", "throughput": 2306.29, "total_tokens": 13775056} {"current_steps": 23890, "total_steps": 67140, "loss": 0.7372, "lr": 4.067809818624658e-05, "epoch": 3.5582365207030087, "percentage": 35.58, "elapsed_time": "1:39:33", "remaining_time": "3:00:15", "throughput": 2306.34, "total_tokens": 13777968} {"current_steps": 23895, "total_steps": 67140, "loss": 0.6317, "lr": 4.067303558113503e-05, "epoch": 3.558981233243968, "percentage": 35.59, "elapsed_time": "1:39:35", "remaining_time": "3:00:13", "throughput": 2306.37, "total_tokens": 13780688} {"current_steps": 23900, "total_steps": 67140, "loss": 0.6701, "lr": 4.066797191690347e-05, "epoch": 3.559725945784927, "percentage": 35.6, "elapsed_time": "1:39:36", "remaining_time": "3:00:12", "throughput": 2306.39, "total_tokens": 13783312} {"current_steps": 23905, "total_steps": 67140, "loss": 0.7972, "lr": 4.066290719389406e-05, "epoch": 3.5604706583258863, "percentage": 35.6, "elapsed_time": "1:39:37", "remaining_time": "3:00:10", "throughput": 2306.42, "total_tokens": 13786096} {"current_steps": 23910, "total_steps": 67140, "loss": 0.6941, "lr": 4.065784141244907e-05, "epoch": 3.5612153708668455, "percentage": 35.61, "elapsed_time": "1:39:38", "remaining_time": "3:00:09", "throughput": 2306.44, "total_tokens": 13788752} {"current_steps": 23915, "total_steps": 67140, "loss": 0.7484, "lr": 4.065277457291081e-05, "epoch": 3.5619600834078047, "percentage": 35.62, "elapsed_time": "1:39:39", "remaining_time": "3:00:07", "throughput": 2306.49, "total_tokens": 13791664} {"current_steps": 23920, "total_steps": 67140, "loss": 0.6782, "lr": 4.0647706675621685e-05, "epoch": 3.562704795948764, "percentage": 35.63, "elapsed_time": "1:39:40", "remaining_time": "3:00:06", "throughput": 2306.54, "total_tokens": 13794576} {"current_steps": 23925, "total_steps": 67140, "loss": 0.7205, "lr": 4.064263772092416e-05, "epoch": 3.563449508489723, "percentage": 35.63, "elapsed_time": "1:39:41", "remaining_time": "3:00:04", "throughput": 2306.57, "total_tokens": 13797360} {"current_steps": 23930, "total_steps": 67140, "loss": 0.6958, "lr": 4.0637567709160786e-05, "epoch": 3.5641942210306823, "percentage": 35.64, "elapsed_time": "1:39:42", "remaining_time": "3:00:03", "throughput": 2306.58, "total_tokens": 13799888} {"current_steps": 23935, "total_steps": 67140, "loss": 0.5871, "lr": 4.0632496640674156e-05, "epoch": 3.5649389335716415, "percentage": 35.65, "elapsed_time": "1:39:43", "remaining_time": "3:00:01", "throughput": 2306.62, "total_tokens": 13802832} {"current_steps": 23940, "total_steps": 67140, "loss": 0.721, "lr": 4.0627424515806957e-05, "epoch": 3.5656836461126007, "percentage": 35.66, "elapsed_time": "1:39:45", "remaining_time": "3:00:00", "throughput": 2306.71, "total_tokens": 13806064} {"current_steps": 23945, "total_steps": 67140, "loss": 0.5664, "lr": 4.062235133490195e-05, "epoch": 3.5664283586535594, "percentage": 35.66, "elapsed_time": "1:39:46", "remaining_time": "2:59:58", "throughput": 2306.76, "total_tokens": 13809072} {"current_steps": 23950, "total_steps": 67140, "loss": 0.6321, "lr": 4.061727709830196e-05, "epoch": 3.567173071194519, "percentage": 35.67, "elapsed_time": "1:39:47", "remaining_time": "2:59:57", "throughput": 2306.83, "total_tokens": 13812208} {"current_steps": 23955, "total_steps": 67140, "loss": 0.6805, "lr": 4.061220180634987e-05, "epoch": 3.567917783735478, "percentage": 35.68, "elapsed_time": "1:39:48", "remaining_time": "2:59:56", "throughput": 2306.87, "total_tokens": 13815024} {"current_steps": 23960, "total_steps": 67140, "loss": 0.602, "lr": 4.060712545938866e-05, "epoch": 3.5686624962764375, "percentage": 35.69, "elapsed_time": "1:39:49", "remaining_time": "2:59:54", "throughput": 2306.9, "total_tokens": 13817808} {"current_steps": 23965, "total_steps": 67140, "loss": 0.6209, "lr": 4.0602048057761365e-05, "epoch": 3.5694072088173963, "percentage": 35.69, "elapsed_time": "1:39:50", "remaining_time": "2:59:53", "throughput": 2306.94, "total_tokens": 13820624} {"current_steps": 23970, "total_steps": 67140, "loss": 0.6113, "lr": 4.0596969601811095e-05, "epoch": 3.570151921358356, "percentage": 35.7, "elapsed_time": "1:39:52", "remaining_time": "2:59:51", "throughput": 2306.97, "total_tokens": 13823376} {"current_steps": 23975, "total_steps": 67140, "loss": 0.7212, "lr": 4.059189009188104e-05, "epoch": 3.5708966338993147, "percentage": 35.71, "elapsed_time": "1:39:53", "remaining_time": "2:59:50", "throughput": 2307.02, "total_tokens": 13826352} {"current_steps": 23980, "total_steps": 67140, "loss": 0.5651, "lr": 4.058680952831444e-05, "epoch": 3.5716413464402743, "percentage": 35.72, "elapsed_time": "1:39:54", "remaining_time": "2:59:48", "throughput": 2307.04, "total_tokens": 13829040} {"current_steps": 23985, "total_steps": 67140, "loss": 0.7206, "lr": 4.058172791145461e-05, "epoch": 3.572386058981233, "percentage": 35.72, "elapsed_time": "1:39:55", "remaining_time": "2:59:47", "throughput": 2307.12, "total_tokens": 13832336} {"current_steps": 23990, "total_steps": 67140, "loss": 0.6945, "lr": 4.0576645241644985e-05, "epoch": 3.5731307715221923, "percentage": 35.73, "elapsed_time": "1:39:56", "remaining_time": "2:59:45", "throughput": 2307.14, "total_tokens": 13835024} {"current_steps": 23995, "total_steps": 67140, "loss": 0.6265, "lr": 4.0571561519228984e-05, "epoch": 3.5738754840631515, "percentage": 35.74, "elapsed_time": "1:39:57", "remaining_time": "2:59:44", "throughput": 2307.17, "total_tokens": 13837680} {"current_steps": 24000, "total_steps": 67140, "loss": 0.5825, "lr": 4.056647674455017e-05, "epoch": 3.5746201966041107, "percentage": 35.75, "elapsed_time": "1:39:58", "remaining_time": "2:59:42", "throughput": 2307.21, "total_tokens": 13840560} {"current_steps": 24005, "total_steps": 67140, "loss": 0.7003, "lr": 4.056139091795215e-05, "epoch": 3.57536490914507, "percentage": 35.75, "elapsed_time": "1:39:59", "remaining_time": "2:59:41", "throughput": 2307.25, "total_tokens": 13843376} {"current_steps": 24010, "total_steps": 67140, "loss": 0.6508, "lr": 4.05563040397786e-05, "epoch": 3.576109621686029, "percentage": 35.76, "elapsed_time": "1:40:01", "remaining_time": "2:59:39", "throughput": 2307.29, "total_tokens": 13846224} {"current_steps": 24015, "total_steps": 67140, "loss": 0.6346, "lr": 4.055121611037326e-05, "epoch": 3.5768543342269883, "percentage": 35.77, "elapsed_time": "1:40:02", "remaining_time": "2:59:38", "throughput": 2307.36, "total_tokens": 13849360} {"current_steps": 24020, "total_steps": 67140, "loss": 0.6582, "lr": 4.054612713007997e-05, "epoch": 3.5775990467679475, "percentage": 35.78, "elapsed_time": "1:40:03", "remaining_time": "2:59:37", "throughput": 2307.41, "total_tokens": 13852368} {"current_steps": 24025, "total_steps": 67140, "loss": 0.7607, "lr": 4.054103709924262e-05, "epoch": 3.5783437593089067, "percentage": 35.78, "elapsed_time": "1:40:04", "remaining_time": "2:59:35", "throughput": 2307.48, "total_tokens": 13855536} {"current_steps": 24030, "total_steps": 67140, "loss": 0.6502, "lr": 4.0535946018205156e-05, "epoch": 3.579088471849866, "percentage": 35.79, "elapsed_time": "1:40:05", "remaining_time": "2:59:34", "throughput": 2307.51, "total_tokens": 13858288} {"current_steps": 24035, "total_steps": 67140, "loss": 0.7182, "lr": 4.0530853887311634e-05, "epoch": 3.579833184390825, "percentage": 35.8, "elapsed_time": "1:40:06", "remaining_time": "2:59:32", "throughput": 2307.53, "total_tokens": 13860880} {"current_steps": 24040, "total_steps": 67140, "loss": 0.6612, "lr": 4.052576070690615e-05, "epoch": 3.5805778969317843, "percentage": 35.81, "elapsed_time": "1:40:07", "remaining_time": "2:59:31", "throughput": 2307.57, "total_tokens": 13863792} {"current_steps": 24045, "total_steps": 67140, "loss": 0.5625, "lr": 4.052066647733287e-05, "epoch": 3.5813226094727435, "percentage": 35.81, "elapsed_time": "1:40:09", "remaining_time": "2:59:29", "throughput": 2307.62, "total_tokens": 13866704} {"current_steps": 24050, "total_steps": 67140, "loss": 0.6335, "lr": 4.051557119893606e-05, "epoch": 3.5820673220137027, "percentage": 35.82, "elapsed_time": "1:40:10", "remaining_time": "2:59:28", "throughput": 2307.67, "total_tokens": 13869616} {"current_steps": 24055, "total_steps": 67140, "loss": 0.6672, "lr": 4.051047487206003e-05, "epoch": 3.582812034554662, "percentage": 35.83, "elapsed_time": "1:40:11", "remaining_time": "2:59:26", "throughput": 2307.72, "total_tokens": 13872496} {"current_steps": 24060, "total_steps": 67140, "loss": 0.6604, "lr": 4.050537749704917e-05, "epoch": 3.583556747095621, "percentage": 35.84, "elapsed_time": "1:40:12", "remaining_time": "2:59:25", "throughput": 2307.76, "total_tokens": 13875376} {"current_steps": 24065, "total_steps": 67140, "loss": 0.6338, "lr": 4.050027907424794e-05, "epoch": 3.5843014596365803, "percentage": 35.84, "elapsed_time": "1:40:13", "remaining_time": "2:59:23", "throughput": 2307.8, "total_tokens": 13878160} {"current_steps": 24070, "total_steps": 67140, "loss": 0.7037, "lr": 4.049517960400086e-05, "epoch": 3.5850461721775395, "percentage": 35.85, "elapsed_time": "1:40:14", "remaining_time": "2:59:22", "throughput": 2307.83, "total_tokens": 13880912} {"current_steps": 24075, "total_steps": 67140, "loss": 0.6447, "lr": 4.049007908665255e-05, "epoch": 3.5857908847184987, "percentage": 35.86, "elapsed_time": "1:40:15", "remaining_time": "2:59:21", "throughput": 2307.88, "total_tokens": 13883856} {"current_steps": 24080, "total_steps": 67140, "loss": 0.6267, "lr": 4.0484977522547676e-05, "epoch": 3.586535597259458, "percentage": 35.87, "elapsed_time": "1:40:16", "remaining_time": "2:59:19", "throughput": 2307.92, "total_tokens": 13886768} {"current_steps": 24085, "total_steps": 67140, "loss": 0.6353, "lr": 4.047987491203097e-05, "epoch": 3.587280309800417, "percentage": 35.87, "elapsed_time": "1:40:18", "remaining_time": "2:59:18", "throughput": 2307.95, "total_tokens": 13889488} {"current_steps": 24090, "total_steps": 67140, "loss": 0.6608, "lr": 4.0474771255447256e-05, "epoch": 3.5880250223413763, "percentage": 35.88, "elapsed_time": "1:40:19", "remaining_time": "2:59:16", "throughput": 2307.99, "total_tokens": 13892336} {"current_steps": 24095, "total_steps": 67140, "loss": 0.7465, "lr": 4.046966655314142e-05, "epoch": 3.5887697348823355, "percentage": 35.89, "elapsed_time": "1:40:20", "remaining_time": "2:59:15", "throughput": 2308.02, "total_tokens": 13895152} {"current_steps": 24100, "total_steps": 67140, "loss": 0.4341, "lr": 4.0464560805458405e-05, "epoch": 3.5895144474232947, "percentage": 35.9, "elapsed_time": "1:40:21", "remaining_time": "2:59:13", "throughput": 2308.06, "total_tokens": 13898000} {"current_steps": 24105, "total_steps": 67140, "loss": 0.854, "lr": 4.045945401274326e-05, "epoch": 3.590259159964254, "percentage": 35.9, "elapsed_time": "1:40:22", "remaining_time": "2:59:12", "throughput": 2308.11, "total_tokens": 13900880} {"current_steps": 24110, "total_steps": 67140, "loss": 0.8519, "lr": 4.0454346175341054e-05, "epoch": 3.591003872505213, "percentage": 35.91, "elapsed_time": "1:40:23", "remaining_time": "2:59:10", "throughput": 2308.17, "total_tokens": 13903952} {"current_steps": 24115, "total_steps": 67140, "loss": 0.6142, "lr": 4.0449237293596975e-05, "epoch": 3.5917485850461723, "percentage": 35.92, "elapsed_time": "1:40:24", "remaining_time": "2:59:09", "throughput": 2308.21, "total_tokens": 13906768} {"current_steps": 24120, "total_steps": 67140, "loss": 0.6586, "lr": 4.0444127367856246e-05, "epoch": 3.592493297587131, "percentage": 35.92, "elapsed_time": "1:40:26", "remaining_time": "2:59:07", "throughput": 2308.24, "total_tokens": 13909520} {"current_steps": 24125, "total_steps": 67140, "loss": 0.5396, "lr": 4.043901639846418e-05, "epoch": 3.5932380101280907, "percentage": 35.93, "elapsed_time": "1:40:27", "remaining_time": "2:59:06", "throughput": 2308.29, "total_tokens": 13912464} {"current_steps": 24130, "total_steps": 67140, "loss": 0.6524, "lr": 4.043390438576616e-05, "epoch": 3.5939827226690495, "percentage": 35.94, "elapsed_time": "1:40:28", "remaining_time": "2:59:05", "throughput": 2308.35, "total_tokens": 13915536} {"current_steps": 24135, "total_steps": 67140, "loss": 0.5544, "lr": 4.042879133010763e-05, "epoch": 3.594727435210009, "percentage": 35.95, "elapsed_time": "1:40:29", "remaining_time": "2:59:03", "throughput": 2308.39, "total_tokens": 13918384} {"current_steps": 24140, "total_steps": 67140, "loss": 0.7706, "lr": 4.042367723183411e-05, "epoch": 3.595472147750968, "percentage": 35.95, "elapsed_time": "1:40:30", "remaining_time": "2:59:02", "throughput": 2308.48, "total_tokens": 13921648} {"current_steps": 24145, "total_steps": 67140, "loss": 0.715, "lr": 4.041856209129119e-05, "epoch": 3.5962168602919276, "percentage": 35.96, "elapsed_time": "1:40:31", "remaining_time": "2:59:00", "throughput": 2308.49, "total_tokens": 13924176} {"current_steps": 24150, "total_steps": 67140, "loss": 0.607, "lr": 4.0413445908824534e-05, "epoch": 3.5969615728328863, "percentage": 35.97, "elapsed_time": "1:40:32", "remaining_time": "2:58:59", "throughput": 2308.51, "total_tokens": 13926928} {"current_steps": 24155, "total_steps": 67140, "loss": 0.6578, "lr": 4.040832868477987e-05, "epoch": 3.597706285373846, "percentage": 35.98, "elapsed_time": "1:40:33", "remaining_time": "2:58:57", "throughput": 2308.53, "total_tokens": 13929616} {"current_steps": 24160, "total_steps": 67140, "loss": 0.5948, "lr": 4.040321041950299e-05, "epoch": 3.5984509979148047, "percentage": 35.98, "elapsed_time": "1:40:35", "remaining_time": "2:58:56", "throughput": 2308.56, "total_tokens": 13932368} {"current_steps": 24165, "total_steps": 67140, "loss": 0.7125, "lr": 4.039809111333979e-05, "epoch": 3.599195710455764, "percentage": 35.99, "elapsed_time": "1:40:36", "remaining_time": "2:58:54", "throughput": 2308.59, "total_tokens": 13935120} {"current_steps": 24170, "total_steps": 67140, "loss": 0.7409, "lr": 4.039297076663619e-05, "epoch": 3.599940422996723, "percentage": 36.0, "elapsed_time": "1:40:37", "remaining_time": "2:58:53", "throughput": 2308.63, "total_tokens": 13937904} {"current_steps": 24175, "total_steps": 67140, "loss": 0.7317, "lr": 4.03878493797382e-05, "epoch": 3.6006851355376823, "percentage": 36.01, "elapsed_time": "1:40:38", "remaining_time": "2:58:51", "throughput": 2308.66, "total_tokens": 13940688} {"current_steps": 24180, "total_steps": 67140, "loss": 0.7673, "lr": 4.0382726952991924e-05, "epoch": 3.6014298480786415, "percentage": 36.01, "elapsed_time": "1:40:39", "remaining_time": "2:58:50", "throughput": 2308.69, "total_tokens": 13943504} {"current_steps": 24185, "total_steps": 67140, "loss": 0.5815, "lr": 4.037760348674349e-05, "epoch": 3.6021745606196007, "percentage": 36.02, "elapsed_time": "1:40:40", "remaining_time": "2:58:48", "throughput": 2308.73, "total_tokens": 13946352} {"current_steps": 24190, "total_steps": 67140, "loss": 0.6832, "lr": 4.037247898133915e-05, "epoch": 3.60291927316056, "percentage": 36.03, "elapsed_time": "1:40:41", "remaining_time": "2:58:47", "throughput": 2308.79, "total_tokens": 13949328} {"current_steps": 24195, "total_steps": 67140, "loss": 0.6959, "lr": 4.036735343712516e-05, "epoch": 3.603663985701519, "percentage": 36.04, "elapsed_time": "1:40:42", "remaining_time": "2:58:45", "throughput": 2308.84, "total_tokens": 13952240} {"current_steps": 24200, "total_steps": 67140, "loss": 0.7776, "lr": 4.036222685444792e-05, "epoch": 3.6044086982424783, "percentage": 36.04, "elapsed_time": "1:40:44", "remaining_time": "2:58:44", "throughput": 2308.89, "total_tokens": 13955184} {"current_steps": 24205, "total_steps": 67140, "loss": 0.5575, "lr": 4.035709923365384e-05, "epoch": 3.6051534107834375, "percentage": 36.05, "elapsed_time": "1:40:45", "remaining_time": "2:58:43", "throughput": 2308.92, "total_tokens": 13957904} {"current_steps": 24210, "total_steps": 67140, "loss": 0.6665, "lr": 4.0351970575089435e-05, "epoch": 3.6058981233243967, "percentage": 36.06, "elapsed_time": "1:40:46", "remaining_time": "2:58:41", "throughput": 2308.97, "total_tokens": 13960848} {"current_steps": 24215, "total_steps": 67140, "loss": 0.6918, "lr": 4.0346840879101277e-05, "epoch": 3.606642835865356, "percentage": 36.07, "elapsed_time": "1:40:47", "remaining_time": "2:58:40", "throughput": 2309.03, "total_tokens": 13963824} {"current_steps": 24220, "total_steps": 67140, "loss": 0.5798, "lr": 4.0341710146036e-05, "epoch": 3.607387548406315, "percentage": 36.07, "elapsed_time": "1:40:48", "remaining_time": "2:58:38", "throughput": 2309.06, "total_tokens": 13966608} {"current_steps": 24225, "total_steps": 67140, "loss": 0.7709, "lr": 4.033657837624033e-05, "epoch": 3.6081322609472744, "percentage": 36.08, "elapsed_time": "1:40:49", "remaining_time": "2:58:37", "throughput": 2309.11, "total_tokens": 13969584} {"current_steps": 24230, "total_steps": 67140, "loss": 0.537, "lr": 4.033144557006104e-05, "epoch": 3.6088769734882336, "percentage": 36.09, "elapsed_time": "1:40:50", "remaining_time": "2:58:35", "throughput": 2309.15, "total_tokens": 13972464} {"current_steps": 24235, "total_steps": 67140, "loss": 0.7924, "lr": 4.032631172784501e-05, "epoch": 3.6096216860291928, "percentage": 36.1, "elapsed_time": "1:40:52", "remaining_time": "2:58:34", "throughput": 2309.18, "total_tokens": 13975216} {"current_steps": 24240, "total_steps": 67140, "loss": 0.5972, "lr": 4.0321176849939135e-05, "epoch": 3.610366398570152, "percentage": 36.1, "elapsed_time": "1:40:53", "remaining_time": "2:58:32", "throughput": 2309.25, "total_tokens": 13978320} {"current_steps": 24245, "total_steps": 67140, "loss": 0.6611, "lr": 4.031604093669042e-05, "epoch": 3.611111111111111, "percentage": 36.11, "elapsed_time": "1:40:54", "remaining_time": "2:58:31", "throughput": 2309.29, "total_tokens": 13981200} {"current_steps": 24250, "total_steps": 67140, "loss": 0.667, "lr": 4.031090398844593e-05, "epoch": 3.6118558236520704, "percentage": 36.12, "elapsed_time": "1:40:55", "remaining_time": "2:58:30", "throughput": 2309.34, "total_tokens": 13984112} {"current_steps": 24255, "total_steps": 67140, "loss": 0.6576, "lr": 4.030576600555279e-05, "epoch": 3.6126005361930296, "percentage": 36.13, "elapsed_time": "1:40:56", "remaining_time": "2:58:28", "throughput": 2309.38, "total_tokens": 13986992} {"current_steps": 24260, "total_steps": 67140, "loss": 0.6787, "lr": 4.030062698835822e-05, "epoch": 3.6133452487339888, "percentage": 36.13, "elapsed_time": "1:40:57", "remaining_time": "2:58:27", "throughput": 2309.45, "total_tokens": 13990160} {"current_steps": 24265, "total_steps": 67140, "loss": 0.6739, "lr": 4.029548693720949e-05, "epoch": 3.614089961274948, "percentage": 36.14, "elapsed_time": "1:40:58", "remaining_time": "2:58:25", "throughput": 2309.51, "total_tokens": 13993200} {"current_steps": 24270, "total_steps": 67140, "loss": 0.6637, "lr": 4.029034585245393e-05, "epoch": 3.614834673815907, "percentage": 36.15, "elapsed_time": "1:41:00", "remaining_time": "2:58:24", "throughput": 2309.56, "total_tokens": 13996176} {"current_steps": 24275, "total_steps": 67140, "loss": 0.5997, "lr": 4.028520373443897e-05, "epoch": 3.6155793863568664, "percentage": 36.16, "elapsed_time": "1:41:01", "remaining_time": "2:58:23", "throughput": 2309.61, "total_tokens": 13999152} {"current_steps": 24280, "total_steps": 67140, "loss": 0.681, "lr": 4.028006058351208e-05, "epoch": 3.6163240988978256, "percentage": 36.16, "elapsed_time": "1:41:02", "remaining_time": "2:58:21", "throughput": 2309.64, "total_tokens": 14001904} {"current_steps": 24285, "total_steps": 67140, "loss": 0.6267, "lr": 4.027491640002083e-05, "epoch": 3.617068811438785, "percentage": 36.17, "elapsed_time": "1:41:03", "remaining_time": "2:58:20", "throughput": 2309.64, "total_tokens": 14004432} {"current_steps": 24290, "total_steps": 67140, "loss": 0.6589, "lr": 4.0269771184312824e-05, "epoch": 3.617813523979744, "percentage": 36.18, "elapsed_time": "1:41:04", "remaining_time": "2:58:18", "throughput": 2309.7, "total_tokens": 14007440} {"current_steps": 24295, "total_steps": 67140, "loss": 0.6741, "lr": 4.0264624936735776e-05, "epoch": 3.6185582365207027, "percentage": 36.19, "elapsed_time": "1:41:05", "remaining_time": "2:58:17", "throughput": 2309.76, "total_tokens": 14010576} {"current_steps": 24300, "total_steps": 67140, "loss": 0.6698, "lr": 4.0259477657637424e-05, "epoch": 3.6193029490616624, "percentage": 36.19, "elapsed_time": "1:41:06", "remaining_time": "2:58:15", "throughput": 2309.79, "total_tokens": 14013328} {"current_steps": 24305, "total_steps": 67140, "loss": 0.5818, "lr": 4.0254329347365614e-05, "epoch": 3.620047661602621, "percentage": 36.2, "elapsed_time": "1:41:08", "remaining_time": "2:58:14", "throughput": 2309.84, "total_tokens": 14016272} {"current_steps": 24310, "total_steps": 67140, "loss": 0.6223, "lr": 4.024918000626825e-05, "epoch": 3.620792374143581, "percentage": 36.21, "elapsed_time": "1:41:09", "remaining_time": "2:58:12", "throughput": 2309.86, "total_tokens": 14018928} {"current_steps": 24315, "total_steps": 67140, "loss": 0.8281, "lr": 4.024402963469329e-05, "epoch": 3.6215370866845396, "percentage": 36.22, "elapsed_time": "1:41:10", "remaining_time": "2:58:11", "throughput": 2309.9, "total_tokens": 14021744} {"current_steps": 24320, "total_steps": 67140, "loss": 0.6651, "lr": 4.02388782329888e-05, "epoch": 3.622281799225499, "percentage": 36.22, "elapsed_time": "1:41:11", "remaining_time": "2:58:09", "throughput": 2309.91, "total_tokens": 14024304} {"current_steps": 24325, "total_steps": 67140, "loss": 0.7558, "lr": 4.023372580150286e-05, "epoch": 3.623026511766458, "percentage": 36.23, "elapsed_time": "1:41:12", "remaining_time": "2:58:08", "throughput": 2309.94, "total_tokens": 14027120} {"current_steps": 24330, "total_steps": 67140, "loss": 0.7639, "lr": 4.022857234058368e-05, "epoch": 3.6237712243074176, "percentage": 36.24, "elapsed_time": "1:41:13", "remaining_time": "2:58:06", "throughput": 2309.97, "total_tokens": 14029840} {"current_steps": 24335, "total_steps": 67140, "loss": 0.7804, "lr": 4.022341785057949e-05, "epoch": 3.6245159368483764, "percentage": 36.25, "elapsed_time": "1:41:14", "remaining_time": "2:58:05", "throughput": 2310.02, "total_tokens": 14032752} {"current_steps": 24340, "total_steps": 67140, "loss": 0.6222, "lr": 4.021826233183862e-05, "epoch": 3.6252606493893356, "percentage": 36.25, "elapsed_time": "1:41:15", "remaining_time": "2:58:03", "throughput": 2310.07, "total_tokens": 14035696} {"current_steps": 24345, "total_steps": 67140, "loss": 0.7502, "lr": 4.0213105784709445e-05, "epoch": 3.6260053619302948, "percentage": 36.26, "elapsed_time": "1:41:17", "remaining_time": "2:58:02", "throughput": 2310.12, "total_tokens": 14038704} {"current_steps": 24350, "total_steps": 67140, "loss": 0.5205, "lr": 4.020794820954044e-05, "epoch": 3.626750074471254, "percentage": 36.27, "elapsed_time": "1:41:18", "remaining_time": "2:58:01", "throughput": 2310.15, "total_tokens": 14041424} {"current_steps": 24355, "total_steps": 67140, "loss": 0.7087, "lr": 4.0202789606680136e-05, "epoch": 3.627494787012213, "percentage": 36.27, "elapsed_time": "1:41:19", "remaining_time": "2:57:59", "throughput": 2310.19, "total_tokens": 14044304} {"current_steps": 24360, "total_steps": 67140, "loss": 0.5351, "lr": 4.01976299764771e-05, "epoch": 3.6282394995531724, "percentage": 36.28, "elapsed_time": "1:41:20", "remaining_time": "2:57:58", "throughput": 2310.24, "total_tokens": 14047216} {"current_steps": 24365, "total_steps": 67140, "loss": 0.633, "lr": 4.019246931928004e-05, "epoch": 3.6289842120941316, "percentage": 36.29, "elapsed_time": "1:41:21", "remaining_time": "2:57:56", "throughput": 2310.27, "total_tokens": 14050032} {"current_steps": 24370, "total_steps": 67140, "loss": 0.6877, "lr": 4.018730763543765e-05, "epoch": 3.629728924635091, "percentage": 36.3, "elapsed_time": "1:41:22", "remaining_time": "2:57:55", "throughput": 2310.28, "total_tokens": 14052592} {"current_steps": 24375, "total_steps": 67140, "loss": 0.6913, "lr": 4.018214492529877e-05, "epoch": 3.63047363717605, "percentage": 36.3, "elapsed_time": "1:41:23", "remaining_time": "2:57:53", "throughput": 2310.32, "total_tokens": 14055440} {"current_steps": 24380, "total_steps": 67140, "loss": 0.7733, "lr": 4.017698118921226e-05, "epoch": 3.631218349717009, "percentage": 36.31, "elapsed_time": "1:41:24", "remaining_time": "2:57:52", "throughput": 2310.33, "total_tokens": 14058064} {"current_steps": 24385, "total_steps": 67140, "loss": 0.717, "lr": 4.0171816427527064e-05, "epoch": 3.6319630622579684, "percentage": 36.32, "elapsed_time": "1:41:25", "remaining_time": "2:57:50", "throughput": 2310.37, "total_tokens": 14060880} {"current_steps": 24390, "total_steps": 67140, "loss": 0.5494, "lr": 4.016665064059219e-05, "epoch": 3.6327077747989276, "percentage": 36.33, "elapsed_time": "1:41:27", "remaining_time": "2:57:49", "throughput": 2310.43, "total_tokens": 14063952} {"current_steps": 24395, "total_steps": 67140, "loss": 0.821, "lr": 4.016148382875675e-05, "epoch": 3.633452487339887, "percentage": 36.33, "elapsed_time": "1:41:28", "remaining_time": "2:57:47", "throughput": 2310.47, "total_tokens": 14066768} {"current_steps": 24400, "total_steps": 67140, "loss": 0.6, "lr": 4.0156315992369864e-05, "epoch": 3.634197199880846, "percentage": 36.34, "elapsed_time": "1:41:29", "remaining_time": "2:57:46", "throughput": 2310.51, "total_tokens": 14069712} {"current_steps": 24405, "total_steps": 67140, "loss": 0.4798, "lr": 4.015114713178077e-05, "epoch": 3.634941912421805, "percentage": 36.35, "elapsed_time": "1:41:30", "remaining_time": "2:57:45", "throughput": 2310.57, "total_tokens": 14072720} {"current_steps": 24410, "total_steps": 67140, "loss": 0.6314, "lr": 4.014597724733874e-05, "epoch": 3.6356866249627644, "percentage": 36.36, "elapsed_time": "1:41:31", "remaining_time": "2:57:43", "throughput": 2310.59, "total_tokens": 14075376} {"current_steps": 24415, "total_steps": 67140, "loss": 0.7409, "lr": 4.0140806339393156e-05, "epoch": 3.6364313375037236, "percentage": 36.36, "elapsed_time": "1:41:32", "remaining_time": "2:57:42", "throughput": 2310.63, "total_tokens": 14078192} {"current_steps": 24420, "total_steps": 67140, "loss": 0.699, "lr": 4.013563440829343e-05, "epoch": 3.637176050044683, "percentage": 36.37, "elapsed_time": "1:41:33", "remaining_time": "2:57:40", "throughput": 2310.67, "total_tokens": 14081072} {"current_steps": 24425, "total_steps": 67140, "loss": 0.8155, "lr": 4.013046145438908e-05, "epoch": 3.637920762585642, "percentage": 36.38, "elapsed_time": "1:41:35", "remaining_time": "2:57:39", "throughput": 2310.72, "total_tokens": 14084080} {"current_steps": 24430, "total_steps": 67140, "loss": 0.616, "lr": 4.012528747802965e-05, "epoch": 3.638665475126601, "percentage": 36.39, "elapsed_time": "1:41:36", "remaining_time": "2:57:37", "throughput": 2310.77, "total_tokens": 14087024} {"current_steps": 24435, "total_steps": 67140, "loss": 0.6753, "lr": 4.0120112479564795e-05, "epoch": 3.6394101876675604, "percentage": 36.39, "elapsed_time": "1:41:37", "remaining_time": "2:57:36", "throughput": 2310.8, "total_tokens": 14089808} {"current_steps": 24440, "total_steps": 67140, "loss": 0.8113, "lr": 4.01149364593442e-05, "epoch": 3.6401549002085196, "percentage": 36.4, "elapsed_time": "1:41:38", "remaining_time": "2:57:34", "throughput": 2310.85, "total_tokens": 14092784} {"current_steps": 24445, "total_steps": 67140, "loss": 0.5204, "lr": 4.010975941771766e-05, "epoch": 3.640899612749479, "percentage": 36.41, "elapsed_time": "1:41:39", "remaining_time": "2:57:33", "throughput": 2310.89, "total_tokens": 14095600} {"current_steps": 24450, "total_steps": 67140, "loss": 0.6188, "lr": 4.0104581355035015e-05, "epoch": 3.641644325290438, "percentage": 36.42, "elapsed_time": "1:41:40", "remaining_time": "2:57:32", "throughput": 2310.94, "total_tokens": 14098544} {"current_steps": 24455, "total_steps": 67140, "loss": 0.7214, "lr": 4.0099402271646166e-05, "epoch": 3.6423890378313972, "percentage": 36.42, "elapsed_time": "1:41:41", "remaining_time": "2:57:30", "throughput": 2311.0, "total_tokens": 14101552} {"current_steps": 24460, "total_steps": 67140, "loss": 0.6886, "lr": 4.009422216790111e-05, "epoch": 3.6431337503723564, "percentage": 36.43, "elapsed_time": "1:41:43", "remaining_time": "2:57:29", "throughput": 2311.07, "total_tokens": 14104656} {"current_steps": 24465, "total_steps": 67140, "loss": 0.5042, "lr": 4.008904104414988e-05, "epoch": 3.6438784629133156, "percentage": 36.44, "elapsed_time": "1:41:44", "remaining_time": "2:57:27", "throughput": 2311.1, "total_tokens": 14107504} {"current_steps": 24470, "total_steps": 67140, "loss": 0.5816, "lr": 4.0083858900742604e-05, "epoch": 3.6446231754542744, "percentage": 36.45, "elapsed_time": "1:41:45", "remaining_time": "2:57:26", "throughput": 2311.14, "total_tokens": 14110384} {"current_steps": 24475, "total_steps": 67140, "loss": 0.7465, "lr": 4.007867573802947e-05, "epoch": 3.645367887995234, "percentage": 36.45, "elapsed_time": "1:41:46", "remaining_time": "2:57:24", "throughput": 2311.18, "total_tokens": 14113264} {"current_steps": 24480, "total_steps": 67140, "loss": 0.7177, "lr": 4.007349155636074e-05, "epoch": 3.646112600536193, "percentage": 36.46, "elapsed_time": "1:41:47", "remaining_time": "2:57:23", "throughput": 2311.21, "total_tokens": 14115984} {"current_steps": 24485, "total_steps": 67140, "loss": 0.61, "lr": 4.006830635608673e-05, "epoch": 3.6468573130771524, "percentage": 36.47, "elapsed_time": "1:41:48", "remaining_time": "2:57:21", "throughput": 2311.27, "total_tokens": 14118960} {"current_steps": 24490, "total_steps": 67140, "loss": 0.7285, "lr": 4.006312013755784e-05, "epoch": 3.647602025618111, "percentage": 36.48, "elapsed_time": "1:41:49", "remaining_time": "2:57:20", "throughput": 2311.35, "total_tokens": 14122160} {"current_steps": 24495, "total_steps": 67140, "loss": 0.6126, "lr": 4.005793290112454e-05, "epoch": 3.648346738159071, "percentage": 36.48, "elapsed_time": "1:41:51", "remaining_time": "2:57:19", "throughput": 2311.35, "total_tokens": 14124688} {"current_steps": 24500, "total_steps": 67140, "loss": 0.696, "lr": 4.005274464713735e-05, "epoch": 3.6490914507000296, "percentage": 36.49, "elapsed_time": "1:41:52", "remaining_time": "2:57:17", "throughput": 2311.38, "total_tokens": 14127504} {"current_steps": 24505, "total_steps": 67140, "loss": 0.5622, "lr": 4.0047555375946876e-05, "epoch": 3.6498361632409893, "percentage": 36.5, "elapsed_time": "1:41:53", "remaining_time": "2:57:16", "throughput": 2311.42, "total_tokens": 14130352} {"current_steps": 24510, "total_steps": 67140, "loss": 0.6014, "lr": 4.004236508790379e-05, "epoch": 3.650580875781948, "percentage": 36.51, "elapsed_time": "1:41:54", "remaining_time": "2:57:14", "throughput": 2311.5, "total_tokens": 14133552} {"current_steps": 24515, "total_steps": 67140, "loss": 0.6513, "lr": 4.003717378335883e-05, "epoch": 3.651325588322907, "percentage": 36.51, "elapsed_time": "1:41:55", "remaining_time": "2:57:13", "throughput": 2311.52, "total_tokens": 14136240} {"current_steps": 24520, "total_steps": 67140, "loss": 0.7191, "lr": 4.0031981462662806e-05, "epoch": 3.6520703008638664, "percentage": 36.52, "elapsed_time": "1:41:56", "remaining_time": "2:57:11", "throughput": 2311.58, "total_tokens": 14139280} {"current_steps": 24525, "total_steps": 67140, "loss": 0.73, "lr": 4.002678812616658e-05, "epoch": 3.6528150134048256, "percentage": 36.53, "elapsed_time": "1:41:57", "remaining_time": "2:57:10", "throughput": 2311.62, "total_tokens": 14142160} {"current_steps": 24530, "total_steps": 67140, "loss": 0.7637, "lr": 4.002159377422111e-05, "epoch": 3.653559725945785, "percentage": 36.54, "elapsed_time": "1:41:59", "remaining_time": "2:57:09", "throughput": 2311.67, "total_tokens": 14145104} {"current_steps": 24535, "total_steps": 67140, "loss": 0.7711, "lr": 4.001639840717741e-05, "epoch": 3.654304438486744, "percentage": 36.54, "elapsed_time": "1:42:00", "remaining_time": "2:57:07", "throughput": 2311.72, "total_tokens": 14148016} {"current_steps": 24540, "total_steps": 67140, "loss": 0.5954, "lr": 4.001120202538656e-05, "epoch": 3.6550491510277032, "percentage": 36.55, "elapsed_time": "1:42:01", "remaining_time": "2:57:06", "throughput": 2311.74, "total_tokens": 14150768} {"current_steps": 24545, "total_steps": 67140, "loss": 0.7862, "lr": 4.000600462919971e-05, "epoch": 3.6557938635686624, "percentage": 36.56, "elapsed_time": "1:42:02", "remaining_time": "2:57:04", "throughput": 2311.79, "total_tokens": 14153648} {"current_steps": 24550, "total_steps": 67140, "loss": 0.4991, "lr": 4.000080621896807e-05, "epoch": 3.6565385761096216, "percentage": 36.57, "elapsed_time": "1:42:03", "remaining_time": "2:57:03", "throughput": 2311.84, "total_tokens": 14156688} {"current_steps": 24555, "total_steps": 67140, "loss": 0.6425, "lr": 3.9995606795042936e-05, "epoch": 3.657283288650581, "percentage": 36.57, "elapsed_time": "1:42:04", "remaining_time": "2:57:01", "throughput": 2311.88, "total_tokens": 14159504} {"current_steps": 24560, "total_steps": 67140, "loss": 0.7374, "lr": 3.9990406357775664e-05, "epoch": 3.65802800119154, "percentage": 36.58, "elapsed_time": "1:42:05", "remaining_time": "2:57:00", "throughput": 2311.93, "total_tokens": 14162544} {"current_steps": 24565, "total_steps": 67140, "loss": 0.7062, "lr": 3.998520490751767e-05, "epoch": 3.6587727137324992, "percentage": 36.59, "elapsed_time": "1:42:06", "remaining_time": "2:56:59", "throughput": 2311.99, "total_tokens": 14165520} {"current_steps": 24570, "total_steps": 67140, "loss": 0.5305, "lr": 3.998000244462046e-05, "epoch": 3.6595174262734584, "percentage": 36.6, "elapsed_time": "1:42:08", "remaining_time": "2:56:57", "throughput": 2312.02, "total_tokens": 14168272} {"current_steps": 24575, "total_steps": 67140, "loss": 0.6513, "lr": 3.997479896943559e-05, "epoch": 3.6602621388144176, "percentage": 36.6, "elapsed_time": "1:42:09", "remaining_time": "2:56:56", "throughput": 2312.08, "total_tokens": 14171312} {"current_steps": 24580, "total_steps": 67140, "loss": 0.6227, "lr": 3.996959448231469e-05, "epoch": 3.661006851355377, "percentage": 36.61, "elapsed_time": "1:42:10", "remaining_time": "2:56:54", "throughput": 2312.12, "total_tokens": 14174160} {"current_steps": 24585, "total_steps": 67140, "loss": 0.8717, "lr": 3.9964388983609455e-05, "epoch": 3.661751563896336, "percentage": 36.62, "elapsed_time": "1:42:11", "remaining_time": "2:56:53", "throughput": 2312.17, "total_tokens": 14177104} {"current_steps": 24590, "total_steps": 67140, "loss": 0.7574, "lr": 3.995918247367165e-05, "epoch": 3.6624962764372953, "percentage": 36.62, "elapsed_time": "1:42:12", "remaining_time": "2:56:51", "throughput": 2312.2, "total_tokens": 14179888} {"current_steps": 24595, "total_steps": 67140, "loss": 0.6333, "lr": 3.9953974952853125e-05, "epoch": 3.6632409889782545, "percentage": 36.63, "elapsed_time": "1:42:13", "remaining_time": "2:56:50", "throughput": 2312.22, "total_tokens": 14182544} {"current_steps": 24600, "total_steps": 67140, "loss": 0.6424, "lr": 3.994876642150576e-05, "epoch": 3.6639857015192137, "percentage": 36.64, "elapsed_time": "1:42:14", "remaining_time": "2:56:48", "throughput": 2312.25, "total_tokens": 14185264} {"current_steps": 24605, "total_steps": 67140, "loss": 0.7045, "lr": 3.9943556879981534e-05, "epoch": 3.664730414060173, "percentage": 36.65, "elapsed_time": "1:42:16", "remaining_time": "2:56:47", "throughput": 2312.3, "total_tokens": 14188272} {"current_steps": 24610, "total_steps": 67140, "loss": 0.4465, "lr": 3.993834632863249e-05, "epoch": 3.665475126601132, "percentage": 36.65, "elapsed_time": "1:42:17", "remaining_time": "2:56:46", "throughput": 2312.37, "total_tokens": 14191440} {"current_steps": 24615, "total_steps": 67140, "loss": 0.5006, "lr": 3.993313476781075e-05, "epoch": 3.6662198391420913, "percentage": 36.66, "elapsed_time": "1:42:18", "remaining_time": "2:56:44", "throughput": 2312.41, "total_tokens": 14194256} {"current_steps": 24620, "total_steps": 67140, "loss": 0.6256, "lr": 3.992792219786847e-05, "epoch": 3.6669645516830505, "percentage": 36.67, "elapsed_time": "1:42:19", "remaining_time": "2:56:43", "throughput": 2312.46, "total_tokens": 14197296} {"current_steps": 24625, "total_steps": 67140, "loss": 0.5116, "lr": 3.9922708619157894e-05, "epoch": 3.6677092642240097, "percentage": 36.68, "elapsed_time": "1:42:20", "remaining_time": "2:56:41", "throughput": 2312.51, "total_tokens": 14200176} {"current_steps": 24630, "total_steps": 67140, "loss": 0.659, "lr": 3.9917494032031346e-05, "epoch": 3.668453976764969, "percentage": 36.68, "elapsed_time": "1:42:21", "remaining_time": "2:56:40", "throughput": 2312.55, "total_tokens": 14203088} {"current_steps": 24635, "total_steps": 67140, "loss": 0.6733, "lr": 3.99122784368412e-05, "epoch": 3.669198689305928, "percentage": 36.69, "elapsed_time": "1:42:22", "remaining_time": "2:56:38", "throughput": 2312.6, "total_tokens": 14206000} {"current_steps": 24640, "total_steps": 67140, "loss": 0.8641, "lr": 3.990706183393991e-05, "epoch": 3.6699434018468873, "percentage": 36.7, "elapsed_time": "1:42:24", "remaining_time": "2:56:37", "throughput": 2312.68, "total_tokens": 14209232} {"current_steps": 24645, "total_steps": 67140, "loss": 0.6302, "lr": 3.990184422367998e-05, "epoch": 3.670688114387846, "percentage": 36.71, "elapsed_time": "1:42:25", "remaining_time": "2:56:35", "throughput": 2312.68, "total_tokens": 14211792} {"current_steps": 24650, "total_steps": 67140, "loss": 0.7426, "lr": 3.989662560641401e-05, "epoch": 3.6714328269288057, "percentage": 36.71, "elapsed_time": "1:42:26", "remaining_time": "2:56:34", "throughput": 2312.72, "total_tokens": 14214640} {"current_steps": 24655, "total_steps": 67140, "loss": 0.5657, "lr": 3.9891405982494647e-05, "epoch": 3.6721775394697644, "percentage": 36.72, "elapsed_time": "1:42:27", "remaining_time": "2:56:33", "throughput": 2312.8, "total_tokens": 14217904} {"current_steps": 24660, "total_steps": 67140, "loss": 0.5596, "lr": 3.988618535227461e-05, "epoch": 3.672922252010724, "percentage": 36.73, "elapsed_time": "1:42:28", "remaining_time": "2:56:31", "throughput": 2312.88, "total_tokens": 14221136} {"current_steps": 24665, "total_steps": 67140, "loss": 0.6462, "lr": 3.988096371610669e-05, "epoch": 3.673666964551683, "percentage": 36.74, "elapsed_time": "1:42:29", "remaining_time": "2:56:30", "throughput": 2312.94, "total_tokens": 14224176} {"current_steps": 24670, "total_steps": 67140, "loss": 0.6016, "lr": 3.9875741074343744e-05, "epoch": 3.6744116770926425, "percentage": 36.74, "elapsed_time": "1:42:30", "remaining_time": "2:56:29", "throughput": 2312.99, "total_tokens": 14227152} {"current_steps": 24675, "total_steps": 67140, "loss": 0.7594, "lr": 3.98705174273387e-05, "epoch": 3.6751563896336013, "percentage": 36.75, "elapsed_time": "1:42:32", "remaining_time": "2:56:27", "throughput": 2313.0, "total_tokens": 14229776} {"current_steps": 24680, "total_steps": 67140, "loss": 0.6809, "lr": 3.986529277544454e-05, "epoch": 3.675901102174561, "percentage": 36.76, "elapsed_time": "1:42:33", "remaining_time": "2:56:26", "throughput": 2313.05, "total_tokens": 14232720} {"current_steps": 24685, "total_steps": 67140, "loss": 0.5604, "lr": 3.9860067119014334e-05, "epoch": 3.6766458147155197, "percentage": 36.77, "elapsed_time": "1:42:34", "remaining_time": "2:56:24", "throughput": 2313.08, "total_tokens": 14235536} {"current_steps": 24690, "total_steps": 67140, "loss": 0.7306, "lr": 3.985484045840121e-05, "epoch": 3.677390527256479, "percentage": 36.77, "elapsed_time": "1:42:35", "remaining_time": "2:56:23", "throughput": 2313.13, "total_tokens": 14238448} {"current_steps": 24695, "total_steps": 67140, "loss": 0.7712, "lr": 3.984961279395836e-05, "epoch": 3.678135239797438, "percentage": 36.78, "elapsed_time": "1:42:36", "remaining_time": "2:56:21", "throughput": 2313.15, "total_tokens": 14241168} {"current_steps": 24700, "total_steps": 67140, "loss": 0.5615, "lr": 3.9844384126039055e-05, "epoch": 3.6788799523383973, "percentage": 36.79, "elapsed_time": "1:42:37", "remaining_time": "2:56:20", "throughput": 2313.2, "total_tokens": 14244080} {"current_steps": 24705, "total_steps": 67140, "loss": 0.6598, "lr": 3.983915445499663e-05, "epoch": 3.6796246648793565, "percentage": 36.8, "elapsed_time": "1:42:38", "remaining_time": "2:56:18", "throughput": 2313.26, "total_tokens": 14247088} {"current_steps": 24710, "total_steps": 67140, "loss": 0.7473, "lr": 3.983392378118447e-05, "epoch": 3.6803693774203157, "percentage": 36.8, "elapsed_time": "1:42:40", "remaining_time": "2:56:17", "throughput": 2313.33, "total_tokens": 14250288} {"current_steps": 24715, "total_steps": 67140, "loss": 0.4832, "lr": 3.9828692104956054e-05, "epoch": 3.681114089961275, "percentage": 36.81, "elapsed_time": "1:42:41", "remaining_time": "2:56:16", "throughput": 2313.45, "total_tokens": 14253872} {"current_steps": 24720, "total_steps": 67140, "loss": 0.6859, "lr": 3.982345942666492e-05, "epoch": 3.681858802502234, "percentage": 36.82, "elapsed_time": "1:42:42", "remaining_time": "2:56:14", "throughput": 2313.48, "total_tokens": 14256688} {"current_steps": 24725, "total_steps": 67140, "loss": 0.6112, "lr": 3.981822574666466e-05, "epoch": 3.6826035150431933, "percentage": 36.83, "elapsed_time": "1:42:43", "remaining_time": "2:56:13", "throughput": 2313.49, "total_tokens": 14259280} {"current_steps": 24730, "total_steps": 67140, "loss": 0.605, "lr": 3.9812991065308946e-05, "epoch": 3.6833482275841525, "percentage": 36.83, "elapsed_time": "1:42:44", "remaining_time": "2:56:11", "throughput": 2313.5, "total_tokens": 14261872} {"current_steps": 24735, "total_steps": 67140, "loss": 0.7541, "lr": 3.980775538295153e-05, "epoch": 3.6840929401251117, "percentage": 36.84, "elapsed_time": "1:42:45", "remaining_time": "2:56:10", "throughput": 2313.54, "total_tokens": 14264752} {"current_steps": 24740, "total_steps": 67140, "loss": 0.5684, "lr": 3.98025186999462e-05, "epoch": 3.684837652666071, "percentage": 36.85, "elapsed_time": "1:42:46", "remaining_time": "2:56:09", "throughput": 2313.6, "total_tokens": 14267792} {"current_steps": 24745, "total_steps": 67140, "loss": 0.6911, "lr": 3.979728101664685e-05, "epoch": 3.68558236520703, "percentage": 36.86, "elapsed_time": "1:42:48", "remaining_time": "2:56:07", "throughput": 2313.63, "total_tokens": 14270544} {"current_steps": 24750, "total_steps": 67140, "loss": 0.7071, "lr": 3.9792042333407404e-05, "epoch": 3.6863270777479893, "percentage": 36.86, "elapsed_time": "1:42:49", "remaining_time": "2:56:06", "throughput": 2313.67, "total_tokens": 14273488} {"current_steps": 24755, "total_steps": 67140, "loss": 0.6786, "lr": 3.978680265058187e-05, "epoch": 3.6870717902889485, "percentage": 36.87, "elapsed_time": "1:42:50", "remaining_time": "2:56:04", "throughput": 2313.73, "total_tokens": 14276560} {"current_steps": 24760, "total_steps": 67140, "loss": 0.6232, "lr": 3.978156196852435e-05, "epoch": 3.6878165028299077, "percentage": 36.88, "elapsed_time": "1:42:51", "remaining_time": "2:56:03", "throughput": 2313.77, "total_tokens": 14279472} {"current_steps": 24765, "total_steps": 67140, "loss": 0.6607, "lr": 3.977632028758895e-05, "epoch": 3.688561215370867, "percentage": 36.89, "elapsed_time": "1:42:52", "remaining_time": "2:56:01", "throughput": 2313.82, "total_tokens": 14282416} {"current_steps": 24770, "total_steps": 67140, "loss": 0.5073, "lr": 3.977107760812991e-05, "epoch": 3.689305927911826, "percentage": 36.89, "elapsed_time": "1:42:53", "remaining_time": "2:56:00", "throughput": 2313.86, "total_tokens": 14285264} {"current_steps": 24775, "total_steps": 67140, "loss": 0.7386, "lr": 3.976583393050151e-05, "epoch": 3.6900506404527853, "percentage": 36.9, "elapsed_time": "1:42:54", "remaining_time": "2:55:59", "throughput": 2313.91, "total_tokens": 14288240} {"current_steps": 24780, "total_steps": 67140, "loss": 0.6211, "lr": 3.976058925505807e-05, "epoch": 3.6907953529937445, "percentage": 36.91, "elapsed_time": "1:42:56", "remaining_time": "2:55:57", "throughput": 2313.95, "total_tokens": 14291088} {"current_steps": 24785, "total_steps": 67140, "loss": 0.699, "lr": 3.975534358215403e-05, "epoch": 3.6915400655347037, "percentage": 36.92, "elapsed_time": "1:42:57", "remaining_time": "2:55:56", "throughput": 2314.03, "total_tokens": 14294384} {"current_steps": 24790, "total_steps": 67140, "loss": 0.6197, "lr": 3.9750096912143855e-05, "epoch": 3.692284778075663, "percentage": 36.92, "elapsed_time": "1:42:58", "remaining_time": "2:55:54", "throughput": 2314.07, "total_tokens": 14297232} {"current_steps": 24795, "total_steps": 67140, "loss": 0.6416, "lr": 3.97448492453821e-05, "epoch": 3.693029490616622, "percentage": 36.93, "elapsed_time": "1:42:59", "remaining_time": "2:55:53", "throughput": 2314.13, "total_tokens": 14300336} {"current_steps": 24800, "total_steps": 67140, "loss": 0.8815, "lr": 3.973960058222339e-05, "epoch": 3.6937742031575813, "percentage": 36.94, "elapsed_time": "1:43:00", "remaining_time": "2:55:52", "throughput": 2314.16, "total_tokens": 14303088} {"current_steps": 24805, "total_steps": 67140, "loss": 0.5211, "lr": 3.973435092302239e-05, "epoch": 3.6945189156985405, "percentage": 36.95, "elapsed_time": "1:43:01", "remaining_time": "2:55:50", "throughput": 2314.18, "total_tokens": 14305744} {"current_steps": 24810, "total_steps": 67140, "loss": 0.6987, "lr": 3.972910026813387e-05, "epoch": 3.6952636282394993, "percentage": 36.95, "elapsed_time": "1:43:02", "remaining_time": "2:55:49", "throughput": 2314.25, "total_tokens": 14308912} {"current_steps": 24815, "total_steps": 67140, "loss": 0.5181, "lr": 3.972384861791263e-05, "epoch": 3.696008340780459, "percentage": 36.96, "elapsed_time": "1:43:04", "remaining_time": "2:55:47", "throughput": 2314.29, "total_tokens": 14311792} {"current_steps": 24820, "total_steps": 67140, "loss": 0.578, "lr": 3.971859597271357e-05, "epoch": 3.6967530533214177, "percentage": 36.97, "elapsed_time": "1:43:05", "remaining_time": "2:55:46", "throughput": 2314.3, "total_tokens": 14314416} {"current_steps": 24825, "total_steps": 67140, "loss": 0.6452, "lr": 3.9713342332891625e-05, "epoch": 3.6974977658623773, "percentage": 36.97, "elapsed_time": "1:43:06", "remaining_time": "2:55:44", "throughput": 2314.35, "total_tokens": 14317328} {"current_steps": 24830, "total_steps": 67140, "loss": 0.6244, "lr": 3.9708087698801834e-05, "epoch": 3.698242478403336, "percentage": 36.98, "elapsed_time": "1:43:07", "remaining_time": "2:55:43", "throughput": 2314.38, "total_tokens": 14320144} {"current_steps": 24835, "total_steps": 67140, "loss": 0.5892, "lr": 3.9702832070799265e-05, "epoch": 3.6989871909442957, "percentage": 36.99, "elapsed_time": "1:43:08", "remaining_time": "2:55:41", "throughput": 2314.42, "total_tokens": 14323024} {"current_steps": 24840, "total_steps": 67140, "loss": 0.6132, "lr": 3.969757544923909e-05, "epoch": 3.6997319034852545, "percentage": 37.0, "elapsed_time": "1:43:09", "remaining_time": "2:55:40", "throughput": 2314.42, "total_tokens": 14325520} {"current_steps": 24845, "total_steps": 67140, "loss": 0.5734, "lr": 3.969231783447652e-05, "epoch": 3.700476616026214, "percentage": 37.0, "elapsed_time": "1:43:10", "remaining_time": "2:55:39", "throughput": 2314.48, "total_tokens": 14328624} {"current_steps": 24850, "total_steps": 67140, "loss": 0.4622, "lr": 3.9687059226866854e-05, "epoch": 3.701221328567173, "percentage": 37.01, "elapsed_time": "1:43:11", "remaining_time": "2:55:37", "throughput": 2314.51, "total_tokens": 14331312} {"current_steps": 24855, "total_steps": 67140, "loss": 0.7431, "lr": 3.9681799626765425e-05, "epoch": 3.701966041108132, "percentage": 37.02, "elapsed_time": "1:43:13", "remaining_time": "2:55:36", "throughput": 2314.55, "total_tokens": 14334256} {"current_steps": 24860, "total_steps": 67140, "loss": 0.6902, "lr": 3.9676539034527684e-05, "epoch": 3.7027107536490913, "percentage": 37.03, "elapsed_time": "1:43:14", "remaining_time": "2:55:34", "throughput": 2314.64, "total_tokens": 14337552} {"current_steps": 24865, "total_steps": 67140, "loss": 0.7836, "lr": 3.9671277450509094e-05, "epoch": 3.7034554661900505, "percentage": 37.03, "elapsed_time": "1:43:15", "remaining_time": "2:55:33", "throughput": 2314.68, "total_tokens": 14340432} {"current_steps": 24870, "total_steps": 67140, "loss": 0.6116, "lr": 3.9666014875065226e-05, "epoch": 3.7042001787310097, "percentage": 37.04, "elapsed_time": "1:43:16", "remaining_time": "2:55:31", "throughput": 2314.74, "total_tokens": 14343504} {"current_steps": 24875, "total_steps": 67140, "loss": 0.658, "lr": 3.9660751308551705e-05, "epoch": 3.704944891271969, "percentage": 37.05, "elapsed_time": "1:43:17", "remaining_time": "2:55:30", "throughput": 2314.77, "total_tokens": 14346224} {"current_steps": 24880, "total_steps": 67140, "loss": 0.5477, "lr": 3.965548675132421e-05, "epoch": 3.705689603812928, "percentage": 37.06, "elapsed_time": "1:43:18", "remaining_time": "2:55:29", "throughput": 2314.85, "total_tokens": 14349520} {"current_steps": 24885, "total_steps": 67140, "loss": 0.8209, "lr": 3.96502212037385e-05, "epoch": 3.7064343163538873, "percentage": 37.06, "elapsed_time": "1:43:20", "remaining_time": "2:55:27", "throughput": 2314.92, "total_tokens": 14352624} {"current_steps": 24890, "total_steps": 67140, "loss": 0.6101, "lr": 3.964495466615042e-05, "epoch": 3.7071790288948465, "percentage": 37.07, "elapsed_time": "1:43:21", "remaining_time": "2:55:26", "throughput": 2314.94, "total_tokens": 14355344} {"current_steps": 24895, "total_steps": 67140, "loss": 0.6466, "lr": 3.963968713891584e-05, "epoch": 3.7079237414358057, "percentage": 37.08, "elapsed_time": "1:43:22", "remaining_time": "2:55:24", "throughput": 2314.97, "total_tokens": 14358160} {"current_steps": 24900, "total_steps": 67140, "loss": 0.6036, "lr": 3.9634418622390727e-05, "epoch": 3.708668453976765, "percentage": 37.09, "elapsed_time": "1:43:23", "remaining_time": "2:55:23", "throughput": 2315.01, "total_tokens": 14361008} {"current_steps": 24905, "total_steps": 67140, "loss": 0.735, "lr": 3.9629149116931086e-05, "epoch": 3.709413166517724, "percentage": 37.09, "elapsed_time": "1:43:24", "remaining_time": "2:55:21", "throughput": 2315.04, "total_tokens": 14363824} {"current_steps": 24910, "total_steps": 67140, "loss": 0.666, "lr": 3.962387862289304e-05, "epoch": 3.7101578790586833, "percentage": 37.1, "elapsed_time": "1:43:25", "remaining_time": "2:55:20", "throughput": 2315.1, "total_tokens": 14366928} {"current_steps": 24915, "total_steps": 67140, "loss": 0.6158, "lr": 3.9618607140632724e-05, "epoch": 3.7109025915996425, "percentage": 37.11, "elapsed_time": "1:43:26", "remaining_time": "2:55:19", "throughput": 2315.14, "total_tokens": 14369776} {"current_steps": 24920, "total_steps": 67140, "loss": 0.5559, "lr": 3.9613334670506384e-05, "epoch": 3.7116473041406017, "percentage": 37.12, "elapsed_time": "1:43:28", "remaining_time": "2:55:17", "throughput": 2315.18, "total_tokens": 14372688} {"current_steps": 24925, "total_steps": 67140, "loss": 0.6498, "lr": 3.9608061212870294e-05, "epoch": 3.712392016681561, "percentage": 37.12, "elapsed_time": "1:43:29", "remaining_time": "2:55:16", "throughput": 2315.22, "total_tokens": 14375568} {"current_steps": 24930, "total_steps": 67140, "loss": 0.5951, "lr": 3.960278676808082e-05, "epoch": 3.71313672922252, "percentage": 37.13, "elapsed_time": "1:43:30", "remaining_time": "2:55:14", "throughput": 2315.24, "total_tokens": 14378224} {"current_steps": 24935, "total_steps": 67140, "loss": 0.8287, "lr": 3.959751133649439e-05, "epoch": 3.7138814417634793, "percentage": 37.14, "elapsed_time": "1:43:31", "remaining_time": "2:55:13", "throughput": 2315.26, "total_tokens": 14380944} {"current_steps": 24940, "total_steps": 67140, "loss": 0.5997, "lr": 3.959223491846749e-05, "epoch": 3.7146261543044385, "percentage": 37.15, "elapsed_time": "1:43:32", "remaining_time": "2:55:11", "throughput": 2315.31, "total_tokens": 14383888} {"current_steps": 24945, "total_steps": 67140, "loss": 0.8499, "lr": 3.958695751435668e-05, "epoch": 3.7153708668453977, "percentage": 37.15, "elapsed_time": "1:43:33", "remaining_time": "2:55:10", "throughput": 2315.37, "total_tokens": 14386928} {"current_steps": 24950, "total_steps": 67140, "loss": 0.5251, "lr": 3.958167912451859e-05, "epoch": 3.716115579386357, "percentage": 37.16, "elapsed_time": "1:43:34", "remaining_time": "2:55:09", "throughput": 2315.4, "total_tokens": 14389680} {"current_steps": 24955, "total_steps": 67140, "loss": 0.6896, "lr": 3.95763997493099e-05, "epoch": 3.716860291927316, "percentage": 37.17, "elapsed_time": "1:43:35", "remaining_time": "2:55:07", "throughput": 2315.45, "total_tokens": 14392656} {"current_steps": 24960, "total_steps": 67140, "loss": 0.9011, "lr": 3.95711193890874e-05, "epoch": 3.7176050044682754, "percentage": 37.18, "elapsed_time": "1:43:37", "remaining_time": "2:55:06", "throughput": 2315.47, "total_tokens": 14395408} {"current_steps": 24965, "total_steps": 67140, "loss": 0.6879, "lr": 3.956583804420787e-05, "epoch": 3.7183497170092346, "percentage": 37.18, "elapsed_time": "1:43:38", "remaining_time": "2:55:04", "throughput": 2315.55, "total_tokens": 14398640} {"current_steps": 24970, "total_steps": 67140, "loss": 0.7332, "lr": 3.9560555715028235e-05, "epoch": 3.7190944295501938, "percentage": 37.19, "elapsed_time": "1:43:39", "remaining_time": "2:55:03", "throughput": 2315.63, "total_tokens": 14401936} {"current_steps": 24975, "total_steps": 67140, "loss": 0.6144, "lr": 3.9555272401905445e-05, "epoch": 3.719839142091153, "percentage": 37.2, "elapsed_time": "1:43:40", "remaining_time": "2:55:02", "throughput": 2315.67, "total_tokens": 14404784} {"current_steps": 24980, "total_steps": 67140, "loss": 0.5677, "lr": 3.9549988105196525e-05, "epoch": 3.720583854632112, "percentage": 37.21, "elapsed_time": "1:43:41", "remaining_time": "2:55:00", "throughput": 2315.71, "total_tokens": 14407728} {"current_steps": 24985, "total_steps": 67140, "loss": 0.7363, "lr": 3.954470282525856e-05, "epoch": 3.721328567173071, "percentage": 37.21, "elapsed_time": "1:43:42", "remaining_time": "2:54:59", "throughput": 2315.74, "total_tokens": 14410544} {"current_steps": 24990, "total_steps": 67140, "loss": 0.6217, "lr": 3.9539416562448715e-05, "epoch": 3.7220732797140306, "percentage": 37.22, "elapsed_time": "1:43:44", "remaining_time": "2:54:57", "throughput": 2315.79, "total_tokens": 14413520} {"current_steps": 24995, "total_steps": 67140, "loss": 0.5948, "lr": 3.953412931712421e-05, "epoch": 3.7228179922549893, "percentage": 37.23, "elapsed_time": "1:43:45", "remaining_time": "2:54:56", "throughput": 2315.84, "total_tokens": 14416464} {"current_steps": 25000, "total_steps": 67140, "loss": 0.6115, "lr": 3.952884108964234e-05, "epoch": 3.723562704795949, "percentage": 37.24, "elapsed_time": "1:43:46", "remaining_time": "2:54:55", "throughput": 2315.87, "total_tokens": 14419216} {"current_steps": 25005, "total_steps": 67140, "loss": 0.6722, "lr": 3.952355188036046e-05, "epoch": 3.7243074173369077, "percentage": 37.24, "elapsed_time": "1:43:47", "remaining_time": "2:54:53", "throughput": 2315.9, "total_tokens": 14422032} {"current_steps": 25010, "total_steps": 67140, "loss": 0.6319, "lr": 3.9518261689635995e-05, "epoch": 3.7250521298778674, "percentage": 37.25, "elapsed_time": "1:43:48", "remaining_time": "2:54:52", "throughput": 2315.9, "total_tokens": 14424592} {"current_steps": 25015, "total_steps": 67140, "loss": 0.7375, "lr": 3.951297051782643e-05, "epoch": 3.725796842418826, "percentage": 37.26, "elapsed_time": "1:43:49", "remaining_time": "2:54:50", "throughput": 2315.94, "total_tokens": 14427440} {"current_steps": 25020, "total_steps": 67140, "loss": 0.4483, "lr": 3.9507678365289316e-05, "epoch": 3.726541554959786, "percentage": 37.27, "elapsed_time": "1:43:50", "remaining_time": "2:54:49", "throughput": 2316.02, "total_tokens": 14430704} {"current_steps": 25025, "total_steps": 67140, "loss": 0.8261, "lr": 3.950238523238229e-05, "epoch": 3.7272862675007445, "percentage": 37.27, "elapsed_time": "1:43:51", "remaining_time": "2:54:47", "throughput": 2316.06, "total_tokens": 14433616} {"current_steps": 25030, "total_steps": 67140, "loss": 0.6503, "lr": 3.949709111946303e-05, "epoch": 3.7280309800417037, "percentage": 37.28, "elapsed_time": "1:43:53", "remaining_time": "2:54:46", "throughput": 2316.08, "total_tokens": 14436336} {"current_steps": 25035, "total_steps": 67140, "loss": 0.6095, "lr": 3.949179602688928e-05, "epoch": 3.728775692582663, "percentage": 37.29, "elapsed_time": "1:43:54", "remaining_time": "2:54:44", "throughput": 2316.11, "total_tokens": 14439088} {"current_steps": 25040, "total_steps": 67140, "loss": 0.6655, "lr": 3.9486499955018893e-05, "epoch": 3.729520405123622, "percentage": 37.3, "elapsed_time": "1:43:55", "remaining_time": "2:54:43", "throughput": 2316.15, "total_tokens": 14442032} {"current_steps": 25045, "total_steps": 67140, "loss": 0.5979, "lr": 3.948120290420973e-05, "epoch": 3.7302651176645814, "percentage": 37.3, "elapsed_time": "1:43:56", "remaining_time": "2:54:42", "throughput": 2316.23, "total_tokens": 14445296} {"current_steps": 25050, "total_steps": 67140, "loss": 0.5142, "lr": 3.947590487481975e-05, "epoch": 3.7310098302055406, "percentage": 37.31, "elapsed_time": "1:43:57", "remaining_time": "2:54:40", "throughput": 2316.25, "total_tokens": 14447952} {"current_steps": 25055, "total_steps": 67140, "loss": 0.8159, "lr": 3.9470605867206976e-05, "epoch": 3.7317545427464998, "percentage": 37.32, "elapsed_time": "1:43:58", "remaining_time": "2:54:39", "throughput": 2316.28, "total_tokens": 14450672} {"current_steps": 25060, "total_steps": 67140, "loss": 0.527, "lr": 3.946530588172949e-05, "epoch": 3.732499255287459, "percentage": 37.32, "elapsed_time": "1:43:59", "remaining_time": "2:54:37", "throughput": 2316.34, "total_tokens": 14453744} {"current_steps": 25065, "total_steps": 67140, "loss": 0.8719, "lr": 3.946000491874544e-05, "epoch": 3.733243967828418, "percentage": 37.33, "elapsed_time": "1:44:01", "remaining_time": "2:54:36", "throughput": 2316.37, "total_tokens": 14456592} {"current_steps": 25070, "total_steps": 67140, "loss": 0.4947, "lr": 3.945470297861305e-05, "epoch": 3.7339886803693774, "percentage": 37.34, "elapsed_time": "1:44:02", "remaining_time": "2:54:35", "throughput": 2316.42, "total_tokens": 14459472} {"current_steps": 25075, "total_steps": 67140, "loss": 0.5909, "lr": 3.94494000616906e-05, "epoch": 3.7347333929103366, "percentage": 37.35, "elapsed_time": "1:44:03", "remaining_time": "2:54:33", "throughput": 2316.45, "total_tokens": 14462352} {"current_steps": 25080, "total_steps": 67140, "loss": 0.7091, "lr": 3.944409616833645e-05, "epoch": 3.7354781054512958, "percentage": 37.35, "elapsed_time": "1:44:04", "remaining_time": "2:54:32", "throughput": 2316.5, "total_tokens": 14465264} {"current_steps": 25085, "total_steps": 67140, "loss": 1.0465, "lr": 3.9438791298909e-05, "epoch": 3.736222817992255, "percentage": 37.36, "elapsed_time": "1:44:05", "remaining_time": "2:54:30", "throughput": 2316.54, "total_tokens": 14468176} {"current_steps": 25090, "total_steps": 67140, "loss": 0.7031, "lr": 3.943348545376673e-05, "epoch": 3.736967530533214, "percentage": 37.37, "elapsed_time": "1:44:06", "remaining_time": "2:54:29", "throughput": 2316.6, "total_tokens": 14471216} {"current_steps": 25095, "total_steps": 67140, "loss": 0.7158, "lr": 3.94281786332682e-05, "epoch": 3.7377122430741734, "percentage": 37.38, "elapsed_time": "1:44:07", "remaining_time": "2:54:27", "throughput": 2316.64, "total_tokens": 14474064} {"current_steps": 25100, "total_steps": 67140, "loss": 0.6795, "lr": 3.942287083777203e-05, "epoch": 3.7384569556151326, "percentage": 37.38, "elapsed_time": "1:44:08", "remaining_time": "2:54:26", "throughput": 2316.68, "total_tokens": 14476912} {"current_steps": 25105, "total_steps": 67140, "loss": 0.7147, "lr": 3.941756206763687e-05, "epoch": 3.739201668156092, "percentage": 37.39, "elapsed_time": "1:44:10", "remaining_time": "2:54:25", "throughput": 2316.72, "total_tokens": 14479824} {"current_steps": 25110, "total_steps": 67140, "loss": 0.6597, "lr": 3.9412252323221495e-05, "epoch": 3.739946380697051, "percentage": 37.4, "elapsed_time": "1:44:11", "remaining_time": "2:54:23", "throughput": 2316.76, "total_tokens": 14482672} {"current_steps": 25115, "total_steps": 67140, "loss": 0.5964, "lr": 3.94069416048847e-05, "epoch": 3.74069109323801, "percentage": 37.41, "elapsed_time": "1:44:12", "remaining_time": "2:54:22", "throughput": 2316.77, "total_tokens": 14485264} {"current_steps": 25120, "total_steps": 67140, "loss": 0.6317, "lr": 3.940162991298537e-05, "epoch": 3.7414358057789694, "percentage": 37.41, "elapsed_time": "1:44:13", "remaining_time": "2:54:20", "throughput": 2316.79, "total_tokens": 14488016} {"current_steps": 25125, "total_steps": 67140, "loss": 0.5818, "lr": 3.9396317247882444e-05, "epoch": 3.7421805183199286, "percentage": 37.42, "elapsed_time": "1:44:14", "remaining_time": "2:54:19", "throughput": 2316.82, "total_tokens": 14490768} {"current_steps": 25130, "total_steps": 67140, "loss": 0.6163, "lr": 3.939100360993492e-05, "epoch": 3.742925230860888, "percentage": 37.43, "elapsed_time": "1:44:15", "remaining_time": "2:54:17", "throughput": 2316.85, "total_tokens": 14493488} {"current_steps": 25135, "total_steps": 67140, "loss": 0.663, "lr": 3.938568899950188e-05, "epoch": 3.743669943401847, "percentage": 37.44, "elapsed_time": "1:44:16", "remaining_time": "2:54:16", "throughput": 2316.89, "total_tokens": 14496432} {"current_steps": 25140, "total_steps": 67140, "loss": 0.5308, "lr": 3.9380373416942474e-05, "epoch": 3.744414655942806, "percentage": 37.44, "elapsed_time": "1:44:17", "remaining_time": "2:54:14", "throughput": 2316.96, "total_tokens": 14499504} {"current_steps": 25145, "total_steps": 67140, "loss": 0.5941, "lr": 3.93750568626159e-05, "epoch": 3.7451593684837654, "percentage": 37.45, "elapsed_time": "1:44:19", "remaining_time": "2:54:13", "throughput": 2316.96, "total_tokens": 14502096} {"current_steps": 25150, "total_steps": 67140, "loss": 0.5805, "lr": 3.9369739336881426e-05, "epoch": 3.7459040810247246, "percentage": 37.46, "elapsed_time": "1:44:20", "remaining_time": "2:54:11", "throughput": 2317.0, "total_tokens": 14504912} {"current_steps": 25155, "total_steps": 67140, "loss": 0.6475, "lr": 3.936442084009839e-05, "epoch": 3.746648793565684, "percentage": 37.47, "elapsed_time": "1:44:21", "remaining_time": "2:54:10", "throughput": 2317.02, "total_tokens": 14507664} {"current_steps": 25160, "total_steps": 67140, "loss": 0.694, "lr": 3.9359101372626195e-05, "epoch": 3.7473935061066426, "percentage": 37.47, "elapsed_time": "1:44:22", "remaining_time": "2:54:09", "throughput": 2317.08, "total_tokens": 14510704} {"current_steps": 25165, "total_steps": 67140, "loss": 0.5927, "lr": 3.935378093482431e-05, "epoch": 3.748138218647602, "percentage": 37.48, "elapsed_time": "1:44:23", "remaining_time": "2:54:07", "throughput": 2317.12, "total_tokens": 14513584} {"current_steps": 25170, "total_steps": 67140, "loss": 0.5145, "lr": 3.9348459527052264e-05, "epoch": 3.748882931188561, "percentage": 37.49, "elapsed_time": "1:44:24", "remaining_time": "2:54:06", "throughput": 2317.17, "total_tokens": 14516528} {"current_steps": 25175, "total_steps": 67140, "loss": 0.5557, "lr": 3.9343137149669665e-05, "epoch": 3.7496276437295206, "percentage": 37.5, "elapsed_time": "1:44:25", "remaining_time": "2:54:04", "throughput": 2317.24, "total_tokens": 14519696} {"current_steps": 25180, "total_steps": 67140, "loss": 0.8125, "lr": 3.933781380303617e-05, "epoch": 3.7503723562704794, "percentage": 37.5, "elapsed_time": "1:44:27", "remaining_time": "2:54:03", "throughput": 2317.3, "total_tokens": 14522800} {"current_steps": 25185, "total_steps": 67140, "loss": 0.6036, "lr": 3.933248948751151e-05, "epoch": 3.751117068811439, "percentage": 37.51, "elapsed_time": "1:44:28", "remaining_time": "2:54:02", "throughput": 2317.35, "total_tokens": 14525712} {"current_steps": 25190, "total_steps": 67140, "loss": 0.6462, "lr": 3.932716420345548e-05, "epoch": 3.751861781352398, "percentage": 37.52, "elapsed_time": "1:44:29", "remaining_time": "2:54:00", "throughput": 2317.4, "total_tokens": 14528688} {"current_steps": 25195, "total_steps": 67140, "loss": 0.5836, "lr": 3.932183795122795e-05, "epoch": 3.7526064938933574, "percentage": 37.53, "elapsed_time": "1:44:30", "remaining_time": "2:53:59", "throughput": 2317.49, "total_tokens": 14532016} {"current_steps": 25200, "total_steps": 67140, "loss": 0.5945, "lr": 3.931651073118884e-05, "epoch": 3.753351206434316, "percentage": 37.53, "elapsed_time": "1:44:31", "remaining_time": "2:53:57", "throughput": 2317.56, "total_tokens": 14535152} {"current_steps": 25205, "total_steps": 67140, "loss": 0.6686, "lr": 3.931118254369813e-05, "epoch": 3.7540959189752754, "percentage": 37.54, "elapsed_time": "1:44:32", "remaining_time": "2:53:56", "throughput": 2317.59, "total_tokens": 14537968} {"current_steps": 25210, "total_steps": 67140, "loss": 0.8965, "lr": 3.93058533891159e-05, "epoch": 3.7548406315162346, "percentage": 37.55, "elapsed_time": "1:44:33", "remaining_time": "2:53:55", "throughput": 2317.62, "total_tokens": 14540688} {"current_steps": 25215, "total_steps": 67140, "loss": 0.6049, "lr": 3.930052326780225e-05, "epoch": 3.755585344057194, "percentage": 37.56, "elapsed_time": "1:44:35", "remaining_time": "2:53:53", "throughput": 2317.65, "total_tokens": 14543440} {"current_steps": 25220, "total_steps": 67140, "loss": 0.6841, "lr": 3.929519218011739e-05, "epoch": 3.756330056598153, "percentage": 37.56, "elapsed_time": "1:44:36", "remaining_time": "2:53:52", "throughput": 2317.69, "total_tokens": 14546352} {"current_steps": 25225, "total_steps": 67140, "loss": 0.599, "lr": 3.928986012642156e-05, "epoch": 3.757074769139112, "percentage": 37.57, "elapsed_time": "1:44:37", "remaining_time": "2:53:50", "throughput": 2317.76, "total_tokens": 14549520} {"current_steps": 25230, "total_steps": 67140, "loss": 0.7179, "lr": 3.9284527107075075e-05, "epoch": 3.7578194816800714, "percentage": 37.58, "elapsed_time": "1:44:38", "remaining_time": "2:53:49", "throughput": 2317.82, "total_tokens": 14552592} {"current_steps": 25235, "total_steps": 67140, "loss": 0.5164, "lr": 3.927919312243833e-05, "epoch": 3.7585641942210306, "percentage": 37.59, "elapsed_time": "1:44:39", "remaining_time": "2:53:48", "throughput": 2317.9, "total_tokens": 14555984} {"current_steps": 25240, "total_steps": 67140, "loss": 0.7056, "lr": 3.927385817287177e-05, "epoch": 3.75930890676199, "percentage": 37.59, "elapsed_time": "1:44:40", "remaining_time": "2:53:46", "throughput": 2317.94, "total_tokens": 14558800} {"current_steps": 25245, "total_steps": 67140, "loss": 0.6105, "lr": 3.926852225873591e-05, "epoch": 3.760053619302949, "percentage": 37.6, "elapsed_time": "1:44:42", "remaining_time": "2:53:45", "throughput": 2317.97, "total_tokens": 14561584} {"current_steps": 25250, "total_steps": 67140, "loss": 0.6958, "lr": 3.926318538039132e-05, "epoch": 3.760798331843908, "percentage": 37.61, "elapsed_time": "1:44:43", "remaining_time": "2:53:43", "throughput": 2318.02, "total_tokens": 14564656} {"current_steps": 25255, "total_steps": 67140, "loss": 0.7751, "lr": 3.9257847538198654e-05, "epoch": 3.7615430443848674, "percentage": 37.62, "elapsed_time": "1:44:44", "remaining_time": "2:53:42", "throughput": 2318.07, "total_tokens": 14567632} {"current_steps": 25260, "total_steps": 67140, "loss": 0.6453, "lr": 3.9252508732518625e-05, "epoch": 3.7622877569258266, "percentage": 37.62, "elapsed_time": "1:44:45", "remaining_time": "2:53:41", "throughput": 2318.12, "total_tokens": 14570544} {"current_steps": 25265, "total_steps": 67140, "loss": 0.7019, "lr": 3.9247168963712e-05, "epoch": 3.763032469466786, "percentage": 37.63, "elapsed_time": "1:44:46", "remaining_time": "2:53:39", "throughput": 2318.17, "total_tokens": 14573520} {"current_steps": 25270, "total_steps": 67140, "loss": 0.6061, "lr": 3.924182823213962e-05, "epoch": 3.763777182007745, "percentage": 37.64, "elapsed_time": "1:44:47", "remaining_time": "2:53:38", "throughput": 2318.22, "total_tokens": 14576496} {"current_steps": 25275, "total_steps": 67140, "loss": 0.6044, "lr": 3.923648653816239e-05, "epoch": 3.7645218945487042, "percentage": 37.65, "elapsed_time": "1:44:48", "remaining_time": "2:53:36", "throughput": 2318.23, "total_tokens": 14579120} {"current_steps": 25280, "total_steps": 67140, "loss": 0.5841, "lr": 3.923114388214128e-05, "epoch": 3.7652666070896634, "percentage": 37.65, "elapsed_time": "1:44:50", "remaining_time": "2:53:35", "throughput": 2318.27, "total_tokens": 14582000} {"current_steps": 25285, "total_steps": 67140, "loss": 0.5814, "lr": 3.922580026443733e-05, "epoch": 3.7660113196306226, "percentage": 37.66, "elapsed_time": "1:44:51", "remaining_time": "2:53:33", "throughput": 2318.29, "total_tokens": 14584784} {"current_steps": 25290, "total_steps": 67140, "loss": 0.7267, "lr": 3.922045568541164e-05, "epoch": 3.766756032171582, "percentage": 37.67, "elapsed_time": "1:44:52", "remaining_time": "2:53:32", "throughput": 2318.33, "total_tokens": 14587600} {"current_steps": 25295, "total_steps": 67140, "loss": 0.5267, "lr": 3.921511014542536e-05, "epoch": 3.767500744712541, "percentage": 37.68, "elapsed_time": "1:44:53", "remaining_time": "2:53:31", "throughput": 2318.38, "total_tokens": 14590640} {"current_steps": 25300, "total_steps": 67140, "loss": 0.5832, "lr": 3.9209763644839736e-05, "epoch": 3.7682454572535002, "percentage": 37.68, "elapsed_time": "1:44:54", "remaining_time": "2:53:29", "throughput": 2318.4, "total_tokens": 14593360} {"current_steps": 25305, "total_steps": 67140, "loss": 0.5481, "lr": 3.9204416184016055e-05, "epoch": 3.7689901697944594, "percentage": 37.69, "elapsed_time": "1:44:55", "remaining_time": "2:53:28", "throughput": 2318.47, "total_tokens": 14596496} {"current_steps": 25310, "total_steps": 67140, "loss": 0.6551, "lr": 3.9199067763315685e-05, "epoch": 3.7697348823354186, "percentage": 37.7, "elapsed_time": "1:44:56", "remaining_time": "2:53:26", "throughput": 2318.54, "total_tokens": 14599664} {"current_steps": 25315, "total_steps": 67140, "loss": 0.7168, "lr": 3.919371838310004e-05, "epoch": 3.770479594876378, "percentage": 37.7, "elapsed_time": "1:44:58", "remaining_time": "2:53:25", "throughput": 2318.58, "total_tokens": 14602640} {"current_steps": 25320, "total_steps": 67140, "loss": 0.5622, "lr": 3.9188368043730615e-05, "epoch": 3.771224307417337, "percentage": 37.71, "elapsed_time": "1:44:59", "remaining_time": "2:53:24", "throughput": 2318.66, "total_tokens": 14605936} {"current_steps": 25325, "total_steps": 67140, "loss": 0.7481, "lr": 3.918301674556897e-05, "epoch": 3.7719690199582963, "percentage": 37.72, "elapsed_time": "1:45:00", "remaining_time": "2:53:22", "throughput": 2318.68, "total_tokens": 14608592} {"current_steps": 25330, "total_steps": 67140, "loss": 0.5524, "lr": 3.917766448897671e-05, "epoch": 3.7727137324992555, "percentage": 37.73, "elapsed_time": "1:45:01", "remaining_time": "2:53:21", "throughput": 2318.72, "total_tokens": 14611440} {"current_steps": 25335, "total_steps": 67140, "loss": 0.6722, "lr": 3.917231127431552e-05, "epoch": 3.773458445040214, "percentage": 37.73, "elapsed_time": "1:45:02", "remaining_time": "2:53:19", "throughput": 2318.77, "total_tokens": 14614448} {"current_steps": 25340, "total_steps": 67140, "loss": 0.6465, "lr": 3.9166957101947166e-05, "epoch": 3.774203157581174, "percentage": 37.74, "elapsed_time": "1:45:03", "remaining_time": "2:53:18", "throughput": 2318.81, "total_tokens": 14617328} {"current_steps": 25345, "total_steps": 67140, "loss": 0.7106, "lr": 3.916160197223344e-05, "epoch": 3.7749478701221326, "percentage": 37.75, "elapsed_time": "1:45:04", "remaining_time": "2:53:17", "throughput": 2318.87, "total_tokens": 14620400} {"current_steps": 25350, "total_steps": 67140, "loss": 0.4987, "lr": 3.915624588553624e-05, "epoch": 3.7756925826630923, "percentage": 37.76, "elapsed_time": "1:45:06", "remaining_time": "2:53:15", "throughput": 2318.88, "total_tokens": 14622960} {"current_steps": 25355, "total_steps": 67140, "loss": 0.5784, "lr": 3.915088884221749e-05, "epoch": 3.776437295204051, "percentage": 37.76, "elapsed_time": "1:45:07", "remaining_time": "2:53:14", "throughput": 2318.89, "total_tokens": 14625648} {"current_steps": 25360, "total_steps": 67140, "loss": 0.5915, "lr": 3.914553084263921e-05, "epoch": 3.7771820077450107, "percentage": 37.77, "elapsed_time": "1:45:08", "remaining_time": "2:53:12", "throughput": 2318.9, "total_tokens": 14628208} {"current_steps": 25365, "total_steps": 67140, "loss": 0.6269, "lr": 3.914017188716347e-05, "epoch": 3.7779267202859694, "percentage": 37.78, "elapsed_time": "1:45:09", "remaining_time": "2:53:11", "throughput": 2318.94, "total_tokens": 14631088} {"current_steps": 25370, "total_steps": 67140, "loss": 0.6809, "lr": 3.9134811976152393e-05, "epoch": 3.778671432826929, "percentage": 37.79, "elapsed_time": "1:45:10", "remaining_time": "2:53:09", "throughput": 2318.97, "total_tokens": 14633872} {"current_steps": 25375, "total_steps": 67140, "loss": 0.5529, "lr": 3.91294511099682e-05, "epoch": 3.779416145367888, "percentage": 37.79, "elapsed_time": "1:45:11", "remaining_time": "2:53:08", "throughput": 2318.99, "total_tokens": 14636528} {"current_steps": 25380, "total_steps": 67140, "loss": 0.5575, "lr": 3.912408928897314e-05, "epoch": 3.780160857908847, "percentage": 37.8, "elapsed_time": "1:45:12", "remaining_time": "2:53:06", "throughput": 2319.0, "total_tokens": 14639248} {"current_steps": 25385, "total_steps": 67140, "loss": 0.7118, "lr": 3.911872651352956e-05, "epoch": 3.7809055704498062, "percentage": 37.81, "elapsed_time": "1:45:13", "remaining_time": "2:53:05", "throughput": 2319.06, "total_tokens": 14642288} {"current_steps": 25390, "total_steps": 67140, "loss": 0.6249, "lr": 3.911336278399984e-05, "epoch": 3.7816502829907654, "percentage": 37.82, "elapsed_time": "1:45:15", "remaining_time": "2:53:04", "throughput": 2319.12, "total_tokens": 14645328} {"current_steps": 25395, "total_steps": 67140, "loss": 0.6896, "lr": 3.9107998100746444e-05, "epoch": 3.7823949955317246, "percentage": 37.82, "elapsed_time": "1:45:16", "remaining_time": "2:53:02", "throughput": 2319.16, "total_tokens": 14648208} {"current_steps": 25400, "total_steps": 67140, "loss": 0.6481, "lr": 3.9102632464131895e-05, "epoch": 3.783139708072684, "percentage": 37.83, "elapsed_time": "1:45:17", "remaining_time": "2:53:01", "throughput": 2319.17, "total_tokens": 14650864} {"current_steps": 25405, "total_steps": 67140, "loss": 0.6315, "lr": 3.909726587451878e-05, "epoch": 3.783884420613643, "percentage": 37.84, "elapsed_time": "1:45:18", "remaining_time": "2:52:59", "throughput": 2319.2, "total_tokens": 14653616} {"current_steps": 25410, "total_steps": 67140, "loss": 0.6209, "lr": 3.9091898332269746e-05, "epoch": 3.7846291331546023, "percentage": 37.85, "elapsed_time": "1:45:19", "remaining_time": "2:52:58", "throughput": 2319.28, "total_tokens": 14656848} {"current_steps": 25415, "total_steps": 67140, "loss": 0.6255, "lr": 3.908652983774753e-05, "epoch": 3.7853738456955615, "percentage": 37.85, "elapsed_time": "1:45:20", "remaining_time": "2:52:57", "throughput": 2319.3, "total_tokens": 14659632} {"current_steps": 25420, "total_steps": 67140, "loss": 0.5926, "lr": 3.908116039131489e-05, "epoch": 3.7861185582365207, "percentage": 37.86, "elapsed_time": "1:45:21", "remaining_time": "2:52:55", "throughput": 2319.33, "total_tokens": 14662448} {"current_steps": 25425, "total_steps": 67140, "loss": 0.5053, "lr": 3.9075789993334686e-05, "epoch": 3.78686327077748, "percentage": 37.87, "elapsed_time": "1:45:22", "remaining_time": "2:52:54", "throughput": 2319.35, "total_tokens": 14665168} {"current_steps": 25430, "total_steps": 67140, "loss": 0.7472, "lr": 3.907041864416982e-05, "epoch": 3.787607983318439, "percentage": 37.88, "elapsed_time": "1:45:24", "remaining_time": "2:52:52", "throughput": 2319.4, "total_tokens": 14668112} {"current_steps": 25435, "total_steps": 67140, "loss": 0.7781, "lr": 3.9065046344183265e-05, "epoch": 3.7883526958593983, "percentage": 37.88, "elapsed_time": "1:45:25", "remaining_time": "2:52:51", "throughput": 2319.42, "total_tokens": 14670832} {"current_steps": 25440, "total_steps": 67140, "loss": 0.6668, "lr": 3.905967309373806e-05, "epoch": 3.7890974084003575, "percentage": 37.89, "elapsed_time": "1:45:26", "remaining_time": "2:52:49", "throughput": 2319.45, "total_tokens": 14673552} {"current_steps": 25445, "total_steps": 67140, "loss": 0.5205, "lr": 3.905429889319732e-05, "epoch": 3.7898421209413167, "percentage": 37.9, "elapsed_time": "1:45:27", "remaining_time": "2:52:48", "throughput": 2319.47, "total_tokens": 14676304} {"current_steps": 25450, "total_steps": 67140, "loss": 0.6522, "lr": 3.904892374292419e-05, "epoch": 3.790586833482276, "percentage": 37.91, "elapsed_time": "1:45:28", "remaining_time": "2:52:46", "throughput": 2319.52, "total_tokens": 14679280} {"current_steps": 25455, "total_steps": 67140, "loss": 0.7557, "lr": 3.904354764328192e-05, "epoch": 3.791331546023235, "percentage": 37.91, "elapsed_time": "1:45:29", "remaining_time": "2:52:45", "throughput": 2319.59, "total_tokens": 14682448} {"current_steps": 25460, "total_steps": 67140, "loss": 0.6408, "lr": 3.903817059463379e-05, "epoch": 3.7920762585641943, "percentage": 37.92, "elapsed_time": "1:45:30", "remaining_time": "2:52:44", "throughput": 2319.62, "total_tokens": 14685296} {"current_steps": 25465, "total_steps": 67140, "loss": 0.7299, "lr": 3.903279259734318e-05, "epoch": 3.7928209711051535, "percentage": 37.93, "elapsed_time": "1:45:32", "remaining_time": "2:52:42", "throughput": 2319.66, "total_tokens": 14688208} {"current_steps": 25470, "total_steps": 67140, "loss": 0.5806, "lr": 3.902741365177349e-05, "epoch": 3.7935656836461127, "percentage": 37.94, "elapsed_time": "1:45:33", "remaining_time": "2:52:41", "throughput": 2319.72, "total_tokens": 14691184} {"current_steps": 25475, "total_steps": 67140, "loss": 0.6482, "lr": 3.902203375828822e-05, "epoch": 3.794310396187072, "percentage": 37.94, "elapsed_time": "1:45:34", "remaining_time": "2:52:39", "throughput": 2319.77, "total_tokens": 14694192} {"current_steps": 25480, "total_steps": 67140, "loss": 0.5889, "lr": 3.901665291725091e-05, "epoch": 3.795055108728031, "percentage": 37.95, "elapsed_time": "1:45:35", "remaining_time": "2:52:38", "throughput": 2319.83, "total_tokens": 14697232} {"current_steps": 25485, "total_steps": 67140, "loss": 0.6686, "lr": 3.901127112902519e-05, "epoch": 3.7957998212689903, "percentage": 37.96, "elapsed_time": "1:45:36", "remaining_time": "2:52:37", "throughput": 2319.87, "total_tokens": 14700080} {"current_steps": 25490, "total_steps": 67140, "loss": 0.5472, "lr": 3.9005888393974735e-05, "epoch": 3.7965445338099495, "percentage": 37.97, "elapsed_time": "1:45:37", "remaining_time": "2:52:35", "throughput": 2319.92, "total_tokens": 14703024} {"current_steps": 25495, "total_steps": 67140, "loss": 0.6617, "lr": 3.900050471246328e-05, "epoch": 3.7972892463509087, "percentage": 37.97, "elapsed_time": "1:45:38", "remaining_time": "2:52:34", "throughput": 2319.92, "total_tokens": 14705584} {"current_steps": 25500, "total_steps": 67140, "loss": 0.5878, "lr": 3.899512008485464e-05, "epoch": 3.798033958891868, "percentage": 37.98, "elapsed_time": "1:45:39", "remaining_time": "2:52:32", "throughput": 2319.96, "total_tokens": 14708432} {"current_steps": 25505, "total_steps": 67140, "loss": 0.5614, "lr": 3.898973451151269e-05, "epoch": 3.798778671432827, "percentage": 37.99, "elapsed_time": "1:45:41", "remaining_time": "2:52:31", "throughput": 2319.97, "total_tokens": 14711024} {"current_steps": 25510, "total_steps": 67140, "loss": 0.5472, "lr": 3.8984347992801355e-05, "epoch": 3.799523383973786, "percentage": 38.0, "elapsed_time": "1:45:42", "remaining_time": "2:52:29", "throughput": 2320.0, "total_tokens": 14713776} {"current_steps": 25515, "total_steps": 67140, "loss": 0.6577, "lr": 3.897896052908464e-05, "epoch": 3.8002680965147455, "percentage": 38.0, "elapsed_time": "1:45:43", "remaining_time": "2:52:28", "throughput": 2320.04, "total_tokens": 14716656} {"current_steps": 25520, "total_steps": 67140, "loss": 0.6372, "lr": 3.897357212072661e-05, "epoch": 3.8010128090557043, "percentage": 38.01, "elapsed_time": "1:45:44", "remaining_time": "2:52:27", "throughput": 2320.09, "total_tokens": 14719696} {"current_steps": 25525, "total_steps": 67140, "loss": 0.6762, "lr": 3.896818276809139e-05, "epoch": 3.801757521596664, "percentage": 38.02, "elapsed_time": "1:45:45", "remaining_time": "2:52:25", "throughput": 2320.14, "total_tokens": 14722608} {"current_steps": 25530, "total_steps": 67140, "loss": 0.6147, "lr": 3.896279247154316e-05, "epoch": 3.8025022341376227, "percentage": 38.03, "elapsed_time": "1:45:46", "remaining_time": "2:52:24", "throughput": 2320.18, "total_tokens": 14725520} {"current_steps": 25535, "total_steps": 67140, "loss": 0.5758, "lr": 3.8957401231446186e-05, "epoch": 3.8032469466785823, "percentage": 38.03, "elapsed_time": "1:45:47", "remaining_time": "2:52:22", "throughput": 2320.2, "total_tokens": 14728176} {"current_steps": 25540, "total_steps": 67140, "loss": 0.684, "lr": 3.895200904816478e-05, "epoch": 3.803991659219541, "percentage": 38.04, "elapsed_time": "1:45:48", "remaining_time": "2:52:21", "throughput": 2320.23, "total_tokens": 14731024} {"current_steps": 25545, "total_steps": 67140, "loss": 0.5392, "lr": 3.8946615922063334e-05, "epoch": 3.8047363717605007, "percentage": 38.05, "elapsed_time": "1:45:50", "remaining_time": "2:52:19", "throughput": 2320.26, "total_tokens": 14733808} {"current_steps": 25550, "total_steps": 67140, "loss": 0.8005, "lr": 3.894122185350629e-05, "epoch": 3.8054810843014595, "percentage": 38.05, "elapsed_time": "1:45:51", "remaining_time": "2:52:18", "throughput": 2320.33, "total_tokens": 14737040} {"current_steps": 25555, "total_steps": 67140, "loss": 0.7049, "lr": 3.8935826842858144e-05, "epoch": 3.8062257968424187, "percentage": 38.06, "elapsed_time": "1:45:52", "remaining_time": "2:52:17", "throughput": 2320.38, "total_tokens": 14740016} {"current_steps": 25560, "total_steps": 67140, "loss": 0.5628, "lr": 3.8930430890483486e-05, "epoch": 3.806970509383378, "percentage": 38.07, "elapsed_time": "1:45:53", "remaining_time": "2:52:15", "throughput": 2320.46, "total_tokens": 14743344} {"current_steps": 25565, "total_steps": 67140, "loss": 0.7269, "lr": 3.892503399674694e-05, "epoch": 3.807715221924337, "percentage": 38.08, "elapsed_time": "1:45:54", "remaining_time": "2:52:14", "throughput": 2320.49, "total_tokens": 14746096} {"current_steps": 25570, "total_steps": 67140, "loss": 0.786, "lr": 3.8919636162013216e-05, "epoch": 3.8084599344652963, "percentage": 38.08, "elapsed_time": "1:45:55", "remaining_time": "2:52:12", "throughput": 2320.53, "total_tokens": 14748976} {"current_steps": 25575, "total_steps": 67140, "loss": 0.5625, "lr": 3.8914237386647076e-05, "epoch": 3.8092046470062555, "percentage": 38.09, "elapsed_time": "1:45:56", "remaining_time": "2:52:11", "throughput": 2320.55, "total_tokens": 14751664} {"current_steps": 25580, "total_steps": 67140, "loss": 0.6377, "lr": 3.8908837671013345e-05, "epoch": 3.8099493595472147, "percentage": 38.1, "elapsed_time": "1:45:58", "remaining_time": "2:52:10", "throughput": 2320.59, "total_tokens": 14754608} {"current_steps": 25585, "total_steps": 67140, "loss": 0.6246, "lr": 3.8903437015476903e-05, "epoch": 3.810694072088174, "percentage": 38.11, "elapsed_time": "1:45:59", "remaining_time": "2:52:08", "throughput": 2320.64, "total_tokens": 14757648} {"current_steps": 25590, "total_steps": 67140, "loss": 0.7759, "lr": 3.889803542040272e-05, "epoch": 3.811438784629133, "percentage": 38.11, "elapsed_time": "1:46:00", "remaining_time": "2:52:07", "throughput": 2320.65, "total_tokens": 14760240} {"current_steps": 25595, "total_steps": 67140, "loss": 0.5495, "lr": 3.889263288615581e-05, "epoch": 3.8121834971700923, "percentage": 38.12, "elapsed_time": "1:46:01", "remaining_time": "2:52:05", "throughput": 2320.7, "total_tokens": 14763280} {"current_steps": 25600, "total_steps": 67140, "loss": 0.5418, "lr": 3.888722941310126e-05, "epoch": 3.8129282097110515, "percentage": 38.13, "elapsed_time": "1:46:02", "remaining_time": "2:52:04", "throughput": 2320.75, "total_tokens": 14766224} {"current_steps": 25605, "total_steps": 67140, "loss": 0.5541, "lr": 3.88818250016042e-05, "epoch": 3.8136729222520107, "percentage": 38.14, "elapsed_time": "1:46:03", "remaining_time": "2:52:03", "throughput": 2320.79, "total_tokens": 14769168} {"current_steps": 25610, "total_steps": 67140, "loss": 0.5807, "lr": 3.887641965202984e-05, "epoch": 3.81441763479297, "percentage": 38.14, "elapsed_time": "1:46:04", "remaining_time": "2:52:01", "throughput": 2320.86, "total_tokens": 14772240} {"current_steps": 25615, "total_steps": 67140, "loss": 0.6265, "lr": 3.887101336474346e-05, "epoch": 3.815162347333929, "percentage": 38.15, "elapsed_time": "1:46:06", "remaining_time": "2:52:00", "throughput": 2320.88, "total_tokens": 14774992} {"current_steps": 25620, "total_steps": 67140, "loss": 0.7103, "lr": 3.88656061401104e-05, "epoch": 3.8159070598748883, "percentage": 38.16, "elapsed_time": "1:46:07", "remaining_time": "2:51:58", "throughput": 2320.94, "total_tokens": 14778000} {"current_steps": 25625, "total_steps": 67140, "loss": 0.6319, "lr": 3.886019797849605e-05, "epoch": 3.8166517724158475, "percentage": 38.17, "elapsed_time": "1:46:08", "remaining_time": "2:51:57", "throughput": 2320.98, "total_tokens": 14780912} {"current_steps": 25630, "total_steps": 67140, "loss": 0.4918, "lr": 3.8854788880265865e-05, "epoch": 3.8173964849568067, "percentage": 38.17, "elapsed_time": "1:46:09", "remaining_time": "2:51:56", "throughput": 2321.04, "total_tokens": 14783952} {"current_steps": 25635, "total_steps": 67140, "loss": 0.4873, "lr": 3.884937884578538e-05, "epoch": 3.818141197497766, "percentage": 38.18, "elapsed_time": "1:46:10", "remaining_time": "2:51:54", "throughput": 2321.07, "total_tokens": 14786768} {"current_steps": 25640, "total_steps": 67140, "loss": 0.5613, "lr": 3.884396787542017e-05, "epoch": 3.818885910038725, "percentage": 38.19, "elapsed_time": "1:46:11", "remaining_time": "2:51:53", "throughput": 2321.1, "total_tokens": 14789520} {"current_steps": 25645, "total_steps": 67140, "loss": 0.6012, "lr": 3.8838555969535915e-05, "epoch": 3.8196306225796843, "percentage": 38.2, "elapsed_time": "1:46:12", "remaining_time": "2:51:51", "throughput": 2321.18, "total_tokens": 14792752} {"current_steps": 25650, "total_steps": 67140, "loss": 0.5302, "lr": 3.8833143128498303e-05, "epoch": 3.8203753351206435, "percentage": 38.2, "elapsed_time": "1:46:14", "remaining_time": "2:51:50", "throughput": 2321.23, "total_tokens": 14795760} {"current_steps": 25655, "total_steps": 67140, "loss": 0.5914, "lr": 3.882772935267312e-05, "epoch": 3.8211200476616027, "percentage": 38.21, "elapsed_time": "1:46:15", "remaining_time": "2:51:48", "throughput": 2321.27, "total_tokens": 14798672} {"current_steps": 25660, "total_steps": 67140, "loss": 0.4233, "lr": 3.8822314642426204e-05, "epoch": 3.821864760202562, "percentage": 38.22, "elapsed_time": "1:46:16", "remaining_time": "2:51:47", "throughput": 2321.27, "total_tokens": 14801200} {"current_steps": 25665, "total_steps": 67140, "loss": 0.6018, "lr": 3.8816898998123464e-05, "epoch": 3.822609472743521, "percentage": 38.23, "elapsed_time": "1:46:17", "remaining_time": "2:51:46", "throughput": 2321.32, "total_tokens": 14804176} {"current_steps": 25670, "total_steps": 67140, "loss": 0.5883, "lr": 3.8811482420130866e-05, "epoch": 3.8233541852844803, "percentage": 38.23, "elapsed_time": "1:46:18", "remaining_time": "2:51:44", "throughput": 2321.35, "total_tokens": 14806992} {"current_steps": 25675, "total_steps": 67140, "loss": 0.7353, "lr": 3.8806064908814435e-05, "epoch": 3.824098897825439, "percentage": 38.24, "elapsed_time": "1:46:19", "remaining_time": "2:51:43", "throughput": 2321.4, "total_tokens": 14810000} {"current_steps": 25680, "total_steps": 67140, "loss": 0.4645, "lr": 3.880064646454027e-05, "epoch": 3.8248436103663987, "percentage": 38.25, "elapsed_time": "1:46:20", "remaining_time": "2:51:41", "throughput": 2321.45, "total_tokens": 14813008} {"current_steps": 25685, "total_steps": 67140, "loss": 0.6494, "lr": 3.8795227087674535e-05, "epoch": 3.8255883229073575, "percentage": 38.26, "elapsed_time": "1:46:22", "remaining_time": "2:51:40", "throughput": 2321.5, "total_tokens": 14816016} {"current_steps": 25690, "total_steps": 67140, "loss": 0.4381, "lr": 3.878980677858344e-05, "epoch": 3.826333035448317, "percentage": 38.26, "elapsed_time": "1:46:23", "remaining_time": "2:51:39", "throughput": 2321.51, "total_tokens": 14818608} {"current_steps": 25695, "total_steps": 67140, "loss": 0.6437, "lr": 3.878438553763326e-05, "epoch": 3.827077747989276, "percentage": 38.27, "elapsed_time": "1:46:24", "remaining_time": "2:51:37", "throughput": 2321.55, "total_tokens": 14821392} {"current_steps": 25700, "total_steps": 67140, "loss": 0.6178, "lr": 3.877896336519035e-05, "epoch": 3.8278224605302356, "percentage": 38.28, "elapsed_time": "1:46:25", "remaining_time": "2:51:36", "throughput": 2321.61, "total_tokens": 14824528} {"current_steps": 25705, "total_steps": 67140, "loss": 0.7442, "lr": 3.877354026162112e-05, "epoch": 3.8285671730711943, "percentage": 38.29, "elapsed_time": "1:46:26", "remaining_time": "2:51:34", "throughput": 2321.67, "total_tokens": 14827536} {"current_steps": 25710, "total_steps": 67140, "loss": 0.6054, "lr": 3.876811622729203e-05, "epoch": 3.829311885612154, "percentage": 38.29, "elapsed_time": "1:46:27", "remaining_time": "2:51:33", "throughput": 2321.7, "total_tokens": 14830320} {"current_steps": 25715, "total_steps": 67140, "loss": 0.6206, "lr": 3.8762691262569625e-05, "epoch": 3.8300565981531127, "percentage": 38.3, "elapsed_time": "1:46:28", "remaining_time": "2:51:31", "throughput": 2321.71, "total_tokens": 14832944} {"current_steps": 25720, "total_steps": 67140, "loss": 0.7547, "lr": 3.875726536782051e-05, "epoch": 3.830801310694072, "percentage": 38.31, "elapsed_time": "1:46:29", "remaining_time": "2:51:30", "throughput": 2321.75, "total_tokens": 14835920} {"current_steps": 25725, "total_steps": 67140, "loss": 0.7319, "lr": 3.8751838543411325e-05, "epoch": 3.831546023235031, "percentage": 38.32, "elapsed_time": "1:46:31", "remaining_time": "2:51:29", "throughput": 2321.8, "total_tokens": 14838896} {"current_steps": 25730, "total_steps": 67140, "loss": 0.7198, "lr": 3.8746410789708806e-05, "epoch": 3.8322907357759903, "percentage": 38.32, "elapsed_time": "1:46:32", "remaining_time": "2:51:27", "throughput": 2321.83, "total_tokens": 14841776} {"current_steps": 25735, "total_steps": 67140, "loss": 0.5246, "lr": 3.8740982107079735e-05, "epoch": 3.8330354483169495, "percentage": 38.33, "elapsed_time": "1:46:33", "remaining_time": "2:51:26", "throughput": 2321.89, "total_tokens": 14844784} {"current_steps": 25740, "total_steps": 67140, "loss": 0.7123, "lr": 3.873555249589096e-05, "epoch": 3.8337801608579087, "percentage": 38.34, "elapsed_time": "1:46:34", "remaining_time": "2:51:24", "throughput": 2321.94, "total_tokens": 14847792} {"current_steps": 25745, "total_steps": 67140, "loss": 0.7453, "lr": 3.873012195650939e-05, "epoch": 3.834524873398868, "percentage": 38.35, "elapsed_time": "1:46:35", "remaining_time": "2:51:23", "throughput": 2321.96, "total_tokens": 14850544} {"current_steps": 25750, "total_steps": 67140, "loss": 0.7233, "lr": 3.8724690489302004e-05, "epoch": 3.835269585939827, "percentage": 38.35, "elapsed_time": "1:46:36", "remaining_time": "2:51:22", "throughput": 2322.01, "total_tokens": 14853488} {"current_steps": 25755, "total_steps": 67140, "loss": 0.6233, "lr": 3.871925809463583e-05, "epoch": 3.8360142984807863, "percentage": 38.36, "elapsed_time": "1:46:37", "remaining_time": "2:51:20", "throughput": 2322.05, "total_tokens": 14856336} {"current_steps": 25760, "total_steps": 67140, "loss": 0.7231, "lr": 3.871382477287797e-05, "epoch": 3.8367590110217455, "percentage": 38.37, "elapsed_time": "1:46:39", "remaining_time": "2:51:19", "throughput": 2322.07, "total_tokens": 14859120} {"current_steps": 25765, "total_steps": 67140, "loss": 0.8262, "lr": 3.87083905243956e-05, "epoch": 3.8375037235627047, "percentage": 38.38, "elapsed_time": "1:46:40", "remaining_time": "2:51:17", "throughput": 2322.14, "total_tokens": 14862288} {"current_steps": 25770, "total_steps": 67140, "loss": 0.6837, "lr": 3.8702955349555924e-05, "epoch": 3.838248436103664, "percentage": 38.38, "elapsed_time": "1:46:41", "remaining_time": "2:51:16", "throughput": 2322.18, "total_tokens": 14865136} {"current_steps": 25775, "total_steps": 67140, "loss": 0.5932, "lr": 3.8697519248726236e-05, "epoch": 3.838993148644623, "percentage": 38.39, "elapsed_time": "1:46:42", "remaining_time": "2:51:15", "throughput": 2322.24, "total_tokens": 14868272} {"current_steps": 25780, "total_steps": 67140, "loss": 0.757, "lr": 3.869208222227389e-05, "epoch": 3.8397378611855824, "percentage": 38.4, "elapsed_time": "1:46:43", "remaining_time": "2:51:13", "throughput": 2322.25, "total_tokens": 14870896} {"current_steps": 25785, "total_steps": 67140, "loss": 0.6924, "lr": 3.86866442705663e-05, "epoch": 3.8404825737265416, "percentage": 38.4, "elapsed_time": "1:46:44", "remaining_time": "2:51:12", "throughput": 2322.28, "total_tokens": 14873680} {"current_steps": 25790, "total_steps": 67140, "loss": 0.5982, "lr": 3.868120539397093e-05, "epoch": 3.8412272862675008, "percentage": 38.41, "elapsed_time": "1:46:45", "remaining_time": "2:51:10", "throughput": 2322.33, "total_tokens": 14876656} {"current_steps": 25795, "total_steps": 67140, "loss": 0.6266, "lr": 3.867576559285533e-05, "epoch": 3.84197199880846, "percentage": 38.42, "elapsed_time": "1:46:46", "remaining_time": "2:51:09", "throughput": 2322.34, "total_tokens": 14879184} {"current_steps": 25800, "total_steps": 67140, "loss": 0.6714, "lr": 3.867032486758708e-05, "epoch": 3.842716711349419, "percentage": 38.43, "elapsed_time": "1:46:48", "remaining_time": "2:51:07", "throughput": 2322.36, "total_tokens": 14881936} {"current_steps": 25805, "total_steps": 67140, "loss": 0.5429, "lr": 3.8664883218533873e-05, "epoch": 3.8434614238903784, "percentage": 38.43, "elapsed_time": "1:46:49", "remaining_time": "2:51:06", "throughput": 2322.43, "total_tokens": 14885136} {"current_steps": 25810, "total_steps": 67140, "loss": 0.5071, "lr": 3.8659440646063404e-05, "epoch": 3.8442061364313376, "percentage": 38.44, "elapsed_time": "1:46:50", "remaining_time": "2:51:05", "throughput": 2322.45, "total_tokens": 14887856} {"current_steps": 25815, "total_steps": 67140, "loss": 0.84, "lr": 3.865399715054347e-05, "epoch": 3.8449508489722968, "percentage": 38.45, "elapsed_time": "1:46:51", "remaining_time": "2:51:03", "throughput": 2322.47, "total_tokens": 14890512} {"current_steps": 25820, "total_steps": 67140, "loss": 0.663, "lr": 3.8648552732341925e-05, "epoch": 3.845695561513256, "percentage": 38.46, "elapsed_time": "1:46:52", "remaining_time": "2:51:02", "throughput": 2322.51, "total_tokens": 14893488} {"current_steps": 25825, "total_steps": 67140, "loss": 0.5354, "lr": 3.8643107391826676e-05, "epoch": 3.846440274054215, "percentage": 38.46, "elapsed_time": "1:46:53", "remaining_time": "2:51:00", "throughput": 2322.57, "total_tokens": 14896496} {"current_steps": 25830, "total_steps": 67140, "loss": 0.6288, "lr": 3.86376611293657e-05, "epoch": 3.8471849865951744, "percentage": 38.47, "elapsed_time": "1:46:54", "remaining_time": "2:50:59", "throughput": 2322.62, "total_tokens": 14899504} {"current_steps": 25835, "total_steps": 67140, "loss": 0.5, "lr": 3.8632213945327036e-05, "epoch": 3.8479296991361336, "percentage": 38.48, "elapsed_time": "1:46:56", "remaining_time": "2:50:57", "throughput": 2322.64, "total_tokens": 14902192} {"current_steps": 25840, "total_steps": 67140, "loss": 0.6083, "lr": 3.8626765840078765e-05, "epoch": 3.848674411677093, "percentage": 38.49, "elapsed_time": "1:46:57", "remaining_time": "2:50:56", "throughput": 2322.71, "total_tokens": 14905424} {"current_steps": 25845, "total_steps": 67140, "loss": 0.5399, "lr": 3.862131681398907e-05, "epoch": 3.849419124218052, "percentage": 38.49, "elapsed_time": "1:46:58", "remaining_time": "2:50:55", "throughput": 2322.74, "total_tokens": 14908240} {"current_steps": 25850, "total_steps": 67140, "loss": 0.6754, "lr": 3.8615866867426164e-05, "epoch": 3.8501638367590107, "percentage": 38.5, "elapsed_time": "1:46:59", "remaining_time": "2:50:53", "throughput": 2322.77, "total_tokens": 14911024} {"current_steps": 25855, "total_steps": 67140, "loss": 0.864, "lr": 3.8610416000758334e-05, "epoch": 3.8509085492999704, "percentage": 38.51, "elapsed_time": "1:47:00", "remaining_time": "2:50:52", "throughput": 2322.83, "total_tokens": 14914064} {"current_steps": 25860, "total_steps": 67140, "loss": 0.5279, "lr": 3.860496421435392e-05, "epoch": 3.851653261840929, "percentage": 38.52, "elapsed_time": "1:47:01", "remaining_time": "2:50:51", "throughput": 2322.86, "total_tokens": 14916912} {"current_steps": 25865, "total_steps": 67140, "loss": 0.6717, "lr": 3.859951150858135e-05, "epoch": 3.852397974381889, "percentage": 38.52, "elapsed_time": "1:47:02", "remaining_time": "2:50:49", "throughput": 2322.91, "total_tokens": 14919856} {"current_steps": 25870, "total_steps": 67140, "loss": 0.682, "lr": 3.859405788380908e-05, "epoch": 3.8531426869228476, "percentage": 38.53, "elapsed_time": "1:47:04", "remaining_time": "2:50:48", "throughput": 2322.94, "total_tokens": 14922704} {"current_steps": 25875, "total_steps": 67140, "loss": 0.6689, "lr": 3.858860334040564e-05, "epoch": 3.853887399463807, "percentage": 38.54, "elapsed_time": "1:47:05", "remaining_time": "2:50:46", "throughput": 2323.0, "total_tokens": 14925872} {"current_steps": 25880, "total_steps": 67140, "loss": 0.6667, "lr": 3.858314787873964e-05, "epoch": 3.854632112004766, "percentage": 38.55, "elapsed_time": "1:47:06", "remaining_time": "2:50:45", "throughput": 2323.04, "total_tokens": 14928720} {"current_steps": 25885, "total_steps": 67140, "loss": 0.7758, "lr": 3.857769149917973e-05, "epoch": 3.8553768245457256, "percentage": 38.55, "elapsed_time": "1:47:07", "remaining_time": "2:50:44", "throughput": 2323.09, "total_tokens": 14931696} {"current_steps": 25890, "total_steps": 67140, "loss": 0.6712, "lr": 3.857223420209464e-05, "epoch": 3.8561215370866844, "percentage": 38.56, "elapsed_time": "1:47:08", "remaining_time": "2:50:42", "throughput": 2323.13, "total_tokens": 14934672} {"current_steps": 25895, "total_steps": 67140, "loss": 0.4994, "lr": 3.856677598785313e-05, "epoch": 3.8568662496276436, "percentage": 38.57, "elapsed_time": "1:47:09", "remaining_time": "2:50:41", "throughput": 2323.16, "total_tokens": 14937488} {"current_steps": 25900, "total_steps": 67140, "loss": 0.6737, "lr": 3.856131685682406e-05, "epoch": 3.8576109621686028, "percentage": 38.58, "elapsed_time": "1:47:10", "remaining_time": "2:50:39", "throughput": 2323.22, "total_tokens": 14940560} {"current_steps": 25905, "total_steps": 67140, "loss": 0.4799, "lr": 3.855585680937634e-05, "epoch": 3.858355674709562, "percentage": 38.58, "elapsed_time": "1:47:12", "remaining_time": "2:50:38", "throughput": 2323.27, "total_tokens": 14943536} {"current_steps": 25910, "total_steps": 67140, "loss": 0.5963, "lr": 3.8550395845878925e-05, "epoch": 3.859100387250521, "percentage": 38.59, "elapsed_time": "1:47:13", "remaining_time": "2:50:37", "throughput": 2323.31, "total_tokens": 14946480} {"current_steps": 25915, "total_steps": 67140, "loss": 0.5441, "lr": 3.854493396670085e-05, "epoch": 3.8598450997914804, "percentage": 38.6, "elapsed_time": "1:47:14", "remaining_time": "2:50:35", "throughput": 2323.31, "total_tokens": 14948976} {"current_steps": 25920, "total_steps": 67140, "loss": 0.6994, "lr": 3.8539471172211204e-05, "epoch": 3.8605898123324396, "percentage": 38.61, "elapsed_time": "1:47:15", "remaining_time": "2:50:34", "throughput": 2323.33, "total_tokens": 14951696} {"current_steps": 25925, "total_steps": 67140, "loss": 0.6257, "lr": 3.8534007462779154e-05, "epoch": 3.861334524873399, "percentage": 38.61, "elapsed_time": "1:47:16", "remaining_time": "2:50:32", "throughput": 2323.35, "total_tokens": 14954384} {"current_steps": 25930, "total_steps": 67140, "loss": 0.7268, "lr": 3.85285428387739e-05, "epoch": 3.862079237414358, "percentage": 38.62, "elapsed_time": "1:47:17", "remaining_time": "2:50:31", "throughput": 2323.42, "total_tokens": 14957584} {"current_steps": 25935, "total_steps": 67140, "loss": 0.6226, "lr": 3.852307730056472e-05, "epoch": 3.862823949955317, "percentage": 38.63, "elapsed_time": "1:47:18", "remaining_time": "2:50:29", "throughput": 2323.46, "total_tokens": 14960464} {"current_steps": 25940, "total_steps": 67140, "loss": 0.6607, "lr": 3.851761084852096e-05, "epoch": 3.8635686624962764, "percentage": 38.64, "elapsed_time": "1:47:20", "remaining_time": "2:50:28", "throughput": 2323.52, "total_tokens": 14963568} {"current_steps": 25945, "total_steps": 67140, "loss": 0.7024, "lr": 3.851214348301202e-05, "epoch": 3.8643133750372356, "percentage": 38.64, "elapsed_time": "1:47:21", "remaining_time": "2:50:27", "throughput": 2323.54, "total_tokens": 14966288} {"current_steps": 25950, "total_steps": 67140, "loss": 0.6816, "lr": 3.850667520440735e-05, "epoch": 3.865058087578195, "percentage": 38.65, "elapsed_time": "1:47:22", "remaining_time": "2:50:25", "throughput": 2323.56, "total_tokens": 14969008} {"current_steps": 25955, "total_steps": 67140, "loss": 0.8112, "lr": 3.8501206013076494e-05, "epoch": 3.865802800119154, "percentage": 38.66, "elapsed_time": "1:47:23", "remaining_time": "2:50:24", "throughput": 2323.59, "total_tokens": 14971824} {"current_steps": 25960, "total_steps": 67140, "loss": 0.5294, "lr": 3.849573590938903e-05, "epoch": 3.866547512660113, "percentage": 38.67, "elapsed_time": "1:47:24", "remaining_time": "2:50:22", "throughput": 2323.64, "total_tokens": 14974832} {"current_steps": 25965, "total_steps": 67140, "loss": 0.6333, "lr": 3.849026489371459e-05, "epoch": 3.8672922252010724, "percentage": 38.67, "elapsed_time": "1:47:25", "remaining_time": "2:50:21", "throughput": 2323.68, "total_tokens": 14977712} {"current_steps": 25970, "total_steps": 67140, "loss": 0.5919, "lr": 3.848479296642291e-05, "epoch": 3.8680369377420316, "percentage": 38.68, "elapsed_time": "1:47:26", "remaining_time": "2:50:20", "throughput": 2323.71, "total_tokens": 14980528} {"current_steps": 25975, "total_steps": 67140, "loss": 0.5706, "lr": 3.8479320127883744e-05, "epoch": 3.868781650282991, "percentage": 38.69, "elapsed_time": "1:47:27", "remaining_time": "2:50:18", "throughput": 2323.78, "total_tokens": 14983664} {"current_steps": 25980, "total_steps": 67140, "loss": 0.5406, "lr": 3.8473846378466915e-05, "epoch": 3.86952636282395, "percentage": 38.7, "elapsed_time": "1:47:29", "remaining_time": "2:50:17", "throughput": 2323.8, "total_tokens": 14986416} {"current_steps": 25985, "total_steps": 67140, "loss": 0.7447, "lr": 3.846837171854234e-05, "epoch": 3.870271075364909, "percentage": 38.7, "elapsed_time": "1:47:30", "remaining_time": "2:50:15", "throughput": 2323.83, "total_tokens": 14989200} {"current_steps": 25990, "total_steps": 67140, "loss": 0.6024, "lr": 3.8462896148479966e-05, "epoch": 3.8710157879058684, "percentage": 38.71, "elapsed_time": "1:47:31", "remaining_time": "2:50:14", "throughput": 2323.87, "total_tokens": 14992112} {"current_steps": 25995, "total_steps": 67140, "loss": 0.6815, "lr": 3.8457419668649795e-05, "epoch": 3.8717605004468276, "percentage": 38.72, "elapsed_time": "1:47:32", "remaining_time": "2:50:12", "throughput": 2323.9, "total_tokens": 14994864} {"current_steps": 26000, "total_steps": 67140, "loss": 0.658, "lr": 3.845194227942192e-05, "epoch": 3.872505212987787, "percentage": 38.73, "elapsed_time": "1:47:33", "remaining_time": "2:50:11", "throughput": 2323.93, "total_tokens": 14997744} {"current_steps": 26005, "total_steps": 67140, "loss": 0.6926, "lr": 3.844646398116648e-05, "epoch": 3.873249925528746, "percentage": 38.73, "elapsed_time": "1:47:34", "remaining_time": "2:50:10", "throughput": 2323.99, "total_tokens": 15000912} {"current_steps": 26010, "total_steps": 67140, "loss": 0.6982, "lr": 3.844098477425368e-05, "epoch": 3.8739946380697052, "percentage": 38.74, "elapsed_time": "1:47:35", "remaining_time": "2:50:08", "throughput": 2324.03, "total_tokens": 15003824} {"current_steps": 26015, "total_steps": 67140, "loss": 0.5993, "lr": 3.843550465905376e-05, "epoch": 3.8747393506106644, "percentage": 38.75, "elapsed_time": "1:47:37", "remaining_time": "2:50:07", "throughput": 2324.08, "total_tokens": 15006768} {"current_steps": 26020, "total_steps": 67140, "loss": 0.698, "lr": 3.843002363593707e-05, "epoch": 3.8754840631516236, "percentage": 38.75, "elapsed_time": "1:47:38", "remaining_time": "2:50:06", "throughput": 2324.11, "total_tokens": 15009616} {"current_steps": 26025, "total_steps": 67140, "loss": 0.7, "lr": 3.842454170527398e-05, "epoch": 3.8762287756925824, "percentage": 38.76, "elapsed_time": "1:47:39", "remaining_time": "2:50:04", "throughput": 2324.13, "total_tokens": 15012272} {"current_steps": 26030, "total_steps": 67140, "loss": 0.56, "lr": 3.841905886743494e-05, "epoch": 3.876973488233542, "percentage": 38.77, "elapsed_time": "1:47:40", "remaining_time": "2:50:03", "throughput": 2324.16, "total_tokens": 15015152} {"current_steps": 26035, "total_steps": 67140, "loss": 0.7086, "lr": 3.841357512279047e-05, "epoch": 3.877718200774501, "percentage": 38.78, "elapsed_time": "1:47:41", "remaining_time": "2:50:01", "throughput": 2324.24, "total_tokens": 15018384} {"current_steps": 26040, "total_steps": 67140, "loss": 0.4885, "lr": 3.8408090471711125e-05, "epoch": 3.8784629133154604, "percentage": 38.78, "elapsed_time": "1:47:42", "remaining_time": "2:50:00", "throughput": 2324.25, "total_tokens": 15021040} {"current_steps": 26045, "total_steps": 67140, "loss": 0.5726, "lr": 3.840260491456753e-05, "epoch": 3.879207625856419, "percentage": 38.79, "elapsed_time": "1:47:43", "remaining_time": "2:49:58", "throughput": 2324.28, "total_tokens": 15023760} {"current_steps": 26050, "total_steps": 67140, "loss": 0.787, "lr": 3.83971184517304e-05, "epoch": 3.879952338397379, "percentage": 38.8, "elapsed_time": "1:47:44", "remaining_time": "2:49:57", "throughput": 2324.29, "total_tokens": 15026384} {"current_steps": 26055, "total_steps": 67140, "loss": 0.7593, "lr": 3.8391631083570464e-05, "epoch": 3.8806970509383376, "percentage": 38.81, "elapsed_time": "1:47:46", "remaining_time": "2:49:56", "throughput": 2324.34, "total_tokens": 15029424} {"current_steps": 26060, "total_steps": 67140, "loss": 0.6411, "lr": 3.838614281045855e-05, "epoch": 3.8814417634792973, "percentage": 38.81, "elapsed_time": "1:47:47", "remaining_time": "2:49:54", "throughput": 2324.36, "total_tokens": 15032144} {"current_steps": 26065, "total_steps": 67140, "loss": 0.5001, "lr": 3.838065363276553e-05, "epoch": 3.882186476020256, "percentage": 38.82, "elapsed_time": "1:47:48", "remaining_time": "2:49:53", "throughput": 2324.38, "total_tokens": 15034768} {"current_steps": 26070, "total_steps": 67140, "loss": 0.7262, "lr": 3.837516355086234e-05, "epoch": 3.882931188561215, "percentage": 38.83, "elapsed_time": "1:47:49", "remaining_time": "2:49:51", "throughput": 2324.43, "total_tokens": 15037808} {"current_steps": 26075, "total_steps": 67140, "loss": 0.5854, "lr": 3.8369672565119975e-05, "epoch": 3.8836759011021744, "percentage": 38.84, "elapsed_time": "1:47:50", "remaining_time": "2:49:50", "throughput": 2324.46, "total_tokens": 15040624} {"current_steps": 26080, "total_steps": 67140, "loss": 0.657, "lr": 3.836418067590949e-05, "epoch": 3.8844206136431336, "percentage": 38.84, "elapsed_time": "1:47:51", "remaining_time": "2:49:48", "throughput": 2324.49, "total_tokens": 15043440} {"current_steps": 26085, "total_steps": 67140, "loss": 0.5705, "lr": 3.835868788360201e-05, "epoch": 3.885165326184093, "percentage": 38.85, "elapsed_time": "1:47:52", "remaining_time": "2:49:47", "throughput": 2324.51, "total_tokens": 15046160} {"current_steps": 26090, "total_steps": 67140, "loss": 0.4916, "lr": 3.8353194188568725e-05, "epoch": 3.885910038725052, "percentage": 38.86, "elapsed_time": "1:47:53", "remaining_time": "2:49:46", "throughput": 2324.56, "total_tokens": 15049104} {"current_steps": 26095, "total_steps": 67140, "loss": 0.8314, "lr": 3.8347699591180855e-05, "epoch": 3.8866547512660112, "percentage": 38.87, "elapsed_time": "1:47:55", "remaining_time": "2:49:44", "throughput": 2324.63, "total_tokens": 15052272} {"current_steps": 26100, "total_steps": 67140, "loss": 0.656, "lr": 3.8342204091809716e-05, "epoch": 3.8873994638069704, "percentage": 38.87, "elapsed_time": "1:47:56", "remaining_time": "2:49:43", "throughput": 2324.67, "total_tokens": 15055248} {"current_steps": 26105, "total_steps": 67140, "loss": 0.5997, "lr": 3.8336707690826676e-05, "epoch": 3.8881441763479296, "percentage": 38.88, "elapsed_time": "1:47:57", "remaining_time": "2:49:41", "throughput": 2324.7, "total_tokens": 15058032} {"current_steps": 26110, "total_steps": 67140, "loss": 0.4778, "lr": 3.8331210388603155e-05, "epoch": 3.888888888888889, "percentage": 38.89, "elapsed_time": "1:47:58", "remaining_time": "2:49:40", "throughput": 2324.7, "total_tokens": 15060592} {"current_steps": 26115, "total_steps": 67140, "loss": 0.6171, "lr": 3.8325712185510635e-05, "epoch": 3.889633601429848, "percentage": 38.9, "elapsed_time": "1:47:59", "remaining_time": "2:49:39", "throughput": 2324.77, "total_tokens": 15063728} {"current_steps": 26120, "total_steps": 67140, "loss": 0.7728, "lr": 3.8320213081920664e-05, "epoch": 3.8903783139708072, "percentage": 38.9, "elapsed_time": "1:48:00", "remaining_time": "2:49:37", "throughput": 2324.82, "total_tokens": 15066704} {"current_steps": 26125, "total_steps": 67140, "loss": 0.6513, "lr": 3.831471307820485e-05, "epoch": 3.8911230265117664, "percentage": 38.91, "elapsed_time": "1:48:01", "remaining_time": "2:49:36", "throughput": 2324.85, "total_tokens": 15069584} {"current_steps": 26130, "total_steps": 67140, "loss": 0.8099, "lr": 3.8309212174734856e-05, "epoch": 3.8918677390527256, "percentage": 38.92, "elapsed_time": "1:48:03", "remaining_time": "2:49:34", "throughput": 2324.88, "total_tokens": 15072368} {"current_steps": 26135, "total_steps": 67140, "loss": 0.7233, "lr": 3.8303710371882414e-05, "epoch": 3.892612451593685, "percentage": 38.93, "elapsed_time": "1:48:04", "remaining_time": "2:49:33", "throughput": 2325.02, "total_tokens": 15076432} {"current_steps": 26140, "total_steps": 67140, "loss": 0.5295, "lr": 3.8298207670019315e-05, "epoch": 3.893357164134644, "percentage": 38.93, "elapsed_time": "1:48:05", "remaining_time": "2:49:32", "throughput": 2325.04, "total_tokens": 15079216} {"current_steps": 26145, "total_steps": 67140, "loss": 0.66, "lr": 3.82927040695174e-05, "epoch": 3.8941018766756033, "percentage": 38.94, "elapsed_time": "1:48:06", "remaining_time": "2:49:31", "throughput": 2325.08, "total_tokens": 15082096} {"current_steps": 26150, "total_steps": 67140, "loss": 0.6439, "lr": 3.828719957074861e-05, "epoch": 3.8948465892165625, "percentage": 38.95, "elapsed_time": "1:48:07", "remaining_time": "2:49:29", "throughput": 2325.1, "total_tokens": 15084784} {"current_steps": 26155, "total_steps": 67140, "loss": 0.6193, "lr": 3.828169417408488e-05, "epoch": 3.8955913017575217, "percentage": 38.96, "elapsed_time": "1:48:08", "remaining_time": "2:49:28", "throughput": 2325.14, "total_tokens": 15087728} {"current_steps": 26160, "total_steps": 67140, "loss": 0.598, "lr": 3.8276187879898255e-05, "epoch": 3.896336014298481, "percentage": 38.96, "elapsed_time": "1:48:10", "remaining_time": "2:49:26", "throughput": 2325.16, "total_tokens": 15090512} {"current_steps": 26165, "total_steps": 67140, "loss": 0.6175, "lr": 3.827068068856083e-05, "epoch": 3.89708072683944, "percentage": 38.97, "elapsed_time": "1:48:11", "remaining_time": "2:49:25", "throughput": 2325.23, "total_tokens": 15093648} {"current_steps": 26170, "total_steps": 67140, "loss": 0.5993, "lr": 3.826517260044477e-05, "epoch": 3.8978254393803993, "percentage": 38.98, "elapsed_time": "1:48:12", "remaining_time": "2:49:24", "throughput": 2325.25, "total_tokens": 15096432} {"current_steps": 26175, "total_steps": 67140, "loss": 0.5557, "lr": 3.825966361592227e-05, "epoch": 3.8985701519213585, "percentage": 38.99, "elapsed_time": "1:48:13", "remaining_time": "2:49:22", "throughput": 2325.3, "total_tokens": 15099344} {"current_steps": 26180, "total_steps": 67140, "loss": 0.7272, "lr": 3.8254153735365614e-05, "epoch": 3.8993148644623177, "percentage": 38.99, "elapsed_time": "1:48:14", "remaining_time": "2:49:21", "throughput": 2325.34, "total_tokens": 15102192} {"current_steps": 26185, "total_steps": 67140, "loss": 0.7036, "lr": 3.8248642959147136e-05, "epoch": 3.900059577003277, "percentage": 39.0, "elapsed_time": "1:48:15", "remaining_time": "2:49:19", "throughput": 2325.34, "total_tokens": 15104752} {"current_steps": 26190, "total_steps": 67140, "loss": 0.6462, "lr": 3.8243131287639234e-05, "epoch": 3.900804289544236, "percentage": 39.01, "elapsed_time": "1:48:16", "remaining_time": "2:49:18", "throughput": 2325.36, "total_tokens": 15107472} {"current_steps": 26195, "total_steps": 67140, "loss": 0.502, "lr": 3.823761872121436e-05, "epoch": 3.9015490020851953, "percentage": 39.02, "elapsed_time": "1:48:17", "remaining_time": "2:49:16", "throughput": 2325.43, "total_tokens": 15110608} {"current_steps": 26200, "total_steps": 67140, "loss": 0.6801, "lr": 3.823210526024503e-05, "epoch": 3.902293714626154, "percentage": 39.02, "elapsed_time": "1:48:19", "remaining_time": "2:49:15", "throughput": 2325.46, "total_tokens": 15113392} {"current_steps": 26205, "total_steps": 67140, "loss": 0.7951, "lr": 3.822659090510383e-05, "epoch": 3.9030384271671137, "percentage": 39.03, "elapsed_time": "1:48:20", "remaining_time": "2:49:14", "throughput": 2325.49, "total_tokens": 15116208} {"current_steps": 26210, "total_steps": 67140, "loss": 0.7807, "lr": 3.822107565616339e-05, "epoch": 3.9037831397080724, "percentage": 39.04, "elapsed_time": "1:48:21", "remaining_time": "2:49:12", "throughput": 2325.52, "total_tokens": 15119024} {"current_steps": 26215, "total_steps": 67140, "loss": 0.5556, "lr": 3.8215559513796405e-05, "epoch": 3.904527852249032, "percentage": 39.05, "elapsed_time": "1:48:22", "remaining_time": "2:49:11", "throughput": 2325.52, "total_tokens": 15121616} {"current_steps": 26220, "total_steps": 67140, "loss": 0.7335, "lr": 3.821004247837564e-05, "epoch": 3.905272564789991, "percentage": 39.05, "elapsed_time": "1:48:23", "remaining_time": "2:49:09", "throughput": 2325.57, "total_tokens": 15124528} {"current_steps": 26225, "total_steps": 67140, "loss": 0.5509, "lr": 3.820452455027391e-05, "epoch": 3.9060172773309505, "percentage": 39.06, "elapsed_time": "1:48:24", "remaining_time": "2:49:08", "throughput": 2325.65, "total_tokens": 15127856} {"current_steps": 26230, "total_steps": 67140, "loss": 0.5444, "lr": 3.819900572986411e-05, "epoch": 3.9067619898719093, "percentage": 39.07, "elapsed_time": "1:48:25", "remaining_time": "2:49:07", "throughput": 2325.69, "total_tokens": 15130800} {"current_steps": 26235, "total_steps": 67140, "loss": 0.5488, "lr": 3.8193486017519157e-05, "epoch": 3.907506702412869, "percentage": 39.08, "elapsed_time": "1:48:27", "remaining_time": "2:49:05", "throughput": 2325.73, "total_tokens": 15133680} {"current_steps": 26240, "total_steps": 67140, "loss": 0.6256, "lr": 3.818796541361206e-05, "epoch": 3.9082514149538277, "percentage": 39.08, "elapsed_time": "1:48:28", "remaining_time": "2:49:04", "throughput": 2325.8, "total_tokens": 15136880} {"current_steps": 26245, "total_steps": 67140, "loss": 0.6297, "lr": 3.8182443918515874e-05, "epoch": 3.908996127494787, "percentage": 39.09, "elapsed_time": "1:48:29", "remaining_time": "2:49:02", "throughput": 2325.86, "total_tokens": 15139952} {"current_steps": 26250, "total_steps": 67140, "loss": 0.5393, "lr": 3.817692153260374e-05, "epoch": 3.909740840035746, "percentage": 39.1, "elapsed_time": "1:48:30", "remaining_time": "2:49:01", "throughput": 2325.88, "total_tokens": 15142672} {"current_steps": 26255, "total_steps": 67140, "loss": 0.7684, "lr": 3.817139825624881e-05, "epoch": 3.9104855525767053, "percentage": 39.1, "elapsed_time": "1:48:31", "remaining_time": "2:49:00", "throughput": 2325.91, "total_tokens": 15145520} {"current_steps": 26260, "total_steps": 67140, "loss": 0.7337, "lr": 3.8165874089824336e-05, "epoch": 3.9112302651176645, "percentage": 39.11, "elapsed_time": "1:48:32", "remaining_time": "2:48:58", "throughput": 2325.96, "total_tokens": 15148432} {"current_steps": 26265, "total_steps": 67140, "loss": 0.6921, "lr": 3.816034903370362e-05, "epoch": 3.9119749776586237, "percentage": 39.12, "elapsed_time": "1:48:33", "remaining_time": "2:48:57", "throughput": 2326.01, "total_tokens": 15151504} {"current_steps": 26270, "total_steps": 67140, "loss": 0.6932, "lr": 3.8154823088260026e-05, "epoch": 3.912719690199583, "percentage": 39.13, "elapsed_time": "1:48:35", "remaining_time": "2:48:55", "throughput": 2326.05, "total_tokens": 15154320} {"current_steps": 26275, "total_steps": 67140, "loss": 0.6842, "lr": 3.8149296253866975e-05, "epoch": 3.913464402740542, "percentage": 39.13, "elapsed_time": "1:48:36", "remaining_time": "2:48:54", "throughput": 2326.11, "total_tokens": 15157456} {"current_steps": 26280, "total_steps": 67140, "loss": 0.5598, "lr": 3.8143768530897935e-05, "epoch": 3.9142091152815013, "percentage": 39.14, "elapsed_time": "1:48:37", "remaining_time": "2:48:53", "throughput": 2326.17, "total_tokens": 15160528} {"current_steps": 26285, "total_steps": 67140, "loss": 0.728, "lr": 3.813823991972646e-05, "epoch": 3.9149538278224605, "percentage": 39.15, "elapsed_time": "1:48:38", "remaining_time": "2:48:51", "throughput": 2326.18, "total_tokens": 15163184} {"current_steps": 26290, "total_steps": 67140, "loss": 0.6365, "lr": 3.8132710420726146e-05, "epoch": 3.9156985403634197, "percentage": 39.16, "elapsed_time": "1:48:39", "remaining_time": "2:48:50", "throughput": 2326.2, "total_tokens": 15165904} {"current_steps": 26295, "total_steps": 67140, "loss": 0.6422, "lr": 3.812718003427066e-05, "epoch": 3.916443252904379, "percentage": 39.16, "elapsed_time": "1:48:40", "remaining_time": "2:48:48", "throughput": 2326.22, "total_tokens": 15168624} {"current_steps": 26300, "total_steps": 67140, "loss": 0.6424, "lr": 3.812164876073371e-05, "epoch": 3.917187965445338, "percentage": 39.17, "elapsed_time": "1:48:41", "remaining_time": "2:48:47", "throughput": 2326.26, "total_tokens": 15171440} {"current_steps": 26305, "total_steps": 67140, "loss": 0.742, "lr": 3.8116116600489096e-05, "epoch": 3.9179326779862973, "percentage": 39.18, "elapsed_time": "1:48:42", "remaining_time": "2:48:46", "throughput": 2326.3, "total_tokens": 15174352} {"current_steps": 26310, "total_steps": 67140, "loss": 0.4925, "lr": 3.8110583553910644e-05, "epoch": 3.9186773905272565, "percentage": 39.19, "elapsed_time": "1:48:44", "remaining_time": "2:48:44", "throughput": 2326.35, "total_tokens": 15177328} {"current_steps": 26315, "total_steps": 67140, "loss": 0.572, "lr": 3.810504962137226e-05, "epoch": 3.9194221030682157, "percentage": 39.19, "elapsed_time": "1:48:45", "remaining_time": "2:48:43", "throughput": 2326.37, "total_tokens": 15180080} {"current_steps": 26320, "total_steps": 67140, "loss": 0.7886, "lr": 3.8099514803247905e-05, "epoch": 3.920166815609175, "percentage": 39.2, "elapsed_time": "1:48:46", "remaining_time": "2:48:41", "throughput": 2326.41, "total_tokens": 15183024} {"current_steps": 26325, "total_steps": 67140, "loss": 0.6728, "lr": 3.809397909991159e-05, "epoch": 3.920911528150134, "percentage": 39.21, "elapsed_time": "1:48:47", "remaining_time": "2:48:40", "throughput": 2326.43, "total_tokens": 15185712} {"current_steps": 26330, "total_steps": 67140, "loss": 0.6211, "lr": 3.808844251173741e-05, "epoch": 3.9216562406910933, "percentage": 39.22, "elapsed_time": "1:48:48", "remaining_time": "2:48:38", "throughput": 2326.44, "total_tokens": 15188336} {"current_steps": 26335, "total_steps": 67140, "loss": 0.6458, "lr": 3.8082905039099496e-05, "epoch": 3.9224009532320525, "percentage": 39.22, "elapsed_time": "1:48:49", "remaining_time": "2:48:37", "throughput": 2326.46, "total_tokens": 15191056} {"current_steps": 26340, "total_steps": 67140, "loss": 0.644, "lr": 3.8077366682372056e-05, "epoch": 3.9231456657730117, "percentage": 39.23, "elapsed_time": "1:48:50", "remaining_time": "2:48:35", "throughput": 2326.48, "total_tokens": 15193680} {"current_steps": 26345, "total_steps": 67140, "loss": 0.5518, "lr": 3.807182744192934e-05, "epoch": 3.923890378313971, "percentage": 39.24, "elapsed_time": "1:48:51", "remaining_time": "2:48:34", "throughput": 2326.5, "total_tokens": 15196432} {"current_steps": 26350, "total_steps": 67140, "loss": 0.7083, "lr": 3.806628731814568e-05, "epoch": 3.92463509085493, "percentage": 39.25, "elapsed_time": "1:48:52", "remaining_time": "2:48:33", "throughput": 2326.52, "total_tokens": 15199120} {"current_steps": 26355, "total_steps": 67140, "loss": 0.5036, "lr": 3.806074631139543e-05, "epoch": 3.9253798033958893, "percentage": 39.25, "elapsed_time": "1:48:54", "remaining_time": "2:48:31", "throughput": 2326.55, "total_tokens": 15201936} {"current_steps": 26360, "total_steps": 67140, "loss": 0.5895, "lr": 3.805520442205306e-05, "epoch": 3.9261245159368485, "percentage": 39.26, "elapsed_time": "1:48:55", "remaining_time": "2:48:30", "throughput": 2326.61, "total_tokens": 15205040} {"current_steps": 26365, "total_steps": 67140, "loss": 0.7347, "lr": 3.804966165049304e-05, "epoch": 3.9268692284778077, "percentage": 39.27, "elapsed_time": "1:48:56", "remaining_time": "2:48:28", "throughput": 2326.62, "total_tokens": 15207632} {"current_steps": 26370, "total_steps": 67140, "loss": 0.6495, "lr": 3.8044117997089954e-05, "epoch": 3.927613941018767, "percentage": 39.28, "elapsed_time": "1:48:57", "remaining_time": "2:48:27", "throughput": 2326.63, "total_tokens": 15210320} {"current_steps": 26375, "total_steps": 67140, "loss": 0.7435, "lr": 3.803857346221841e-05, "epoch": 3.9283586535597257, "percentage": 39.28, "elapsed_time": "1:48:58", "remaining_time": "2:48:26", "throughput": 2326.68, "total_tokens": 15213296} {"current_steps": 26380, "total_steps": 67140, "loss": 0.6728, "lr": 3.803302804625307e-05, "epoch": 3.9291033661006853, "percentage": 39.29, "elapsed_time": "1:48:59", "remaining_time": "2:48:24", "throughput": 2326.72, "total_tokens": 15216112} {"current_steps": 26385, "total_steps": 67140, "loss": 0.5671, "lr": 3.80274817495687e-05, "epoch": 3.929848078641644, "percentage": 39.3, "elapsed_time": "1:49:00", "remaining_time": "2:48:23", "throughput": 2326.74, "total_tokens": 15218864} {"current_steps": 26390, "total_steps": 67140, "loss": 0.7455, "lr": 3.8021934572540065e-05, "epoch": 3.9305927911826037, "percentage": 39.31, "elapsed_time": "1:49:02", "remaining_time": "2:48:21", "throughput": 2326.79, "total_tokens": 15221904} {"current_steps": 26395, "total_steps": 67140, "loss": 0.5667, "lr": 3.8016386515542035e-05, "epoch": 3.9313375037235625, "percentage": 39.31, "elapsed_time": "1:49:03", "remaining_time": "2:48:20", "throughput": 2326.82, "total_tokens": 15224656} {"current_steps": 26400, "total_steps": 67140, "loss": 0.5855, "lr": 3.8010837578949527e-05, "epoch": 3.932082216264522, "percentage": 39.32, "elapsed_time": "1:49:04", "remaining_time": "2:48:18", "throughput": 2326.83, "total_tokens": 15227344} {"current_steps": 26405, "total_steps": 67140, "loss": 0.6051, "lr": 3.800528776313752e-05, "epoch": 3.932826928805481, "percentage": 39.33, "elapsed_time": "1:49:05", "remaining_time": "2:48:17", "throughput": 2326.88, "total_tokens": 15230320} {"current_steps": 26410, "total_steps": 67140, "loss": 0.6773, "lr": 3.799973706848103e-05, "epoch": 3.9335716413464406, "percentage": 39.34, "elapsed_time": "1:49:06", "remaining_time": "2:48:16", "throughput": 2326.92, "total_tokens": 15233232} {"current_steps": 26415, "total_steps": 67140, "loss": 0.5255, "lr": 3.799418549535517e-05, "epoch": 3.9343163538873993, "percentage": 39.34, "elapsed_time": "1:49:07", "remaining_time": "2:48:14", "throughput": 2326.96, "total_tokens": 15236144} {"current_steps": 26420, "total_steps": 67140, "loss": 0.6306, "lr": 3.798863304413509e-05, "epoch": 3.9350610664283585, "percentage": 39.35, "elapsed_time": "1:49:08", "remaining_time": "2:48:13", "throughput": 2327.03, "total_tokens": 15239376} {"current_steps": 26425, "total_steps": 67140, "loss": 0.6539, "lr": 3.7983079715195984e-05, "epoch": 3.9358057789693177, "percentage": 39.36, "elapsed_time": "1:49:09", "remaining_time": "2:48:12", "throughput": 2327.05, "total_tokens": 15242128} {"current_steps": 26430, "total_steps": 67140, "loss": 0.6223, "lr": 3.7977525508913145e-05, "epoch": 3.936550491510277, "percentage": 39.37, "elapsed_time": "1:49:11", "remaining_time": "2:48:10", "throughput": 2327.09, "total_tokens": 15245040} {"current_steps": 26435, "total_steps": 67140, "loss": 0.6499, "lr": 3.797197042566189e-05, "epoch": 3.937295204051236, "percentage": 39.37, "elapsed_time": "1:49:12", "remaining_time": "2:48:09", "throughput": 2327.17, "total_tokens": 15248368} {"current_steps": 26440, "total_steps": 67140, "loss": 0.7126, "lr": 3.796641446581762e-05, "epoch": 3.9380399165921953, "percentage": 39.38, "elapsed_time": "1:49:13", "remaining_time": "2:48:07", "throughput": 2327.18, "total_tokens": 15250992} {"current_steps": 26445, "total_steps": 67140, "loss": 0.6641, "lr": 3.796085762975577e-05, "epoch": 3.9387846291331545, "percentage": 39.39, "elapsed_time": "1:49:14", "remaining_time": "2:48:06", "throughput": 2327.22, "total_tokens": 15253968} {"current_steps": 26450, "total_steps": 67140, "loss": 0.6507, "lr": 3.7955299917851864e-05, "epoch": 3.9395293416741137, "percentage": 39.4, "elapsed_time": "1:49:15", "remaining_time": "2:48:05", "throughput": 2327.27, "total_tokens": 15256944} {"current_steps": 26455, "total_steps": 67140, "loss": 0.629, "lr": 3.794974133048146e-05, "epoch": 3.940274054215073, "percentage": 39.4, "elapsed_time": "1:49:16", "remaining_time": "2:48:03", "throughput": 2327.27, "total_tokens": 15259504} {"current_steps": 26460, "total_steps": 67140, "loss": 0.6302, "lr": 3.794418186802018e-05, "epoch": 3.941018766756032, "percentage": 39.41, "elapsed_time": "1:49:17", "remaining_time": "2:48:02", "throughput": 2327.29, "total_tokens": 15262320} {"current_steps": 26465, "total_steps": 67140, "loss": 0.6797, "lr": 3.793862153084372e-05, "epoch": 3.9417634792969913, "percentage": 39.42, "elapsed_time": "1:49:19", "remaining_time": "2:48:00", "throughput": 2327.3, "total_tokens": 15264880} {"current_steps": 26470, "total_steps": 67140, "loss": 0.7797, "lr": 3.793306031932783e-05, "epoch": 3.9425081918379505, "percentage": 39.43, "elapsed_time": "1:49:20", "remaining_time": "2:47:59", "throughput": 2327.34, "total_tokens": 15267856} {"current_steps": 26475, "total_steps": 67140, "loss": 0.7026, "lr": 3.79274982338483e-05, "epoch": 3.9432529043789097, "percentage": 39.43, "elapsed_time": "1:49:21", "remaining_time": "2:47:58", "throughput": 2327.39, "total_tokens": 15270800} {"current_steps": 26480, "total_steps": 67140, "loss": 0.5525, "lr": 3.7921935274780994e-05, "epoch": 3.943997616919869, "percentage": 39.44, "elapsed_time": "1:49:22", "remaining_time": "2:47:56", "throughput": 2327.45, "total_tokens": 15273936} {"current_steps": 26485, "total_steps": 67140, "loss": 0.6771, "lr": 3.791637144250184e-05, "epoch": 3.944742329460828, "percentage": 39.45, "elapsed_time": "1:49:23", "remaining_time": "2:47:55", "throughput": 2327.49, "total_tokens": 15276816} {"current_steps": 26490, "total_steps": 67140, "loss": 0.6001, "lr": 3.791080673738682e-05, "epoch": 3.9454870420017873, "percentage": 39.45, "elapsed_time": "1:49:24", "remaining_time": "2:47:53", "throughput": 2327.52, "total_tokens": 15279632} {"current_steps": 26495, "total_steps": 67140, "loss": 0.5665, "lr": 3.790524115981198e-05, "epoch": 3.9462317545427466, "percentage": 39.46, "elapsed_time": "1:49:25", "remaining_time": "2:47:52", "throughput": 2327.54, "total_tokens": 15282288} {"current_steps": 26500, "total_steps": 67140, "loss": 0.7521, "lr": 3.78996747101534e-05, "epoch": 3.9469764670837058, "percentage": 39.47, "elapsed_time": "1:49:26", "remaining_time": "2:47:51", "throughput": 2327.56, "total_tokens": 15285008} {"current_steps": 26505, "total_steps": 67140, "loss": 0.6329, "lr": 3.789410738878726e-05, "epoch": 3.947721179624665, "percentage": 39.48, "elapsed_time": "1:49:28", "remaining_time": "2:47:49", "throughput": 2327.58, "total_tokens": 15287728} {"current_steps": 26510, "total_steps": 67140, "loss": 0.7028, "lr": 3.7888539196089755e-05, "epoch": 3.948465892165624, "percentage": 39.48, "elapsed_time": "1:49:29", "remaining_time": "2:47:48", "throughput": 2327.59, "total_tokens": 15290384} {"current_steps": 26515, "total_steps": 67140, "loss": 0.5805, "lr": 3.788297013243718e-05, "epoch": 3.9492106047065834, "percentage": 39.49, "elapsed_time": "1:49:30", "remaining_time": "2:47:46", "throughput": 2327.62, "total_tokens": 15293136} {"current_steps": 26520, "total_steps": 67140, "loss": 0.6097, "lr": 3.7877400198205856e-05, "epoch": 3.9499553172475426, "percentage": 39.5, "elapsed_time": "1:49:31", "remaining_time": "2:47:45", "throughput": 2327.67, "total_tokens": 15296176} {"current_steps": 26525, "total_steps": 67140, "loss": 0.6729, "lr": 3.7871829393772185e-05, "epoch": 3.9507000297885018, "percentage": 39.51, "elapsed_time": "1:49:32", "remaining_time": "2:47:43", "throughput": 2327.68, "total_tokens": 15298800} {"current_steps": 26530, "total_steps": 67140, "loss": 0.6031, "lr": 3.786625771951261e-05, "epoch": 3.951444742329461, "percentage": 39.51, "elapsed_time": "1:49:33", "remaining_time": "2:47:42", "throughput": 2327.72, "total_tokens": 15301680} {"current_steps": 26535, "total_steps": 67140, "loss": 0.6076, "lr": 3.7860685175803654e-05, "epoch": 3.95218945487042, "percentage": 39.52, "elapsed_time": "1:49:34", "remaining_time": "2:47:41", "throughput": 2327.74, "total_tokens": 15304432} {"current_steps": 26540, "total_steps": 67140, "loss": 0.4331, "lr": 3.785511176302189e-05, "epoch": 3.9529341674113794, "percentage": 39.53, "elapsed_time": "1:49:35", "remaining_time": "2:47:39", "throughput": 2327.76, "total_tokens": 15307184} {"current_steps": 26545, "total_steps": 67140, "loss": 0.6559, "lr": 3.784953748154393e-05, "epoch": 3.9536788799523386, "percentage": 39.54, "elapsed_time": "1:49:37", "remaining_time": "2:47:38", "throughput": 2327.79, "total_tokens": 15309968} {"current_steps": 26550, "total_steps": 67140, "loss": 0.6122, "lr": 3.784396233174647e-05, "epoch": 3.9544235924932973, "percentage": 39.54, "elapsed_time": "1:49:38", "remaining_time": "2:47:36", "throughput": 2327.84, "total_tokens": 15313008} {"current_steps": 26555, "total_steps": 67140, "loss": 1.0015, "lr": 3.7838386314006256e-05, "epoch": 3.955168305034257, "percentage": 39.55, "elapsed_time": "1:49:39", "remaining_time": "2:47:35", "throughput": 2327.87, "total_tokens": 15315824} {"current_steps": 26560, "total_steps": 67140, "loss": 0.7642, "lr": 3.78328094287001e-05, "epoch": 3.9559130175752157, "percentage": 39.56, "elapsed_time": "1:49:40", "remaining_time": "2:47:33", "throughput": 2327.9, "total_tokens": 15318576} {"current_steps": 26565, "total_steps": 67140, "loss": 0.6706, "lr": 3.782723167620484e-05, "epoch": 3.9566577301161754, "percentage": 39.57, "elapsed_time": "1:49:41", "remaining_time": "2:47:32", "throughput": 2327.93, "total_tokens": 15321456} {"current_steps": 26570, "total_steps": 67140, "loss": 0.7015, "lr": 3.782165305689743e-05, "epoch": 3.957402442657134, "percentage": 39.57, "elapsed_time": "1:49:42", "remaining_time": "2:47:31", "throughput": 2327.99, "total_tokens": 15324528} {"current_steps": 26575, "total_steps": 67140, "loss": 0.8019, "lr": 3.781607357115483e-05, "epoch": 3.958147155198094, "percentage": 39.58, "elapsed_time": "1:49:43", "remaining_time": "2:47:29", "throughput": 2328.03, "total_tokens": 15327472} {"current_steps": 26580, "total_steps": 67140, "loss": 0.8327, "lr": 3.7810493219354083e-05, "epoch": 3.9588918677390526, "percentage": 39.59, "elapsed_time": "1:49:44", "remaining_time": "2:47:28", "throughput": 2328.03, "total_tokens": 15330064} {"current_steps": 26585, "total_steps": 67140, "loss": 0.5491, "lr": 3.780491200187228e-05, "epoch": 3.9596365802800118, "percentage": 39.6, "elapsed_time": "1:49:46", "remaining_time": "2:47:27", "throughput": 2328.08, "total_tokens": 15333136} {"current_steps": 26590, "total_steps": 67140, "loss": 0.6257, "lr": 3.77993299190866e-05, "epoch": 3.960381292820971, "percentage": 39.6, "elapsed_time": "1:49:47", "remaining_time": "2:47:25", "throughput": 2328.11, "total_tokens": 15335888} {"current_steps": 26595, "total_steps": 67140, "loss": 0.694, "lr": 3.7793746971374236e-05, "epoch": 3.96112600536193, "percentage": 39.61, "elapsed_time": "1:49:48", "remaining_time": "2:47:24", "throughput": 2328.16, "total_tokens": 15338864} {"current_steps": 26600, "total_steps": 67140, "loss": 0.7019, "lr": 3.7788163159112467e-05, "epoch": 3.9618707179028894, "percentage": 39.62, "elapsed_time": "1:49:49", "remaining_time": "2:47:22", "throughput": 2328.18, "total_tokens": 15341616} {"current_steps": 26605, "total_steps": 67140, "loss": 0.7873, "lr": 3.778257848267863e-05, "epoch": 3.9626154304438486, "percentage": 39.63, "elapsed_time": "1:49:50", "remaining_time": "2:47:21", "throughput": 2328.22, "total_tokens": 15344496} {"current_steps": 26610, "total_steps": 67140, "loss": 0.6158, "lr": 3.7776992942450097e-05, "epoch": 3.9633601429848078, "percentage": 39.63, "elapsed_time": "1:49:51", "remaining_time": "2:47:20", "throughput": 2328.25, "total_tokens": 15347376} {"current_steps": 26615, "total_steps": 67140, "loss": 0.5795, "lr": 3.777140653880434e-05, "epoch": 3.964104855525767, "percentage": 39.64, "elapsed_time": "1:49:52", "remaining_time": "2:47:18", "throughput": 2328.28, "total_tokens": 15350224} {"current_steps": 26620, "total_steps": 67140, "loss": 0.6049, "lr": 3.776581927211885e-05, "epoch": 3.964849568066726, "percentage": 39.65, "elapsed_time": "1:49:54", "remaining_time": "2:47:17", "throughput": 2328.29, "total_tokens": 15352848} {"current_steps": 26625, "total_steps": 67140, "loss": 0.7167, "lr": 3.7760231142771194e-05, "epoch": 3.9655942806076854, "percentage": 39.66, "elapsed_time": "1:49:55", "remaining_time": "2:47:15", "throughput": 2328.32, "total_tokens": 15355632} {"current_steps": 26630, "total_steps": 67140, "loss": 0.7786, "lr": 3.7754642151139e-05, "epoch": 3.9663389931486446, "percentage": 39.66, "elapsed_time": "1:49:56", "remaining_time": "2:47:14", "throughput": 2328.37, "total_tokens": 15358640} {"current_steps": 26635, "total_steps": 67140, "loss": 0.8391, "lr": 3.774905229759994e-05, "epoch": 3.967083705689604, "percentage": 39.67, "elapsed_time": "1:49:57", "remaining_time": "2:47:13", "throughput": 2328.4, "total_tokens": 15361488} {"current_steps": 26640, "total_steps": 67140, "loss": 0.6438, "lr": 3.7743461582531767e-05, "epoch": 3.967828418230563, "percentage": 39.68, "elapsed_time": "1:49:58", "remaining_time": "2:47:11", "throughput": 2328.43, "total_tokens": 15364240} {"current_steps": 26645, "total_steps": 67140, "loss": 0.7018, "lr": 3.773787000631226e-05, "epoch": 3.968573130771522, "percentage": 39.69, "elapsed_time": "1:49:59", "remaining_time": "2:47:10", "throughput": 2328.45, "total_tokens": 15367056} {"current_steps": 26650, "total_steps": 67140, "loss": 0.6716, "lr": 3.77322775693193e-05, "epoch": 3.9693178433124814, "percentage": 39.69, "elapsed_time": "1:50:00", "remaining_time": "2:47:08", "throughput": 2328.49, "total_tokens": 15369904} {"current_steps": 26655, "total_steps": 67140, "loss": 0.5725, "lr": 3.772668427193078e-05, "epoch": 3.9700625558534406, "percentage": 39.7, "elapsed_time": "1:50:01", "remaining_time": "2:47:07", "throughput": 2328.52, "total_tokens": 15372752} {"current_steps": 26660, "total_steps": 67140, "loss": 0.7329, "lr": 3.772109011452468e-05, "epoch": 3.9708072683944, "percentage": 39.71, "elapsed_time": "1:50:03", "remaining_time": "2:47:05", "throughput": 2328.54, "total_tokens": 15375472} {"current_steps": 26665, "total_steps": 67140, "loss": 0.7581, "lr": 3.771549509747903e-05, "epoch": 3.971551980935359, "percentage": 39.72, "elapsed_time": "1:50:04", "remaining_time": "2:47:04", "throughput": 2328.6, "total_tokens": 15378640} {"current_steps": 26670, "total_steps": 67140, "loss": 0.5186, "lr": 3.7709899221171924e-05, "epoch": 3.972296693476318, "percentage": 39.72, "elapsed_time": "1:50:05", "remaining_time": "2:47:03", "throughput": 2328.64, "total_tokens": 15381616} {"current_steps": 26675, "total_steps": 67140, "loss": 0.5964, "lr": 3.7704302485981504e-05, "epoch": 3.9730414060172774, "percentage": 39.73, "elapsed_time": "1:50:06", "remaining_time": "2:47:01", "throughput": 2328.67, "total_tokens": 15384464} {"current_steps": 26680, "total_steps": 67140, "loss": 0.6531, "lr": 3.769870489228596e-05, "epoch": 3.9737861185582366, "percentage": 39.74, "elapsed_time": "1:50:07", "remaining_time": "2:47:00", "throughput": 2328.73, "total_tokens": 15387472} {"current_steps": 26685, "total_steps": 67140, "loss": 0.4847, "lr": 3.769310644046359e-05, "epoch": 3.974530831099196, "percentage": 39.75, "elapsed_time": "1:50:08", "remaining_time": "2:46:59", "throughput": 2328.79, "total_tokens": 15390608} {"current_steps": 26690, "total_steps": 67140, "loss": 0.6734, "lr": 3.768750713089267e-05, "epoch": 3.975275543640155, "percentage": 39.75, "elapsed_time": "1:50:09", "remaining_time": "2:46:57", "throughput": 2328.82, "total_tokens": 15393392} {"current_steps": 26695, "total_steps": 67140, "loss": 0.6141, "lr": 3.768190696395162e-05, "epoch": 3.976020256181114, "percentage": 39.76, "elapsed_time": "1:50:11", "remaining_time": "2:46:56", "throughput": 2328.85, "total_tokens": 15396272} {"current_steps": 26700, "total_steps": 67140, "loss": 0.7189, "lr": 3.767630594001885e-05, "epoch": 3.9767649687220734, "percentage": 39.77, "elapsed_time": "1:50:12", "remaining_time": "2:46:54", "throughput": 2328.85, "total_tokens": 15398896} {"current_steps": 26705, "total_steps": 67140, "loss": 0.7406, "lr": 3.767070405947287e-05, "epoch": 3.9775096812630326, "percentage": 39.78, "elapsed_time": "1:50:13", "remaining_time": "2:46:53", "throughput": 2328.9, "total_tokens": 15401936} {"current_steps": 26710, "total_steps": 67140, "loss": 0.6451, "lr": 3.7665101322692206e-05, "epoch": 3.978254393803992, "percentage": 39.78, "elapsed_time": "1:50:14", "remaining_time": "2:46:52", "throughput": 2328.94, "total_tokens": 15404880} {"current_steps": 26715, "total_steps": 67140, "loss": 0.7048, "lr": 3.765949773005551e-05, "epoch": 3.9789991063449506, "percentage": 39.79, "elapsed_time": "1:50:15", "remaining_time": "2:46:50", "throughput": 2328.98, "total_tokens": 15407760} {"current_steps": 26720, "total_steps": 67140, "loss": 0.7079, "lr": 3.7653893281941425e-05, "epoch": 3.9797438188859102, "percentage": 39.8, "elapsed_time": "1:50:16", "remaining_time": "2:46:49", "throughput": 2329.03, "total_tokens": 15410864} {"current_steps": 26725, "total_steps": 67140, "loss": 0.4995, "lr": 3.764828797872866e-05, "epoch": 3.980488531426869, "percentage": 39.8, "elapsed_time": "1:50:17", "remaining_time": "2:46:48", "throughput": 2329.06, "total_tokens": 15413680} {"current_steps": 26730, "total_steps": 67140, "loss": 0.6769, "lr": 3.764268182079603e-05, "epoch": 3.9812332439678286, "percentage": 39.81, "elapsed_time": "1:50:19", "remaining_time": "2:46:46", "throughput": 2329.09, "total_tokens": 15416592} {"current_steps": 26735, "total_steps": 67140, "loss": 0.5161, "lr": 3.7637074808522365e-05, "epoch": 3.9819779565087874, "percentage": 39.82, "elapsed_time": "1:50:20", "remaining_time": "2:46:45", "throughput": 2329.16, "total_tokens": 15419792} {"current_steps": 26740, "total_steps": 67140, "loss": 0.7121, "lr": 3.763146694228657e-05, "epoch": 3.982722669049747, "percentage": 39.83, "elapsed_time": "1:50:21", "remaining_time": "2:46:43", "throughput": 2329.17, "total_tokens": 15422352} {"current_steps": 26745, "total_steps": 67140, "loss": 0.5629, "lr": 3.762585822246758e-05, "epoch": 3.983467381590706, "percentage": 39.83, "elapsed_time": "1:50:22", "remaining_time": "2:46:42", "throughput": 2329.2, "total_tokens": 15425232} {"current_steps": 26750, "total_steps": 67140, "loss": 0.8016, "lr": 3.762024864944443e-05, "epoch": 3.9842120941316654, "percentage": 39.84, "elapsed_time": "1:50:23", "remaining_time": "2:46:41", "throughput": 2329.23, "total_tokens": 15428016} {"current_steps": 26755, "total_steps": 67140, "loss": 0.5651, "lr": 3.761463822359619e-05, "epoch": 3.984956806672624, "percentage": 39.85, "elapsed_time": "1:50:24", "remaining_time": "2:46:39", "throughput": 2329.23, "total_tokens": 15430576} {"current_steps": 26760, "total_steps": 67140, "loss": 0.7401, "lr": 3.760902694530198e-05, "epoch": 3.9857015192135834, "percentage": 39.86, "elapsed_time": "1:50:25", "remaining_time": "2:46:38", "throughput": 2329.26, "total_tokens": 15433424} {"current_steps": 26765, "total_steps": 67140, "loss": 0.6337, "lr": 3.7603414814940995e-05, "epoch": 3.9864462317545426, "percentage": 39.86, "elapsed_time": "1:50:27", "remaining_time": "2:46:36", "throughput": 2329.32, "total_tokens": 15436528} {"current_steps": 26770, "total_steps": 67140, "loss": 0.7574, "lr": 3.7597801832892475e-05, "epoch": 3.987190944295502, "percentage": 39.87, "elapsed_time": "1:50:28", "remaining_time": "2:46:35", "throughput": 2329.37, "total_tokens": 15439600} {"current_steps": 26775, "total_steps": 67140, "loss": 0.6838, "lr": 3.759218799953574e-05, "epoch": 3.987935656836461, "percentage": 39.88, "elapsed_time": "1:50:29", "remaining_time": "2:46:34", "throughput": 2329.4, "total_tokens": 15442416} {"current_steps": 26780, "total_steps": 67140, "loss": 0.7172, "lr": 3.758657331525012e-05, "epoch": 3.98868036937742, "percentage": 39.89, "elapsed_time": "1:50:30", "remaining_time": "2:46:32", "throughput": 2329.45, "total_tokens": 15445392} {"current_steps": 26785, "total_steps": 67140, "loss": 0.5644, "lr": 3.758095778041506e-05, "epoch": 3.9894250819183794, "percentage": 39.89, "elapsed_time": "1:50:31", "remaining_time": "2:46:31", "throughput": 2329.48, "total_tokens": 15448272} {"current_steps": 26790, "total_steps": 67140, "loss": 0.4421, "lr": 3.757534139541002e-05, "epoch": 3.9901697944593386, "percentage": 39.9, "elapsed_time": "1:50:32", "remaining_time": "2:46:30", "throughput": 2329.52, "total_tokens": 15451184} {"current_steps": 26795, "total_steps": 67140, "loss": 0.5798, "lr": 3.7569724160614536e-05, "epoch": 3.990914507000298, "percentage": 39.91, "elapsed_time": "1:50:33", "remaining_time": "2:46:28", "throughput": 2329.57, "total_tokens": 15454256} {"current_steps": 26800, "total_steps": 67140, "loss": 0.7363, "lr": 3.75641060764082e-05, "epoch": 3.991659219541257, "percentage": 39.92, "elapsed_time": "1:50:35", "remaining_time": "2:46:27", "throughput": 2329.58, "total_tokens": 15456848} {"current_steps": 26805, "total_steps": 67140, "loss": 0.5894, "lr": 3.755848714317065e-05, "epoch": 3.9924039320822162, "percentage": 39.92, "elapsed_time": "1:50:36", "remaining_time": "2:46:25", "throughput": 2329.59, "total_tokens": 15459536} {"current_steps": 26810, "total_steps": 67140, "loss": 0.6654, "lr": 3.75528673612816e-05, "epoch": 3.9931486446231754, "percentage": 39.93, "elapsed_time": "1:50:37", "remaining_time": "2:46:24", "throughput": 2329.64, "total_tokens": 15462640} {"current_steps": 26815, "total_steps": 67140, "loss": 0.7152, "lr": 3.7547246731120816e-05, "epoch": 3.9938933571641346, "percentage": 39.94, "elapsed_time": "1:50:38", "remaining_time": "2:46:23", "throughput": 2329.68, "total_tokens": 15465584} {"current_steps": 26820, "total_steps": 67140, "loss": 0.8004, "lr": 3.7541625253068117e-05, "epoch": 3.994638069705094, "percentage": 39.95, "elapsed_time": "1:50:39", "remaining_time": "2:46:21", "throughput": 2329.73, "total_tokens": 15468592} {"current_steps": 26825, "total_steps": 67140, "loss": 0.7465, "lr": 3.7536002927503354e-05, "epoch": 3.995382782246053, "percentage": 39.95, "elapsed_time": "1:50:40", "remaining_time": "2:46:20", "throughput": 2329.76, "total_tokens": 15471408} {"current_steps": 26830, "total_steps": 67140, "loss": 0.6825, "lr": 3.7530379754806494e-05, "epoch": 3.9961274947870122, "percentage": 39.96, "elapsed_time": "1:50:41", "remaining_time": "2:46:18", "throughput": 2329.81, "total_tokens": 15474384} {"current_steps": 26835, "total_steps": 67140, "loss": 0.6626, "lr": 3.752475573535752e-05, "epoch": 3.9968722073279714, "percentage": 39.97, "elapsed_time": "1:50:43", "remaining_time": "2:46:17", "throughput": 2329.85, "total_tokens": 15477264} {"current_steps": 26840, "total_steps": 67140, "loss": 0.609, "lr": 3.7519130869536465e-05, "epoch": 3.9976169198689306, "percentage": 39.98, "elapsed_time": "1:50:44", "remaining_time": "2:46:16", "throughput": 2329.9, "total_tokens": 15480272} {"current_steps": 26845, "total_steps": 67140, "loss": 0.6716, "lr": 3.751350515772344e-05, "epoch": 3.99836163240989, "percentage": 39.98, "elapsed_time": "1:50:45", "remaining_time": "2:46:14", "throughput": 2329.92, "total_tokens": 15483024} {"current_steps": 26850, "total_steps": 67140, "loss": 0.5745, "lr": 3.7507878600298626e-05, "epoch": 3.999106344950849, "percentage": 39.99, "elapsed_time": "1:50:46", "remaining_time": "2:46:13", "throughput": 2329.93, "total_tokens": 15485680} {"current_steps": 26855, "total_steps": 67140, "loss": 0.6451, "lr": 3.750225119764223e-05, "epoch": 3.9998510574918082, "percentage": 40.0, "elapsed_time": "1:50:47", "remaining_time": "2:46:12", "throughput": 2330.0, "total_tokens": 15488912} {"current_steps": 26856, "total_steps": 67140, "eval_loss": 0.6477048397064209, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "1:52:02", "remaining_time": "2:48:03", "throughput": 2304.2, "total_tokens": 15489040} {"current_steps": 26860, "total_steps": 67140, "loss": 0.7113, "lr": 3.749662295013452e-05, "epoch": 4.000595770032767, "percentage": 40.01, "elapsed_time": "1:52:06", "remaining_time": "2:48:06", "throughput": 2303.21, "total_tokens": 15491568} {"current_steps": 26865, "total_steps": 67140, "loss": 0.6548, "lr": 3.7490993858155837e-05, "epoch": 4.001340482573727, "percentage": 40.01, "elapsed_time": "1:52:07", "remaining_time": "2:48:05", "throughput": 2303.27, "total_tokens": 15494608} {"current_steps": 26870, "total_steps": 67140, "loss": 0.5661, "lr": 3.748536392208658e-05, "epoch": 4.002085195114685, "percentage": 40.02, "elapsed_time": "1:52:08", "remaining_time": "2:48:03", "throughput": 2303.34, "total_tokens": 15497744} {"current_steps": 26875, "total_steps": 67140, "loss": 0.6105, "lr": 3.74797331423072e-05, "epoch": 4.002829907655645, "percentage": 40.03, "elapsed_time": "1:52:09", "remaining_time": "2:48:02", "throughput": 2303.38, "total_tokens": 15500624} {"current_steps": 26880, "total_steps": 67140, "loss": 0.6949, "lr": 3.747410151919817e-05, "epoch": 4.003574620196604, "percentage": 40.04, "elapsed_time": "1:52:10", "remaining_time": "2:48:01", "throughput": 2303.45, "total_tokens": 15503856} {"current_steps": 26885, "total_steps": 67140, "loss": 0.6145, "lr": 3.746846905314009e-05, "epoch": 4.0043193327375635, "percentage": 40.04, "elapsed_time": "1:52:11", "remaining_time": "2:47:59", "throughput": 2303.49, "total_tokens": 15506704} {"current_steps": 26890, "total_steps": 67140, "loss": 0.7355, "lr": 3.746283574451356e-05, "epoch": 4.005064045278522, "percentage": 40.05, "elapsed_time": "1:52:12", "remaining_time": "2:47:58", "throughput": 2303.52, "total_tokens": 15509488} {"current_steps": 26895, "total_steps": 67140, "loss": 0.6375, "lr": 3.7457201593699264e-05, "epoch": 4.005808757819482, "percentage": 40.06, "elapsed_time": "1:52:14", "remaining_time": "2:47:56", "throughput": 2303.55, "total_tokens": 15512272} {"current_steps": 26900, "total_steps": 67140, "loss": 0.7449, "lr": 3.7451566601077936e-05, "epoch": 4.006553470360441, "percentage": 40.07, "elapsed_time": "1:52:15", "remaining_time": "2:47:55", "throughput": 2303.58, "total_tokens": 15515120} {"current_steps": 26905, "total_steps": 67140, "loss": 0.8259, "lr": 3.744593076703035e-05, "epoch": 4.0072981829014, "percentage": 40.07, "elapsed_time": "1:52:16", "remaining_time": "2:47:53", "throughput": 2303.61, "total_tokens": 15517936} {"current_steps": 26910, "total_steps": 67140, "loss": 0.75, "lr": 3.744029409193737e-05, "epoch": 4.008042895442359, "percentage": 40.08, "elapsed_time": "1:52:17", "remaining_time": "2:47:52", "throughput": 2303.63, "total_tokens": 15520624} {"current_steps": 26915, "total_steps": 67140, "loss": 0.6046, "lr": 3.7434656576179894e-05, "epoch": 4.008787607983319, "percentage": 40.09, "elapsed_time": "1:52:18", "remaining_time": "2:47:50", "throughput": 2303.68, "total_tokens": 15523600} {"current_steps": 26920, "total_steps": 67140, "loss": 0.6862, "lr": 3.742901822013889e-05, "epoch": 4.009532320524277, "percentage": 40.1, "elapsed_time": "1:52:19", "remaining_time": "2:47:49", "throughput": 2303.71, "total_tokens": 15526320} {"current_steps": 26925, "total_steps": 67140, "loss": 0.6967, "lr": 3.7423379024195355e-05, "epoch": 4.010277033065237, "percentage": 40.1, "elapsed_time": "1:52:20", "remaining_time": "2:47:48", "throughput": 2303.76, "total_tokens": 15529264} {"current_steps": 26930, "total_steps": 67140, "loss": 0.5817, "lr": 3.7417738988730375e-05, "epoch": 4.011021745606196, "percentage": 40.11, "elapsed_time": "1:52:21", "remaining_time": "2:47:46", "throughput": 2303.78, "total_tokens": 15532048} {"current_steps": 26935, "total_steps": 67140, "loss": 0.6301, "lr": 3.7412098114125094e-05, "epoch": 4.0117664581471555, "percentage": 40.12, "elapsed_time": "1:52:23", "remaining_time": "2:47:45", "throughput": 2303.81, "total_tokens": 15534864} {"current_steps": 26940, "total_steps": 67140, "loss": 0.5442, "lr": 3.740645640076068e-05, "epoch": 4.012511170688114, "percentage": 40.13, "elapsed_time": "1:52:24", "remaining_time": "2:47:43", "throughput": 2303.86, "total_tokens": 15537776} {"current_steps": 26945, "total_steps": 67140, "loss": 0.6191, "lr": 3.740081384901837e-05, "epoch": 4.013255883229074, "percentage": 40.13, "elapsed_time": "1:52:25", "remaining_time": "2:47:42", "throughput": 2303.89, "total_tokens": 15540560} {"current_steps": 26950, "total_steps": 67140, "loss": 0.6101, "lr": 3.7395170459279494e-05, "epoch": 4.014000595770033, "percentage": 40.14, "elapsed_time": "1:52:26", "remaining_time": "2:47:40", "throughput": 2303.94, "total_tokens": 15543568} {"current_steps": 26955, "total_steps": 67140, "loss": 0.6724, "lr": 3.738952623192539e-05, "epoch": 4.014745308310992, "percentage": 40.15, "elapsed_time": "1:52:27", "remaining_time": "2:47:39", "throughput": 2303.99, "total_tokens": 15546544} {"current_steps": 26960, "total_steps": 67140, "loss": 0.536, "lr": 3.738388116733748e-05, "epoch": 4.015490020851951, "percentage": 40.15, "elapsed_time": "1:52:28", "remaining_time": "2:47:38", "throughput": 2304.06, "total_tokens": 15549744} {"current_steps": 26965, "total_steps": 67140, "loss": 0.7443, "lr": 3.737823526589722e-05, "epoch": 4.016234733392911, "percentage": 40.16, "elapsed_time": "1:52:30", "remaining_time": "2:47:36", "throughput": 2304.12, "total_tokens": 15552912} {"current_steps": 26970, "total_steps": 67140, "loss": 0.4248, "lr": 3.737258852798615e-05, "epoch": 4.0169794459338695, "percentage": 40.17, "elapsed_time": "1:52:31", "remaining_time": "2:47:35", "throughput": 2304.15, "total_tokens": 15555696} {"current_steps": 26975, "total_steps": 67140, "loss": 0.625, "lr": 3.736694095398585e-05, "epoch": 4.017724158474829, "percentage": 40.18, "elapsed_time": "1:52:32", "remaining_time": "2:47:33", "throughput": 2304.19, "total_tokens": 15558608} {"current_steps": 26980, "total_steps": 67140, "loss": 0.5117, "lr": 3.736129254427796e-05, "epoch": 4.018468871015788, "percentage": 40.18, "elapsed_time": "1:52:33", "remaining_time": "2:47:32", "throughput": 2304.2, "total_tokens": 15561168} {"current_steps": 26985, "total_steps": 67140, "loss": 0.6862, "lr": 3.735564329924419e-05, "epoch": 4.0192135835567475, "percentage": 40.19, "elapsed_time": "1:52:34", "remaining_time": "2:47:31", "throughput": 2304.24, "total_tokens": 15564016} {"current_steps": 26990, "total_steps": 67140, "loss": 0.6184, "lr": 3.734999321926626e-05, "epoch": 4.019958296097706, "percentage": 40.2, "elapsed_time": "1:52:35", "remaining_time": "2:47:29", "throughput": 2304.3, "total_tokens": 15567088} {"current_steps": 26995, "total_steps": 67140, "loss": 0.5276, "lr": 3.7344342304726014e-05, "epoch": 4.020703008638666, "percentage": 40.21, "elapsed_time": "1:52:36", "remaining_time": "2:47:28", "throughput": 2304.34, "total_tokens": 15570128} {"current_steps": 27000, "total_steps": 67140, "loss": 0.5292, "lr": 3.73386905560053e-05, "epoch": 4.021447721179625, "percentage": 40.21, "elapsed_time": "1:52:37", "remaining_time": "2:47:26", "throughput": 2304.37, "total_tokens": 15572912} {"current_steps": 27005, "total_steps": 67140, "loss": 0.6736, "lr": 3.733303797348604e-05, "epoch": 4.022192433720583, "percentage": 40.22, "elapsed_time": "1:52:39", "remaining_time": "2:47:25", "throughput": 2304.44, "total_tokens": 15576080} {"current_steps": 27010, "total_steps": 67140, "loss": 0.713, "lr": 3.732738455755022e-05, "epoch": 4.022937146261543, "percentage": 40.23, "elapsed_time": "1:52:40", "remaining_time": "2:47:24", "throughput": 2304.49, "total_tokens": 15579056} {"current_steps": 27015, "total_steps": 67140, "loss": 0.7387, "lr": 3.732173030857987e-05, "epoch": 4.023681858802502, "percentage": 40.24, "elapsed_time": "1:52:41", "remaining_time": "2:47:22", "throughput": 2304.54, "total_tokens": 15582064} {"current_steps": 27020, "total_steps": 67140, "loss": 0.7922, "lr": 3.731607522695709e-05, "epoch": 4.0244265713434615, "percentage": 40.24, "elapsed_time": "1:52:42", "remaining_time": "2:47:21", "throughput": 2304.59, "total_tokens": 15585072} {"current_steps": 27025, "total_steps": 67140, "loss": 0.5884, "lr": 3.731041931306401e-05, "epoch": 4.02517128388442, "percentage": 40.25, "elapsed_time": "1:52:43", "remaining_time": "2:47:19", "throughput": 2304.64, "total_tokens": 15588080} {"current_steps": 27030, "total_steps": 67140, "loss": 0.5583, "lr": 3.730476256728284e-05, "epoch": 4.02591599642538, "percentage": 40.26, "elapsed_time": "1:52:44", "remaining_time": "2:47:18", "throughput": 2304.67, "total_tokens": 15590864} {"current_steps": 27035, "total_steps": 67140, "loss": 0.539, "lr": 3.729910498999585e-05, "epoch": 4.026660708966339, "percentage": 40.27, "elapsed_time": "1:52:46", "remaining_time": "2:47:17", "throughput": 2304.7, "total_tokens": 15593648} {"current_steps": 27040, "total_steps": 67140, "loss": 0.6956, "lr": 3.729344658158535e-05, "epoch": 4.027405421507298, "percentage": 40.27, "elapsed_time": "1:52:47", "remaining_time": "2:47:15", "throughput": 2304.76, "total_tokens": 15596720} {"current_steps": 27045, "total_steps": 67140, "loss": 0.4805, "lr": 3.7287787342433706e-05, "epoch": 4.028150134048257, "percentage": 40.28, "elapsed_time": "1:52:48", "remaining_time": "2:47:14", "throughput": 2304.83, "total_tokens": 15599920} {"current_steps": 27050, "total_steps": 67140, "loss": 0.4561, "lr": 3.728212727292336e-05, "epoch": 4.028894846589217, "percentage": 40.29, "elapsed_time": "1:52:49", "remaining_time": "2:47:12", "throughput": 2304.89, "total_tokens": 15603024} {"current_steps": 27055, "total_steps": 67140, "loss": 0.5183, "lr": 3.727646637343678e-05, "epoch": 4.0296395591301755, "percentage": 40.3, "elapsed_time": "1:52:50", "remaining_time": "2:47:11", "throughput": 2304.95, "total_tokens": 15606192} {"current_steps": 27060, "total_steps": 67140, "loss": 0.7007, "lr": 3.727080464435652e-05, "epoch": 4.030384271671135, "percentage": 40.3, "elapsed_time": "1:52:51", "remaining_time": "2:47:10", "throughput": 2304.99, "total_tokens": 15609136} {"current_steps": 27065, "total_steps": 67140, "loss": 0.618, "lr": 3.726514208606517e-05, "epoch": 4.031128984212094, "percentage": 40.31, "elapsed_time": "1:52:52", "remaining_time": "2:47:08", "throughput": 2305.01, "total_tokens": 15611824} {"current_steps": 27070, "total_steps": 67140, "loss": 0.6923, "lr": 3.725947869894538e-05, "epoch": 4.0318736967530535, "percentage": 40.32, "elapsed_time": "1:52:54", "remaining_time": "2:47:07", "throughput": 2305.07, "total_tokens": 15614992} {"current_steps": 27075, "total_steps": 67140, "loss": 0.7013, "lr": 3.725381448337987e-05, "epoch": 4.032618409294012, "percentage": 40.33, "elapsed_time": "1:52:55", "remaining_time": "2:47:05", "throughput": 2305.09, "total_tokens": 15617616} {"current_steps": 27080, "total_steps": 67140, "loss": 0.4963, "lr": 3.72481494397514e-05, "epoch": 4.033363121834972, "percentage": 40.33, "elapsed_time": "1:52:56", "remaining_time": "2:47:04", "throughput": 2305.1, "total_tokens": 15620176} {"current_steps": 27085, "total_steps": 67140, "loss": 0.5251, "lr": 3.724248356844278e-05, "epoch": 4.034107834375931, "percentage": 40.34, "elapsed_time": "1:52:57", "remaining_time": "2:47:02", "throughput": 2305.13, "total_tokens": 15623024} {"current_steps": 27090, "total_steps": 67140, "loss": 0.6475, "lr": 3.7236816869836896e-05, "epoch": 4.03485254691689, "percentage": 40.35, "elapsed_time": "1:52:58", "remaining_time": "2:47:01", "throughput": 2305.22, "total_tokens": 15626448} {"current_steps": 27095, "total_steps": 67140, "loss": 0.6974, "lr": 3.723114934431669e-05, "epoch": 4.035597259457849, "percentage": 40.36, "elapsed_time": "1:52:59", "remaining_time": "2:47:00", "throughput": 2305.26, "total_tokens": 15629360} {"current_steps": 27100, "total_steps": 67140, "loss": 0.5527, "lr": 3.7225480992265125e-05, "epoch": 4.036341971998809, "percentage": 40.36, "elapsed_time": "1:53:00", "remaining_time": "2:46:58", "throughput": 2305.31, "total_tokens": 15632272} {"current_steps": 27105, "total_steps": 67140, "loss": 0.5131, "lr": 3.721981181406526e-05, "epoch": 4.0370866845397675, "percentage": 40.37, "elapsed_time": "1:53:02", "remaining_time": "2:46:57", "throughput": 2305.37, "total_tokens": 15635408} {"current_steps": 27110, "total_steps": 67140, "loss": 0.5928, "lr": 3.721414181010021e-05, "epoch": 4.037831397080727, "percentage": 40.38, "elapsed_time": "1:53:03", "remaining_time": "2:46:56", "throughput": 2305.43, "total_tokens": 15638480} {"current_steps": 27115, "total_steps": 67140, "loss": 0.7019, "lr": 3.72084709807531e-05, "epoch": 4.038576109621686, "percentage": 40.39, "elapsed_time": "1:53:04", "remaining_time": "2:46:54", "throughput": 2305.47, "total_tokens": 15641392} {"current_steps": 27120, "total_steps": 67140, "loss": 0.6184, "lr": 3.720279932640717e-05, "epoch": 4.0393208221626455, "percentage": 40.39, "elapsed_time": "1:53:05", "remaining_time": "2:46:53", "throughput": 2305.53, "total_tokens": 15644464} {"current_steps": 27125, "total_steps": 67140, "loss": 0.5785, "lr": 3.7197126847445664e-05, "epoch": 4.040065534703604, "percentage": 40.4, "elapsed_time": "1:53:06", "remaining_time": "2:46:51", "throughput": 2305.56, "total_tokens": 15647280} {"current_steps": 27130, "total_steps": 67140, "loss": 0.6394, "lr": 3.719145354425192e-05, "epoch": 4.040810247244564, "percentage": 40.41, "elapsed_time": "1:53:07", "remaining_time": "2:46:50", "throughput": 2305.6, "total_tokens": 15650256} {"current_steps": 27135, "total_steps": 67140, "loss": 0.7781, "lr": 3.718577941720931e-05, "epoch": 4.041554959785523, "percentage": 40.42, "elapsed_time": "1:53:09", "remaining_time": "2:46:49", "throughput": 2305.65, "total_tokens": 15653232} {"current_steps": 27140, "total_steps": 67140, "loss": 0.499, "lr": 3.7180104466701274e-05, "epoch": 4.042299672326482, "percentage": 40.42, "elapsed_time": "1:53:10", "remaining_time": "2:46:47", "throughput": 2305.68, "total_tokens": 15655952} {"current_steps": 27145, "total_steps": 67140, "loss": 0.8341, "lr": 3.71744286931113e-05, "epoch": 4.043044384867441, "percentage": 40.43, "elapsed_time": "1:53:11", "remaining_time": "2:46:46", "throughput": 2305.73, "total_tokens": 15658896} {"current_steps": 27150, "total_steps": 67140, "loss": 0.7449, "lr": 3.7168752096822924e-05, "epoch": 4.043789097408401, "percentage": 40.44, "elapsed_time": "1:53:12", "remaining_time": "2:46:44", "throughput": 2305.77, "total_tokens": 15661872} {"current_steps": 27155, "total_steps": 67140, "loss": 0.7857, "lr": 3.716307467821976e-05, "epoch": 4.0445338099493595, "percentage": 40.45, "elapsed_time": "1:53:13", "remaining_time": "2:46:43", "throughput": 2305.82, "total_tokens": 15664848} {"current_steps": 27160, "total_steps": 67140, "loss": 0.602, "lr": 3.7157396437685465e-05, "epoch": 4.045278522490319, "percentage": 40.45, "elapsed_time": "1:53:14", "remaining_time": "2:46:41", "throughput": 2305.85, "total_tokens": 15667600} {"current_steps": 27165, "total_steps": 67140, "loss": 0.815, "lr": 3.715171737560374e-05, "epoch": 4.046023235031278, "percentage": 40.46, "elapsed_time": "1:53:15", "remaining_time": "2:46:40", "throughput": 2305.89, "total_tokens": 15670512} {"current_steps": 27170, "total_steps": 67140, "loss": 0.5381, "lr": 3.7146037492358366e-05, "epoch": 4.046767947572237, "percentage": 40.47, "elapsed_time": "1:53:16", "remaining_time": "2:46:39", "throughput": 2305.9, "total_tokens": 15673072} {"current_steps": 27175, "total_steps": 67140, "loss": 0.7189, "lr": 3.714035678833316e-05, "epoch": 4.047512660113196, "percentage": 40.48, "elapsed_time": "1:53:18", "remaining_time": "2:46:37", "throughput": 2305.91, "total_tokens": 15675728} {"current_steps": 27180, "total_steps": 67140, "loss": 0.6788, "lr": 3.7134675263912e-05, "epoch": 4.048257372654155, "percentage": 40.48, "elapsed_time": "1:53:19", "remaining_time": "2:46:36", "throughput": 2305.93, "total_tokens": 15678320} {"current_steps": 27185, "total_steps": 67140, "loss": 0.6816, "lr": 3.712899291947882e-05, "epoch": 4.049002085195115, "percentage": 40.49, "elapsed_time": "1:53:20", "remaining_time": "2:46:34", "throughput": 2305.98, "total_tokens": 15681360} {"current_steps": 27190, "total_steps": 67140, "loss": 0.6064, "lr": 3.7123309755417615e-05, "epoch": 4.0497467977360735, "percentage": 40.5, "elapsed_time": "1:53:21", "remaining_time": "2:46:33", "throughput": 2306.02, "total_tokens": 15684208} {"current_steps": 27195, "total_steps": 67140, "loss": 0.5884, "lr": 3.7117625772112416e-05, "epoch": 4.050491510277033, "percentage": 40.5, "elapsed_time": "1:53:22", "remaining_time": "2:46:31", "throughput": 2306.1, "total_tokens": 15687632} {"current_steps": 27200, "total_steps": 67140, "loss": 0.627, "lr": 3.711194096994736e-05, "epoch": 4.051236222817992, "percentage": 40.51, "elapsed_time": "1:53:23", "remaining_time": "2:46:30", "throughput": 2306.13, "total_tokens": 15690352} {"current_steps": 27205, "total_steps": 67140, "loss": 0.7244, "lr": 3.710625534930655e-05, "epoch": 4.0519809353589515, "percentage": 40.52, "elapsed_time": "1:53:24", "remaining_time": "2:46:29", "throughput": 2306.15, "total_tokens": 15693040} {"current_steps": 27210, "total_steps": 67140, "loss": 0.4943, "lr": 3.710056891057423e-05, "epoch": 4.05272564789991, "percentage": 40.53, "elapsed_time": "1:53:26", "remaining_time": "2:46:27", "throughput": 2306.23, "total_tokens": 15696400} {"current_steps": 27215, "total_steps": 67140, "loss": 0.5981, "lr": 3.709488165413467e-05, "epoch": 4.05347036044087, "percentage": 40.53, "elapsed_time": "1:53:27", "remaining_time": "2:46:26", "throughput": 2306.29, "total_tokens": 15699568} {"current_steps": 27220, "total_steps": 67140, "loss": 0.5825, "lr": 3.708919358037218e-05, "epoch": 4.054215072981829, "percentage": 40.54, "elapsed_time": "1:53:28", "remaining_time": "2:46:24", "throughput": 2306.31, "total_tokens": 15702224} {"current_steps": 27225, "total_steps": 67140, "loss": 0.7578, "lr": 3.708350468967113e-05, "epoch": 4.054959785522788, "percentage": 40.55, "elapsed_time": "1:53:29", "remaining_time": "2:46:23", "throughput": 2306.37, "total_tokens": 15705360} {"current_steps": 27230, "total_steps": 67140, "loss": 0.7126, "lr": 3.707781498241596e-05, "epoch": 4.055704498063747, "percentage": 40.56, "elapsed_time": "1:53:30", "remaining_time": "2:46:22", "throughput": 2306.41, "total_tokens": 15708304} {"current_steps": 27235, "total_steps": 67140, "loss": 0.5667, "lr": 3.707212445899116e-05, "epoch": 4.056449210604707, "percentage": 40.56, "elapsed_time": "1:53:31", "remaining_time": "2:46:20", "throughput": 2306.45, "total_tokens": 15711152} {"current_steps": 27240, "total_steps": 67140, "loss": 0.7164, "lr": 3.7066433119781286e-05, "epoch": 4.0571939231456655, "percentage": 40.57, "elapsed_time": "1:53:32", "remaining_time": "2:46:19", "throughput": 2306.48, "total_tokens": 15714000} {"current_steps": 27245, "total_steps": 67140, "loss": 0.7122, "lr": 3.70607409651709e-05, "epoch": 4.057938635686625, "percentage": 40.58, "elapsed_time": "1:53:34", "remaining_time": "2:46:17", "throughput": 2306.5, "total_tokens": 15716656} {"current_steps": 27250, "total_steps": 67140, "loss": 0.4699, "lr": 3.705504799554469e-05, "epoch": 4.058683348227584, "percentage": 40.59, "elapsed_time": "1:53:35", "remaining_time": "2:46:16", "throughput": 2306.53, "total_tokens": 15719440} {"current_steps": 27255, "total_steps": 67140, "loss": 0.56, "lr": 3.704935421128734e-05, "epoch": 4.059428060768544, "percentage": 40.59, "elapsed_time": "1:53:36", "remaining_time": "2:46:15", "throughput": 2306.57, "total_tokens": 15722288} {"current_steps": 27260, "total_steps": 67140, "loss": 0.6577, "lr": 3.704365961278363e-05, "epoch": 4.060172773309502, "percentage": 40.6, "elapsed_time": "1:53:37", "remaining_time": "2:46:13", "throughput": 2306.6, "total_tokens": 15725072} {"current_steps": 27265, "total_steps": 67140, "loss": 0.7138, "lr": 3.7037964200418365e-05, "epoch": 4.060917485850462, "percentage": 40.61, "elapsed_time": "1:53:38", "remaining_time": "2:46:12", "throughput": 2306.63, "total_tokens": 15727920} {"current_steps": 27270, "total_steps": 67140, "loss": 0.6847, "lr": 3.7032267974576415e-05, "epoch": 4.061662198391421, "percentage": 40.62, "elapsed_time": "1:53:39", "remaining_time": "2:46:10", "throughput": 2306.66, "total_tokens": 15730736} {"current_steps": 27275, "total_steps": 67140, "loss": 0.5235, "lr": 3.702657093564272e-05, "epoch": 4.06240691093238, "percentage": 40.62, "elapsed_time": "1:53:40", "remaining_time": "2:46:09", "throughput": 2306.7, "total_tokens": 15733552} {"current_steps": 27280, "total_steps": 67140, "loss": 0.6354, "lr": 3.702087308400226e-05, "epoch": 4.063151623473339, "percentage": 40.63, "elapsed_time": "1:53:41", "remaining_time": "2:46:07", "throughput": 2306.73, "total_tokens": 15736464} {"current_steps": 27285, "total_steps": 67140, "loss": 0.5655, "lr": 3.7015174420040074e-05, "epoch": 4.063896336014299, "percentage": 40.64, "elapsed_time": "1:53:43", "remaining_time": "2:46:06", "throughput": 2306.77, "total_tokens": 15739312} {"current_steps": 27290, "total_steps": 67140, "loss": 0.5895, "lr": 3.7009474944141244e-05, "epoch": 4.0646410485552575, "percentage": 40.65, "elapsed_time": "1:53:44", "remaining_time": "2:46:05", "throughput": 2306.85, "total_tokens": 15742672} {"current_steps": 27295, "total_steps": 67140, "loss": 0.6019, "lr": 3.7003774656690924e-05, "epoch": 4.065385761096217, "percentage": 40.65, "elapsed_time": "1:53:45", "remaining_time": "2:46:03", "throughput": 2306.88, "total_tokens": 15745488} {"current_steps": 27300, "total_steps": 67140, "loss": 0.7128, "lr": 3.699807355807432e-05, "epoch": 4.066130473637176, "percentage": 40.66, "elapsed_time": "1:53:46", "remaining_time": "2:46:02", "throughput": 2306.91, "total_tokens": 15748240} {"current_steps": 27305, "total_steps": 67140, "loss": 0.7489, "lr": 3.6992371648676685e-05, "epoch": 4.066875186178136, "percentage": 40.67, "elapsed_time": "1:53:47", "remaining_time": "2:46:00", "throughput": 2306.95, "total_tokens": 15751088} {"current_steps": 27310, "total_steps": 67140, "loss": 0.6828, "lr": 3.698666892888332e-05, "epoch": 4.067619898719094, "percentage": 40.68, "elapsed_time": "1:53:48", "remaining_time": "2:45:59", "throughput": 2307.0, "total_tokens": 15754192} {"current_steps": 27315, "total_steps": 67140, "loss": 0.6506, "lr": 3.698096539907962e-05, "epoch": 4.068364611260054, "percentage": 40.68, "elapsed_time": "1:53:49", "remaining_time": "2:45:58", "throughput": 2307.03, "total_tokens": 15756976} {"current_steps": 27320, "total_steps": 67140, "loss": 0.7272, "lr": 3.6975261059650986e-05, "epoch": 4.069109323801013, "percentage": 40.69, "elapsed_time": "1:53:51", "remaining_time": "2:45:56", "throughput": 2307.1, "total_tokens": 15760144} {"current_steps": 27325, "total_steps": 67140, "loss": 0.6906, "lr": 3.696955591098289e-05, "epoch": 4.069854036341972, "percentage": 40.7, "elapsed_time": "1:53:52", "remaining_time": "2:45:55", "throughput": 2307.14, "total_tokens": 15763056} {"current_steps": 27330, "total_steps": 67140, "loss": 0.5584, "lr": 3.696384995346087e-05, "epoch": 4.070598748882931, "percentage": 40.71, "elapsed_time": "1:53:53", "remaining_time": "2:45:53", "throughput": 2307.15, "total_tokens": 15765680} {"current_steps": 27335, "total_steps": 67140, "loss": 0.5773, "lr": 3.6958143187470514e-05, "epoch": 4.071343461423891, "percentage": 40.71, "elapsed_time": "1:53:54", "remaining_time": "2:45:52", "throughput": 2307.17, "total_tokens": 15768368} {"current_steps": 27340, "total_steps": 67140, "loss": 0.5582, "lr": 3.695243561339747e-05, "epoch": 4.07208817396485, "percentage": 40.72, "elapsed_time": "1:53:55", "remaining_time": "2:45:50", "throughput": 2307.23, "total_tokens": 15771472} {"current_steps": 27345, "total_steps": 67140, "loss": 0.644, "lr": 3.694672723162741e-05, "epoch": 4.072832886505808, "percentage": 40.73, "elapsed_time": "1:53:56", "remaining_time": "2:45:49", "throughput": 2307.27, "total_tokens": 15774448} {"current_steps": 27350, "total_steps": 67140, "loss": 0.6728, "lr": 3.69410180425461e-05, "epoch": 4.073577599046768, "percentage": 40.74, "elapsed_time": "1:53:57", "remaining_time": "2:45:48", "throughput": 2307.32, "total_tokens": 15777392} {"current_steps": 27355, "total_steps": 67140, "loss": 0.5735, "lr": 3.693530804653934e-05, "epoch": 4.074322311587727, "percentage": 40.74, "elapsed_time": "1:53:59", "remaining_time": "2:45:46", "throughput": 2307.33, "total_tokens": 15780080} {"current_steps": 27360, "total_steps": 67140, "loss": 0.5824, "lr": 3.692959724399299e-05, "epoch": 4.075067024128686, "percentage": 40.75, "elapsed_time": "1:54:00", "remaining_time": "2:45:45", "throughput": 2307.37, "total_tokens": 15782992} {"current_steps": 27365, "total_steps": 67140, "loss": 0.5423, "lr": 3.692388563529295e-05, "epoch": 4.075811736669645, "percentage": 40.76, "elapsed_time": "1:54:01", "remaining_time": "2:45:43", "throughput": 2307.43, "total_tokens": 15786032} {"current_steps": 27370, "total_steps": 67140, "loss": 0.6213, "lr": 3.6918173220825204e-05, "epoch": 4.076556449210605, "percentage": 40.77, "elapsed_time": "1:54:02", "remaining_time": "2:45:42", "throughput": 2307.47, "total_tokens": 15788976} {"current_steps": 27375, "total_steps": 67140, "loss": 0.5579, "lr": 3.691246000097577e-05, "epoch": 4.0773011617515635, "percentage": 40.77, "elapsed_time": "1:54:03", "remaining_time": "2:45:41", "throughput": 2307.49, "total_tokens": 15791696} {"current_steps": 27380, "total_steps": 67140, "loss": 0.6474, "lr": 3.6906745976130716e-05, "epoch": 4.078045874292523, "percentage": 40.78, "elapsed_time": "1:54:04", "remaining_time": "2:45:39", "throughput": 2307.52, "total_tokens": 15794480} {"current_steps": 27385, "total_steps": 67140, "loss": 0.58, "lr": 3.6901031146676185e-05, "epoch": 4.078790586833482, "percentage": 40.79, "elapsed_time": "1:54:05", "remaining_time": "2:45:38", "throughput": 2307.54, "total_tokens": 15797136} {"current_steps": 27390, "total_steps": 67140, "loss": 0.6865, "lr": 3.689531551299835e-05, "epoch": 4.079535299374442, "percentage": 40.8, "elapsed_time": "1:54:06", "remaining_time": "2:45:36", "throughput": 2307.55, "total_tokens": 15799696} {"current_steps": 27395, "total_steps": 67140, "loss": 0.6217, "lr": 3.688959907548346e-05, "epoch": 4.0802800119154, "percentage": 40.8, "elapsed_time": "1:54:08", "remaining_time": "2:45:35", "throughput": 2307.61, "total_tokens": 15802832} {"current_steps": 27400, "total_steps": 67140, "loss": 0.5523, "lr": 3.68838818345178e-05, "epoch": 4.08102472445636, "percentage": 40.81, "elapsed_time": "1:54:09", "remaining_time": "2:45:33", "throughput": 2307.62, "total_tokens": 15805456} {"current_steps": 27405, "total_steps": 67140, "loss": 0.581, "lr": 3.6878163790487726e-05, "epoch": 4.081769436997319, "percentage": 40.82, "elapsed_time": "1:54:10", "remaining_time": "2:45:32", "throughput": 2307.68, "total_tokens": 15808464} {"current_steps": 27410, "total_steps": 67140, "loss": 0.5514, "lr": 3.6872444943779624e-05, "epoch": 4.082514149538278, "percentage": 40.83, "elapsed_time": "1:54:11", "remaining_time": "2:45:31", "throughput": 2307.7, "total_tokens": 15811184} {"current_steps": 27415, "total_steps": 67140, "loss": 0.728, "lr": 3.686672529477998e-05, "epoch": 4.083258862079237, "percentage": 40.83, "elapsed_time": "1:54:12", "remaining_time": "2:45:29", "throughput": 2307.74, "total_tokens": 15814096} {"current_steps": 27420, "total_steps": 67140, "loss": 0.5372, "lr": 3.686100484387528e-05, "epoch": 4.084003574620197, "percentage": 40.84, "elapsed_time": "1:54:13", "remaining_time": "2:45:28", "throughput": 2307.8, "total_tokens": 15817232} {"current_steps": 27425, "total_steps": 67140, "loss": 0.6693, "lr": 3.685528359145209e-05, "epoch": 4.084748287161156, "percentage": 40.85, "elapsed_time": "1:54:14", "remaining_time": "2:45:26", "throughput": 2307.85, "total_tokens": 15820208} {"current_steps": 27430, "total_steps": 67140, "loss": 0.481, "lr": 3.6849561537897045e-05, "epoch": 4.085492999702115, "percentage": 40.85, "elapsed_time": "1:54:16", "remaining_time": "2:45:25", "throughput": 2307.86, "total_tokens": 15822864} {"current_steps": 27435, "total_steps": 67140, "loss": 0.7588, "lr": 3.684383868359681e-05, "epoch": 4.086237712243074, "percentage": 40.86, "elapsed_time": "1:54:17", "remaining_time": "2:45:24", "throughput": 2307.95, "total_tokens": 15826256} {"current_steps": 27440, "total_steps": 67140, "loss": 0.6542, "lr": 3.68381150289381e-05, "epoch": 4.086982424784034, "percentage": 40.87, "elapsed_time": "1:54:18", "remaining_time": "2:45:22", "throughput": 2307.96, "total_tokens": 15828880} {"current_steps": 27445, "total_steps": 67140, "loss": 0.6227, "lr": 3.683239057430771e-05, "epoch": 4.087727137324992, "percentage": 40.88, "elapsed_time": "1:54:19", "remaining_time": "2:45:21", "throughput": 2307.99, "total_tokens": 15831760} {"current_steps": 27450, "total_steps": 67140, "loss": 0.6716, "lr": 3.6826665320092465e-05, "epoch": 4.088471849865952, "percentage": 40.88, "elapsed_time": "1:54:20", "remaining_time": "2:45:19", "throughput": 2308.06, "total_tokens": 15834992} {"current_steps": 27455, "total_steps": 67140, "loss": 0.6036, "lr": 3.682093926667927e-05, "epoch": 4.089216562406911, "percentage": 40.89, "elapsed_time": "1:54:21", "remaining_time": "2:45:18", "throughput": 2308.09, "total_tokens": 15837808} {"current_steps": 27460, "total_steps": 67140, "loss": 0.7112, "lr": 3.681521241445506e-05, "epoch": 4.08996127494787, "percentage": 40.9, "elapsed_time": "1:54:22", "remaining_time": "2:45:17", "throughput": 2308.12, "total_tokens": 15840528} {"current_steps": 27465, "total_steps": 67140, "loss": 0.6739, "lr": 3.6809484763806834e-05, "epoch": 4.090705987488829, "percentage": 40.91, "elapsed_time": "1:54:24", "remaining_time": "2:45:15", "throughput": 2308.12, "total_tokens": 15843120} {"current_steps": 27470, "total_steps": 67140, "loss": 0.6843, "lr": 3.680375631512164e-05, "epoch": 4.091450700029789, "percentage": 40.91, "elapsed_time": "1:54:25", "remaining_time": "2:45:14", "throughput": 2308.14, "total_tokens": 15845840} {"current_steps": 27475, "total_steps": 67140, "loss": 0.59, "lr": 3.679802706878658e-05, "epoch": 4.092195412570748, "percentage": 40.92, "elapsed_time": "1:54:26", "remaining_time": "2:45:12", "throughput": 2308.18, "total_tokens": 15848720} {"current_steps": 27480, "total_steps": 67140, "loss": 0.7528, "lr": 3.6792297025188824e-05, "epoch": 4.092940125111707, "percentage": 40.93, "elapsed_time": "1:54:27", "remaining_time": "2:45:11", "throughput": 2308.21, "total_tokens": 15851504} {"current_steps": 27485, "total_steps": 67140, "loss": 0.4858, "lr": 3.6786566184715576e-05, "epoch": 4.093684837652666, "percentage": 40.94, "elapsed_time": "1:54:28", "remaining_time": "2:45:09", "throughput": 2308.23, "total_tokens": 15854256} {"current_steps": 27490, "total_steps": 67140, "loss": 0.5944, "lr": 3.67808345477541e-05, "epoch": 4.094429550193626, "percentage": 40.94, "elapsed_time": "1:54:29", "remaining_time": "2:45:08", "throughput": 2308.28, "total_tokens": 15857168} {"current_steps": 27495, "total_steps": 67140, "loss": 0.5201, "lr": 3.6775102114691736e-05, "epoch": 4.095174262734584, "percentage": 40.95, "elapsed_time": "1:54:30", "remaining_time": "2:45:07", "throughput": 2308.31, "total_tokens": 15859984} {"current_steps": 27500, "total_steps": 67140, "loss": 0.5742, "lr": 3.676936888591583e-05, "epoch": 4.095918975275544, "percentage": 40.96, "elapsed_time": "1:54:31", "remaining_time": "2:45:05", "throughput": 2308.35, "total_tokens": 15862800} {"current_steps": 27505, "total_steps": 67140, "loss": 0.7449, "lr": 3.6763634861813836e-05, "epoch": 4.096663687816503, "percentage": 40.97, "elapsed_time": "1:54:33", "remaining_time": "2:45:04", "throughput": 2308.37, "total_tokens": 15865584} {"current_steps": 27510, "total_steps": 67140, "loss": 0.8086, "lr": 3.675790004277322e-05, "epoch": 4.0974084003574625, "percentage": 40.97, "elapsed_time": "1:54:34", "remaining_time": "2:45:02", "throughput": 2308.42, "total_tokens": 15868560} {"current_steps": 27515, "total_steps": 67140, "loss": 0.8226, "lr": 3.675216442918153e-05, "epoch": 4.098153112898421, "percentage": 40.98, "elapsed_time": "1:54:35", "remaining_time": "2:45:01", "throughput": 2308.44, "total_tokens": 15871280} {"current_steps": 27520, "total_steps": 67140, "loss": 0.5296, "lr": 3.674642802142635e-05, "epoch": 4.09889782543938, "percentage": 40.99, "elapsed_time": "1:54:36", "remaining_time": "2:44:59", "throughput": 2308.51, "total_tokens": 15874448} {"current_steps": 27525, "total_steps": 67140, "loss": 0.5949, "lr": 3.6740690819895304e-05, "epoch": 4.09964253798034, "percentage": 41.0, "elapsed_time": "1:54:37", "remaining_time": "2:44:58", "throughput": 2308.56, "total_tokens": 15877456} {"current_steps": 27530, "total_steps": 67140, "loss": 0.4719, "lr": 3.673495282497613e-05, "epoch": 4.100387250521298, "percentage": 41.0, "elapsed_time": "1:54:38", "remaining_time": "2:44:57", "throughput": 2308.61, "total_tokens": 15880464} {"current_steps": 27535, "total_steps": 67140, "loss": 0.4718, "lr": 3.672921403705654e-05, "epoch": 4.101131963062258, "percentage": 41.01, "elapsed_time": "1:54:39", "remaining_time": "2:44:55", "throughput": 2308.65, "total_tokens": 15883408} {"current_steps": 27540, "total_steps": 67140, "loss": 0.5255, "lr": 3.672347445652436e-05, "epoch": 4.101876675603217, "percentage": 41.02, "elapsed_time": "1:54:41", "remaining_time": "2:44:54", "throughput": 2308.71, "total_tokens": 15886416} {"current_steps": 27545, "total_steps": 67140, "loss": 0.6744, "lr": 3.671773408376743e-05, "epoch": 4.102621388144176, "percentage": 41.03, "elapsed_time": "1:54:42", "remaining_time": "2:44:52", "throughput": 2308.72, "total_tokens": 15889008} {"current_steps": 27550, "total_steps": 67140, "loss": 0.866, "lr": 3.671199291917368e-05, "epoch": 4.103366100685135, "percentage": 41.03, "elapsed_time": "1:54:43", "remaining_time": "2:44:51", "throughput": 2308.75, "total_tokens": 15891824} {"current_steps": 27555, "total_steps": 67140, "loss": 0.5095, "lr": 3.6706250963131065e-05, "epoch": 4.104110813226095, "percentage": 41.04, "elapsed_time": "1:54:44", "remaining_time": "2:44:49", "throughput": 2308.76, "total_tokens": 15894416} {"current_steps": 27560, "total_steps": 67140, "loss": 0.8919, "lr": 3.670050821602761e-05, "epoch": 4.104855525767054, "percentage": 41.05, "elapsed_time": "1:54:45", "remaining_time": "2:44:48", "throughput": 2308.79, "total_tokens": 15897232} {"current_steps": 27565, "total_steps": 67140, "loss": 0.5827, "lr": 3.669476467825137e-05, "epoch": 4.105600238308013, "percentage": 41.06, "elapsed_time": "1:54:46", "remaining_time": "2:44:47", "throughput": 2308.84, "total_tokens": 15900240} {"current_steps": 27570, "total_steps": 67140, "loss": 0.7303, "lr": 3.668902035019049e-05, "epoch": 4.106344950848972, "percentage": 41.06, "elapsed_time": "1:54:47", "remaining_time": "2:44:45", "throughput": 2308.92, "total_tokens": 15903600} {"current_steps": 27575, "total_steps": 67140, "loss": 0.5697, "lr": 3.668327523223313e-05, "epoch": 4.107089663389932, "percentage": 41.07, "elapsed_time": "1:54:49", "remaining_time": "2:44:44", "throughput": 2308.96, "total_tokens": 15906448} {"current_steps": 27580, "total_steps": 67140, "loss": 0.7025, "lr": 3.667752932476753e-05, "epoch": 4.10783437593089, "percentage": 41.08, "elapsed_time": "1:54:50", "remaining_time": "2:44:42", "throughput": 2308.97, "total_tokens": 15909040} {"current_steps": 27585, "total_steps": 67140, "loss": 0.5599, "lr": 3.667178262818198e-05, "epoch": 4.10857908847185, "percentage": 41.09, "elapsed_time": "1:54:51", "remaining_time": "2:44:41", "throughput": 2309.02, "total_tokens": 15912080} {"current_steps": 27590, "total_steps": 67140, "loss": 0.7527, "lr": 3.666603514286482e-05, "epoch": 4.109323801012809, "percentage": 41.09, "elapsed_time": "1:54:52", "remaining_time": "2:44:40", "throughput": 2309.06, "total_tokens": 15915024} {"current_steps": 27595, "total_steps": 67140, "loss": 0.5841, "lr": 3.666028686920443e-05, "epoch": 4.1100685135537685, "percentage": 41.1, "elapsed_time": "1:54:53", "remaining_time": "2:44:38", "throughput": 2309.09, "total_tokens": 15917776} {"current_steps": 27600, "total_steps": 67140, "loss": 0.5319, "lr": 3.665453780758926e-05, "epoch": 4.110813226094727, "percentage": 41.11, "elapsed_time": "1:54:54", "remaining_time": "2:44:37", "throughput": 2309.12, "total_tokens": 15920624} {"current_steps": 27605, "total_steps": 67140, "loss": 0.7171, "lr": 3.6648787958407803e-05, "epoch": 4.111557938635687, "percentage": 41.12, "elapsed_time": "1:54:55", "remaining_time": "2:44:35", "throughput": 2309.16, "total_tokens": 15923536} {"current_steps": 27610, "total_steps": 67140, "loss": 0.7936, "lr": 3.6643037322048624e-05, "epoch": 4.112302651176646, "percentage": 41.12, "elapsed_time": "1:54:56", "remaining_time": "2:44:34", "throughput": 2309.23, "total_tokens": 15926672} {"current_steps": 27615, "total_steps": 67140, "loss": 0.6302, "lr": 3.663728589890032e-05, "epoch": 4.113047363717605, "percentage": 41.13, "elapsed_time": "1:54:58", "remaining_time": "2:44:33", "throughput": 2309.3, "total_tokens": 15929936} {"current_steps": 27620, "total_steps": 67140, "loss": 0.6515, "lr": 3.6631533689351544e-05, "epoch": 4.113792076258564, "percentage": 41.14, "elapsed_time": "1:54:59", "remaining_time": "2:44:31", "throughput": 2309.32, "total_tokens": 15932656} {"current_steps": 27625, "total_steps": 67140, "loss": 0.5501, "lr": 3.6625780693791016e-05, "epoch": 4.114536788799524, "percentage": 41.15, "elapsed_time": "1:55:00", "remaining_time": "2:44:30", "throughput": 2309.36, "total_tokens": 15935568} {"current_steps": 27630, "total_steps": 67140, "loss": 0.5737, "lr": 3.6620026912607497e-05, "epoch": 4.115281501340482, "percentage": 41.15, "elapsed_time": "1:55:01", "remaining_time": "2:44:28", "throughput": 2309.39, "total_tokens": 15938288} {"current_steps": 27635, "total_steps": 67140, "loss": 0.8386, "lr": 3.6614272346189795e-05, "epoch": 4.116026213881442, "percentage": 41.16, "elapsed_time": "1:55:02", "remaining_time": "2:44:27", "throughput": 2309.42, "total_tokens": 15941136} {"current_steps": 27640, "total_steps": 67140, "loss": 0.6243, "lr": 3.660851699492679e-05, "epoch": 4.116770926422401, "percentage": 41.17, "elapsed_time": "1:55:03", "remaining_time": "2:44:26", "throughput": 2309.45, "total_tokens": 15943920} {"current_steps": 27645, "total_steps": 67140, "loss": 0.6188, "lr": 3.660276085920742e-05, "epoch": 4.1175156389633605, "percentage": 41.18, "elapsed_time": "1:55:04", "remaining_time": "2:44:24", "throughput": 2309.48, "total_tokens": 15946736} {"current_steps": 27650, "total_steps": 67140, "loss": 0.4999, "lr": 3.6597003939420623e-05, "epoch": 4.118260351504319, "percentage": 41.18, "elapsed_time": "1:55:06", "remaining_time": "2:44:23", "throughput": 2309.51, "total_tokens": 15949616} {"current_steps": 27655, "total_steps": 67140, "loss": 0.516, "lr": 3.6591246235955456e-05, "epoch": 4.119005064045279, "percentage": 41.19, "elapsed_time": "1:55:07", "remaining_time": "2:44:21", "throughput": 2309.53, "total_tokens": 15952272} {"current_steps": 27660, "total_steps": 67140, "loss": 0.5351, "lr": 3.6585487749200996e-05, "epoch": 4.119749776586238, "percentage": 41.2, "elapsed_time": "1:55:08", "remaining_time": "2:44:20", "throughput": 2309.59, "total_tokens": 15955408} {"current_steps": 27665, "total_steps": 67140, "loss": 0.598, "lr": 3.657972847954638e-05, "epoch": 4.120494489127197, "percentage": 41.2, "elapsed_time": "1:55:09", "remaining_time": "2:44:19", "throughput": 2309.64, "total_tokens": 15958384} {"current_steps": 27670, "total_steps": 67140, "loss": 0.8547, "lr": 3.657396842738079e-05, "epoch": 4.121239201668156, "percentage": 41.21, "elapsed_time": "1:55:10", "remaining_time": "2:44:17", "throughput": 2309.67, "total_tokens": 15961232} {"current_steps": 27675, "total_steps": 67140, "loss": 0.6548, "lr": 3.6568207593093465e-05, "epoch": 4.121983914209116, "percentage": 41.22, "elapsed_time": "1:55:11", "remaining_time": "2:44:16", "throughput": 2309.7, "total_tokens": 15963984} {"current_steps": 27680, "total_steps": 67140, "loss": 0.5088, "lr": 3.656244597707372e-05, "epoch": 4.1227286267500745, "percentage": 41.23, "elapsed_time": "1:55:12", "remaining_time": "2:44:14", "throughput": 2309.73, "total_tokens": 15966800} {"current_steps": 27685, "total_steps": 67140, "loss": 0.5864, "lr": 3.655668357971087e-05, "epoch": 4.123473339291033, "percentage": 41.23, "elapsed_time": "1:55:13", "remaining_time": "2:44:13", "throughput": 2309.74, "total_tokens": 15969392} {"current_steps": 27690, "total_steps": 67140, "loss": 0.6706, "lr": 3.6550920401394335e-05, "epoch": 4.124218051831993, "percentage": 41.24, "elapsed_time": "1:55:15", "remaining_time": "2:44:11", "throughput": 2309.78, "total_tokens": 15972304} {"current_steps": 27695, "total_steps": 67140, "loss": 0.6008, "lr": 3.654515644251356e-05, "epoch": 4.124962764372952, "percentage": 41.25, "elapsed_time": "1:55:16", "remaining_time": "2:44:10", "throughput": 2309.81, "total_tokens": 15975056} {"current_steps": 27700, "total_steps": 67140, "loss": 0.6576, "lr": 3.653939170345805e-05, "epoch": 4.125707476913911, "percentage": 41.26, "elapsed_time": "1:55:17", "remaining_time": "2:44:09", "throughput": 2309.82, "total_tokens": 15977712} {"current_steps": 27705, "total_steps": 67140, "loss": 0.5436, "lr": 3.653362618461737e-05, "epoch": 4.12645218945487, "percentage": 41.26, "elapsed_time": "1:55:18", "remaining_time": "2:44:07", "throughput": 2309.85, "total_tokens": 15980432} {"current_steps": 27710, "total_steps": 67140, "loss": 0.4474, "lr": 3.652785988638112e-05, "epoch": 4.12719690199583, "percentage": 41.27, "elapsed_time": "1:55:19", "remaining_time": "2:44:06", "throughput": 2309.87, "total_tokens": 15983152} {"current_steps": 27715, "total_steps": 67140, "loss": 0.7052, "lr": 3.6522092809138975e-05, "epoch": 4.127941614536788, "percentage": 41.28, "elapsed_time": "1:55:20", "remaining_time": "2:44:04", "throughput": 2309.88, "total_tokens": 15985744} {"current_steps": 27720, "total_steps": 67140, "loss": 0.5862, "lr": 3.651632495328064e-05, "epoch": 4.128686327077748, "percentage": 41.29, "elapsed_time": "1:55:21", "remaining_time": "2:44:03", "throughput": 2309.9, "total_tokens": 15988464} {"current_steps": 27725, "total_steps": 67140, "loss": 0.5336, "lr": 3.6510556319195884e-05, "epoch": 4.129431039618707, "percentage": 41.29, "elapsed_time": "1:55:22", "remaining_time": "2:44:01", "throughput": 2309.94, "total_tokens": 15991344} {"current_steps": 27730, "total_steps": 67140, "loss": 0.7367, "lr": 3.650478690727454e-05, "epoch": 4.1301757521596665, "percentage": 41.3, "elapsed_time": "1:55:23", "remaining_time": "2:44:00", "throughput": 2309.95, "total_tokens": 15993968} {"current_steps": 27735, "total_steps": 67140, "loss": 0.5243, "lr": 3.6499016717906455e-05, "epoch": 4.130920464700625, "percentage": 41.31, "elapsed_time": "1:55:25", "remaining_time": "2:43:58", "throughput": 2309.99, "total_tokens": 15996848} {"current_steps": 27740, "total_steps": 67140, "loss": 0.6197, "lr": 3.6493245751481574e-05, "epoch": 4.131665177241585, "percentage": 41.32, "elapsed_time": "1:55:26", "remaining_time": "2:43:57", "throughput": 2310.03, "total_tokens": 15999856} {"current_steps": 27745, "total_steps": 67140, "loss": 0.5733, "lr": 3.648747400838989e-05, "epoch": 4.132409889782544, "percentage": 41.32, "elapsed_time": "1:55:27", "remaining_time": "2:43:56", "throughput": 2310.07, "total_tokens": 16002768} {"current_steps": 27750, "total_steps": 67140, "loss": 0.5877, "lr": 3.6481701489021404e-05, "epoch": 4.133154602323503, "percentage": 41.33, "elapsed_time": "1:55:28", "remaining_time": "2:43:54", "throughput": 2310.11, "total_tokens": 16005552} {"current_steps": 27755, "total_steps": 67140, "loss": 0.5128, "lr": 3.647592819376621e-05, "epoch": 4.133899314864462, "percentage": 41.34, "elapsed_time": "1:55:29", "remaining_time": "2:43:53", "throughput": 2310.14, "total_tokens": 16008464} {"current_steps": 27760, "total_steps": 67140, "loss": 0.5053, "lr": 3.6470154123014455e-05, "epoch": 4.134644027405422, "percentage": 41.35, "elapsed_time": "1:55:30", "remaining_time": "2:43:51", "throughput": 2310.17, "total_tokens": 16011184} {"current_steps": 27765, "total_steps": 67140, "loss": 0.3726, "lr": 3.646437927715632e-05, "epoch": 4.1353887399463805, "percentage": 41.35, "elapsed_time": "1:55:31", "remaining_time": "2:43:50", "throughput": 2310.18, "total_tokens": 16013872} {"current_steps": 27770, "total_steps": 67140, "loss": 0.5831, "lr": 3.645860365658203e-05, "epoch": 4.13613345248734, "percentage": 41.36, "elapsed_time": "1:55:32", "remaining_time": "2:43:48", "throughput": 2310.21, "total_tokens": 16016560} {"current_steps": 27775, "total_steps": 67140, "loss": 0.3386, "lr": 3.645282726168191e-05, "epoch": 4.136878165028299, "percentage": 41.37, "elapsed_time": "1:55:34", "remaining_time": "2:43:47", "throughput": 2310.26, "total_tokens": 16019568} {"current_steps": 27780, "total_steps": 67140, "loss": 0.5439, "lr": 3.644705009284628e-05, "epoch": 4.1376228775692585, "percentage": 41.38, "elapsed_time": "1:55:35", "remaining_time": "2:43:46", "throughput": 2310.3, "total_tokens": 16022576} {"current_steps": 27785, "total_steps": 67140, "loss": 0.5763, "lr": 3.644127215046555e-05, "epoch": 4.138367590110217, "percentage": 41.38, "elapsed_time": "1:55:36", "remaining_time": "2:43:44", "throughput": 2310.33, "total_tokens": 16025360} {"current_steps": 27790, "total_steps": 67140, "loss": 0.7348, "lr": 3.643549343493015e-05, "epoch": 4.139112302651177, "percentage": 41.39, "elapsed_time": "1:55:37", "remaining_time": "2:43:43", "throughput": 2310.36, "total_tokens": 16028240} {"current_steps": 27795, "total_steps": 67140, "loss": 0.6832, "lr": 3.642971394663061e-05, "epoch": 4.139857015192136, "percentage": 41.4, "elapsed_time": "1:55:38", "remaining_time": "2:43:42", "throughput": 2310.42, "total_tokens": 16031408} {"current_steps": 27800, "total_steps": 67140, "loss": 0.7401, "lr": 3.642393368595747e-05, "epoch": 4.140601727733095, "percentage": 41.41, "elapsed_time": "1:55:39", "remaining_time": "2:43:40", "throughput": 2310.45, "total_tokens": 16034192} {"current_steps": 27805, "total_steps": 67140, "loss": 0.741, "lr": 3.641815265330133e-05, "epoch": 4.141346440274054, "percentage": 41.41, "elapsed_time": "1:55:40", "remaining_time": "2:43:39", "throughput": 2310.47, "total_tokens": 16036880} {"current_steps": 27810, "total_steps": 67140, "loss": 0.7912, "lr": 3.6412370849052865e-05, "epoch": 4.142091152815014, "percentage": 41.42, "elapsed_time": "1:55:42", "remaining_time": "2:43:37", "throughput": 2310.5, "total_tokens": 16039728} {"current_steps": 27815, "total_steps": 67140, "loss": 0.5217, "lr": 3.6406588273602774e-05, "epoch": 4.1428358653559725, "percentage": 41.43, "elapsed_time": "1:55:43", "remaining_time": "2:43:36", "throughput": 2310.53, "total_tokens": 16042512} {"current_steps": 27820, "total_steps": 67140, "loss": 0.8122, "lr": 3.640080492734182e-05, "epoch": 4.143580577896932, "percentage": 41.44, "elapsed_time": "1:55:44", "remaining_time": "2:43:34", "throughput": 2310.57, "total_tokens": 16045424} {"current_steps": 27825, "total_steps": 67140, "loss": 0.6432, "lr": 3.639502081066083e-05, "epoch": 4.144325290437891, "percentage": 41.44, "elapsed_time": "1:55:45", "remaining_time": "2:43:33", "throughput": 2310.59, "total_tokens": 16048112} {"current_steps": 27830, "total_steps": 67140, "loss": 0.6842, "lr": 3.638923592395066e-05, "epoch": 4.1450700029788505, "percentage": 41.45, "elapsed_time": "1:55:46", "remaining_time": "2:43:32", "throughput": 2310.62, "total_tokens": 16050960} {"current_steps": 27835, "total_steps": 67140, "loss": 0.5389, "lr": 3.638345026760222e-05, "epoch": 4.145814715519809, "percentage": 41.46, "elapsed_time": "1:55:47", "remaining_time": "2:43:30", "throughput": 2310.67, "total_tokens": 16053936} {"current_steps": 27840, "total_steps": 67140, "loss": 0.9386, "lr": 3.63776638420065e-05, "epoch": 4.146559428060769, "percentage": 41.47, "elapsed_time": "1:55:48", "remaining_time": "2:43:29", "throughput": 2310.68, "total_tokens": 16056528} {"current_steps": 27845, "total_steps": 67140, "loss": 0.6632, "lr": 3.6371876647554524e-05, "epoch": 4.147304140601728, "percentage": 41.47, "elapsed_time": "1:55:49", "remaining_time": "2:43:27", "throughput": 2310.72, "total_tokens": 16059408} {"current_steps": 27850, "total_steps": 67140, "loss": 0.5477, "lr": 3.636608868463735e-05, "epoch": 4.148048853142687, "percentage": 41.48, "elapsed_time": "1:55:51", "remaining_time": "2:43:26", "throughput": 2310.76, "total_tokens": 16062288} {"current_steps": 27855, "total_steps": 67140, "loss": 0.6131, "lr": 3.636029995364611e-05, "epoch": 4.148793565683646, "percentage": 41.49, "elapsed_time": "1:55:52", "remaining_time": "2:43:25", "throughput": 2310.79, "total_tokens": 16065200} {"current_steps": 27860, "total_steps": 67140, "loss": 0.6142, "lr": 3.6354510454972e-05, "epoch": 4.149538278224606, "percentage": 41.5, "elapsed_time": "1:55:53", "remaining_time": "2:43:23", "throughput": 2310.84, "total_tokens": 16068240} {"current_steps": 27865, "total_steps": 67140, "loss": 0.5786, "lr": 3.634872018900623e-05, "epoch": 4.1502829907655645, "percentage": 41.5, "elapsed_time": "1:55:54", "remaining_time": "2:43:22", "throughput": 2310.87, "total_tokens": 16071024} {"current_steps": 27870, "total_steps": 67140, "loss": 0.6189, "lr": 3.634292915614009e-05, "epoch": 4.151027703306523, "percentage": 41.51, "elapsed_time": "1:55:55", "remaining_time": "2:43:20", "throughput": 2310.91, "total_tokens": 16073936} {"current_steps": 27875, "total_steps": 67140, "loss": 0.5558, "lr": 3.633713735676491e-05, "epoch": 4.151772415847483, "percentage": 41.52, "elapsed_time": "1:55:56", "remaining_time": "2:43:19", "throughput": 2310.95, "total_tokens": 16076816} {"current_steps": 27880, "total_steps": 67140, "loss": 0.6326, "lr": 3.6331344791272087e-05, "epoch": 4.152517128388442, "percentage": 41.53, "elapsed_time": "1:55:57", "remaining_time": "2:43:18", "throughput": 2310.98, "total_tokens": 16079696} {"current_steps": 27885, "total_steps": 67140, "loss": 0.5919, "lr": 3.632555146005305e-05, "epoch": 4.153261840929401, "percentage": 41.53, "elapsed_time": "1:55:59", "remaining_time": "2:43:16", "throughput": 2311.05, "total_tokens": 16082928} {"current_steps": 27890, "total_steps": 67140, "loss": 0.9987, "lr": 3.63197573634993e-05, "epoch": 4.15400655347036, "percentage": 41.54, "elapsed_time": "1:56:00", "remaining_time": "2:43:15", "throughput": 2311.1, "total_tokens": 16085936} {"current_steps": 27895, "total_steps": 67140, "loss": 0.5336, "lr": 3.6313962502002365e-05, "epoch": 4.15475126601132, "percentage": 41.55, "elapsed_time": "1:56:01", "remaining_time": "2:43:13", "throughput": 2311.15, "total_tokens": 16088944} {"current_steps": 27900, "total_steps": 67140, "loss": 0.8162, "lr": 3.6308166875953836e-05, "epoch": 4.1554959785522785, "percentage": 41.55, "elapsed_time": "1:56:02", "remaining_time": "2:43:12", "throughput": 2311.2, "total_tokens": 16091984} {"current_steps": 27905, "total_steps": 67140, "loss": 0.525, "lr": 3.630237048574537e-05, "epoch": 4.156240691093238, "percentage": 41.56, "elapsed_time": "1:56:03", "remaining_time": "2:43:11", "throughput": 2311.25, "total_tokens": 16095056} {"current_steps": 27910, "total_steps": 67140, "loss": 0.6546, "lr": 3.6296573331768664e-05, "epoch": 4.156985403634197, "percentage": 41.57, "elapsed_time": "1:56:04", "remaining_time": "2:43:09", "throughput": 2311.27, "total_tokens": 16097840} {"current_steps": 27915, "total_steps": 67140, "loss": 0.6558, "lr": 3.629077541441546e-05, "epoch": 4.1577301161751565, "percentage": 41.58, "elapsed_time": "1:56:06", "remaining_time": "2:43:08", "throughput": 2311.29, "total_tokens": 16100528} {"current_steps": 27920, "total_steps": 67140, "loss": 0.7294, "lr": 3.628497673407755e-05, "epoch": 4.158474828716115, "percentage": 41.58, "elapsed_time": "1:56:07", "remaining_time": "2:43:06", "throughput": 2311.32, "total_tokens": 16103344} {"current_steps": 27925, "total_steps": 67140, "loss": 0.667, "lr": 3.62791772911468e-05, "epoch": 4.159219541257075, "percentage": 41.59, "elapsed_time": "1:56:08", "remaining_time": "2:43:05", "throughput": 2311.34, "total_tokens": 16106064} {"current_steps": 27930, "total_steps": 67140, "loss": 0.3914, "lr": 3.6273377086015106e-05, "epoch": 4.159964253798034, "percentage": 41.6, "elapsed_time": "1:56:09", "remaining_time": "2:43:04", "throughput": 2311.36, "total_tokens": 16108752} {"current_steps": 27935, "total_steps": 67140, "loss": 0.8011, "lr": 3.626757611907442e-05, "epoch": 4.160708966338993, "percentage": 41.61, "elapsed_time": "1:56:10", "remaining_time": "2:43:02", "throughput": 2311.38, "total_tokens": 16111408} {"current_steps": 27940, "total_steps": 67140, "loss": 0.6567, "lr": 3.6261774390716744e-05, "epoch": 4.161453678879952, "percentage": 41.61, "elapsed_time": "1:56:11", "remaining_time": "2:43:01", "throughput": 2311.42, "total_tokens": 16114384} {"current_steps": 27945, "total_steps": 67140, "loss": 0.7704, "lr": 3.625597190133416e-05, "epoch": 4.162198391420912, "percentage": 41.62, "elapsed_time": "1:56:12", "remaining_time": "2:42:59", "throughput": 2311.46, "total_tokens": 16117328} {"current_steps": 27950, "total_steps": 67140, "loss": 0.6454, "lr": 3.625016865131875e-05, "epoch": 4.1629431039618705, "percentage": 41.63, "elapsed_time": "1:56:13", "remaining_time": "2:42:58", "throughput": 2311.52, "total_tokens": 16120336} {"current_steps": 27955, "total_steps": 67140, "loss": 0.5859, "lr": 3.624436464106267e-05, "epoch": 4.16368781650283, "percentage": 41.64, "elapsed_time": "1:56:15", "remaining_time": "2:42:57", "throughput": 2311.54, "total_tokens": 16123120} {"current_steps": 27960, "total_steps": 67140, "loss": 0.5834, "lr": 3.623855987095816e-05, "epoch": 4.164432529043789, "percentage": 41.64, "elapsed_time": "1:56:16", "remaining_time": "2:42:55", "throughput": 2311.58, "total_tokens": 16126000} {"current_steps": 27965, "total_steps": 67140, "loss": 0.5986, "lr": 3.623275434139746e-05, "epoch": 4.165177241584749, "percentage": 41.65, "elapsed_time": "1:56:17", "remaining_time": "2:42:54", "throughput": 2311.64, "total_tokens": 16129072} {"current_steps": 27970, "total_steps": 67140, "loss": 0.5437, "lr": 3.622694805277289e-05, "epoch": 4.165921954125707, "percentage": 41.66, "elapsed_time": "1:56:18", "remaining_time": "2:42:52", "throughput": 2311.65, "total_tokens": 16131632} {"current_steps": 27975, "total_steps": 67140, "loss": 0.4689, "lr": 3.6221141005476824e-05, "epoch": 4.166666666666667, "percentage": 41.67, "elapsed_time": "1:56:19", "remaining_time": "2:42:51", "throughput": 2311.71, "total_tokens": 16134768} {"current_steps": 27980, "total_steps": 67140, "loss": 0.5122, "lr": 3.6215333199901655e-05, "epoch": 4.167411379207626, "percentage": 41.67, "elapsed_time": "1:56:20", "remaining_time": "2:42:50", "throughput": 2311.75, "total_tokens": 16137712} {"current_steps": 27985, "total_steps": 67140, "loss": 0.6037, "lr": 3.620952463643989e-05, "epoch": 4.168156091748585, "percentage": 41.68, "elapsed_time": "1:56:21", "remaining_time": "2:42:48", "throughput": 2311.78, "total_tokens": 16140560} {"current_steps": 27990, "total_steps": 67140, "loss": 0.6727, "lr": 3.6203715315484e-05, "epoch": 4.168900804289544, "percentage": 41.69, "elapsed_time": "1:56:23", "remaining_time": "2:42:47", "throughput": 2311.86, "total_tokens": 16143856} {"current_steps": 27995, "total_steps": 67140, "loss": 0.6175, "lr": 3.6197905237426596e-05, "epoch": 4.169645516830504, "percentage": 41.7, "elapsed_time": "1:56:24", "remaining_time": "2:42:45", "throughput": 2311.89, "total_tokens": 16146640} {"current_steps": 28000, "total_steps": 67140, "loss": 0.8422, "lr": 3.619209440266027e-05, "epoch": 4.1703902293714625, "percentage": 41.7, "elapsed_time": "1:56:25", "remaining_time": "2:42:44", "throughput": 2311.94, "total_tokens": 16149712} {"current_steps": 28005, "total_steps": 67140, "loss": 0.7279, "lr": 3.618628281157772e-05, "epoch": 4.171134941912422, "percentage": 41.71, "elapsed_time": "1:56:26", "remaining_time": "2:42:43", "throughput": 2311.96, "total_tokens": 16152400} {"current_steps": 28010, "total_steps": 67140, "loss": 0.4674, "lr": 3.618047046457166e-05, "epoch": 4.171879654453381, "percentage": 41.72, "elapsed_time": "1:56:27", "remaining_time": "2:42:41", "throughput": 2312.02, "total_tokens": 16155536} {"current_steps": 28015, "total_steps": 67140, "loss": 0.8408, "lr": 3.617465736203485e-05, "epoch": 4.172624366994341, "percentage": 41.73, "elapsed_time": "1:56:28", "remaining_time": "2:42:40", "throughput": 2312.06, "total_tokens": 16158480} {"current_steps": 28020, "total_steps": 67140, "loss": 0.7595, "lr": 3.616884350436013e-05, "epoch": 4.173369079535299, "percentage": 41.73, "elapsed_time": "1:56:29", "remaining_time": "2:42:38", "throughput": 2312.09, "total_tokens": 16161296} {"current_steps": 28025, "total_steps": 67140, "loss": 0.5679, "lr": 3.616302889194039e-05, "epoch": 4.174113792076259, "percentage": 41.74, "elapsed_time": "1:56:31", "remaining_time": "2:42:37", "throughput": 2312.15, "total_tokens": 16164400} {"current_steps": 28030, "total_steps": 67140, "loss": 0.7642, "lr": 3.6157213525168534e-05, "epoch": 4.174858504617218, "percentage": 41.75, "elapsed_time": "1:56:32", "remaining_time": "2:42:36", "throughput": 2312.2, "total_tokens": 16167408} {"current_steps": 28035, "total_steps": 67140, "loss": 0.6871, "lr": 3.6151397404437544e-05, "epoch": 4.1756032171581765, "percentage": 41.76, "elapsed_time": "1:56:33", "remaining_time": "2:42:34", "throughput": 2312.21, "total_tokens": 16170032} {"current_steps": 28040, "total_steps": 67140, "loss": 0.8523, "lr": 3.614558053014045e-05, "epoch": 4.176347929699136, "percentage": 41.76, "elapsed_time": "1:56:34", "remaining_time": "2:42:33", "throughput": 2312.22, "total_tokens": 16172624} {"current_steps": 28045, "total_steps": 67140, "loss": 0.9506, "lr": 3.613976290267036e-05, "epoch": 4.177092642240095, "percentage": 41.77, "elapsed_time": "1:56:35", "remaining_time": "2:42:31", "throughput": 2312.23, "total_tokens": 16175184} {"current_steps": 28050, "total_steps": 67140, "loss": 0.6745, "lr": 3.6133944522420374e-05, "epoch": 4.177837354781055, "percentage": 41.78, "elapsed_time": "1:56:36", "remaining_time": "2:42:30", "throughput": 2312.28, "total_tokens": 16178224} {"current_steps": 28055, "total_steps": 67140, "loss": 0.6909, "lr": 3.612812538978368e-05, "epoch": 4.178582067322013, "percentage": 41.79, "elapsed_time": "1:56:37", "remaining_time": "2:42:29", "throughput": 2312.35, "total_tokens": 16181456} {"current_steps": 28060, "total_steps": 67140, "loss": 0.7617, "lr": 3.612230550515352e-05, "epoch": 4.179326779862973, "percentage": 41.79, "elapsed_time": "1:56:38", "remaining_time": "2:42:27", "throughput": 2312.36, "total_tokens": 16184112} {"current_steps": 28065, "total_steps": 67140, "loss": 0.7174, "lr": 3.6116484868923174e-05, "epoch": 4.180071492403932, "percentage": 41.8, "elapsed_time": "1:56:40", "remaining_time": "2:42:26", "throughput": 2312.42, "total_tokens": 16187152} {"current_steps": 28070, "total_steps": 67140, "loss": 0.6634, "lr": 3.611066348148597e-05, "epoch": 4.180816204944891, "percentage": 41.81, "elapsed_time": "1:56:41", "remaining_time": "2:42:24", "throughput": 2312.47, "total_tokens": 16190288} {"current_steps": 28075, "total_steps": 67140, "loss": 0.7325, "lr": 3.6104841343235313e-05, "epoch": 4.18156091748585, "percentage": 41.82, "elapsed_time": "1:56:42", "remaining_time": "2:42:23", "throughput": 2312.49, "total_tokens": 16193008} {"current_steps": 28080, "total_steps": 67140, "loss": 0.5391, "lr": 3.609901845456462e-05, "epoch": 4.18230563002681, "percentage": 41.82, "elapsed_time": "1:56:43", "remaining_time": "2:42:22", "throughput": 2312.55, "total_tokens": 16196112} {"current_steps": 28085, "total_steps": 67140, "loss": 0.7133, "lr": 3.6093194815867385e-05, "epoch": 4.1830503425677685, "percentage": 41.83, "elapsed_time": "1:56:44", "remaining_time": "2:42:20", "throughput": 2312.62, "total_tokens": 16199344} {"current_steps": 28090, "total_steps": 67140, "loss": 0.5684, "lr": 3.608737042753715e-05, "epoch": 4.183795055108728, "percentage": 41.84, "elapsed_time": "1:56:45", "remaining_time": "2:42:19", "throughput": 2312.66, "total_tokens": 16202320} {"current_steps": 28095, "total_steps": 67140, "loss": 0.638, "lr": 3.608154528996749e-05, "epoch": 4.184539767649687, "percentage": 41.85, "elapsed_time": "1:56:47", "remaining_time": "2:42:18", "throughput": 2312.73, "total_tokens": 16205488} {"current_steps": 28100, "total_steps": 67140, "loss": 0.6011, "lr": 3.607571940355206e-05, "epoch": 4.185284480190647, "percentage": 41.85, "elapsed_time": "1:56:48", "remaining_time": "2:42:16", "throughput": 2312.74, "total_tokens": 16208080} {"current_steps": 28105, "total_steps": 67140, "loss": 0.6625, "lr": 3.606989276868455e-05, "epoch": 4.186029192731605, "percentage": 41.86, "elapsed_time": "1:56:49", "remaining_time": "2:42:15", "throughput": 2312.77, "total_tokens": 16210864} {"current_steps": 28110, "total_steps": 67140, "loss": 0.7725, "lr": 3.606406538575868e-05, "epoch": 4.186773905272565, "percentage": 41.87, "elapsed_time": "1:56:50", "remaining_time": "2:42:13", "throughput": 2312.8, "total_tokens": 16213712} {"current_steps": 28115, "total_steps": 67140, "loss": 0.6692, "lr": 3.605823725516826e-05, "epoch": 4.187518617813524, "percentage": 41.88, "elapsed_time": "1:56:51", "remaining_time": "2:42:12", "throughput": 2312.81, "total_tokens": 16216336} {"current_steps": 28120, "total_steps": 67140, "loss": 0.7155, "lr": 3.605240837730713e-05, "epoch": 4.188263330354483, "percentage": 41.88, "elapsed_time": "1:56:52", "remaining_time": "2:42:10", "throughput": 2312.86, "total_tokens": 16219376} {"current_steps": 28125, "total_steps": 67140, "loss": 0.5022, "lr": 3.604657875256918e-05, "epoch": 4.189008042895442, "percentage": 41.89, "elapsed_time": "1:56:53", "remaining_time": "2:42:09", "throughput": 2312.88, "total_tokens": 16222064} {"current_steps": 28130, "total_steps": 67140, "loss": 0.562, "lr": 3.604074838134834e-05, "epoch": 4.189752755436402, "percentage": 41.9, "elapsed_time": "1:56:54", "remaining_time": "2:42:08", "throughput": 2312.91, "total_tokens": 16224848} {"current_steps": 28135, "total_steps": 67140, "loss": 0.6031, "lr": 3.603491726403862e-05, "epoch": 4.190497467977361, "percentage": 41.9, "elapsed_time": "1:56:56", "remaining_time": "2:42:06", "throughput": 2312.95, "total_tokens": 16227792} {"current_steps": 28140, "total_steps": 67140, "loss": 0.69, "lr": 3.6029085401034053e-05, "epoch": 4.19124218051832, "percentage": 41.91, "elapsed_time": "1:56:57", "remaining_time": "2:42:05", "throughput": 2312.97, "total_tokens": 16230576} {"current_steps": 28145, "total_steps": 67140, "loss": 0.6048, "lr": 3.602325279272874e-05, "epoch": 4.191986893059279, "percentage": 41.92, "elapsed_time": "1:56:58", "remaining_time": "2:42:03", "throughput": 2312.98, "total_tokens": 16233104} {"current_steps": 28150, "total_steps": 67140, "loss": 0.5604, "lr": 3.6017419439516815e-05, "epoch": 4.192731605600239, "percentage": 41.93, "elapsed_time": "1:56:59", "remaining_time": "2:42:02", "throughput": 2312.99, "total_tokens": 16235760} {"current_steps": 28155, "total_steps": 67140, "loss": 0.6276, "lr": 3.6011585341792477e-05, "epoch": 4.193476318141197, "percentage": 41.93, "elapsed_time": "1:57:00", "remaining_time": "2:42:00", "throughput": 2313.02, "total_tokens": 16238512} {"current_steps": 28160, "total_steps": 67140, "loss": 0.5669, "lr": 3.600575049994997e-05, "epoch": 4.194221030682157, "percentage": 41.94, "elapsed_time": "1:57:01", "remaining_time": "2:41:59", "throughput": 2313.05, "total_tokens": 16241360} {"current_steps": 28165, "total_steps": 67140, "loss": 0.7382, "lr": 3.59999149143836e-05, "epoch": 4.194965743223116, "percentage": 41.95, "elapsed_time": "1:57:02", "remaining_time": "2:41:58", "throughput": 2313.11, "total_tokens": 16244496} {"current_steps": 28170, "total_steps": 67140, "loss": 0.5098, "lr": 3.5994078585487694e-05, "epoch": 4.195710455764075, "percentage": 41.96, "elapsed_time": "1:57:03", "remaining_time": "2:41:56", "throughput": 2313.13, "total_tokens": 16247152} {"current_steps": 28175, "total_steps": 67140, "loss": 0.6704, "lr": 3.5988241513656664e-05, "epoch": 4.196455168305034, "percentage": 41.96, "elapsed_time": "1:57:05", "remaining_time": "2:41:55", "throughput": 2313.16, "total_tokens": 16250064} {"current_steps": 28180, "total_steps": 67140, "loss": 0.6091, "lr": 3.598240369928494e-05, "epoch": 4.197199880845994, "percentage": 41.97, "elapsed_time": "1:57:06", "remaining_time": "2:41:53", "throughput": 2313.2, "total_tokens": 16252880} {"current_steps": 28185, "total_steps": 67140, "loss": 0.6628, "lr": 3.5976565142767025e-05, "epoch": 4.197944593386953, "percentage": 41.98, "elapsed_time": "1:57:07", "remaining_time": "2:41:52", "throughput": 2313.21, "total_tokens": 16255568} {"current_steps": 28190, "total_steps": 67140, "loss": 0.5478, "lr": 3.5970725844497465e-05, "epoch": 4.198689305927912, "percentage": 41.99, "elapsed_time": "1:57:08", "remaining_time": "2:41:51", "throughput": 2313.26, "total_tokens": 16258576} {"current_steps": 28195, "total_steps": 67140, "loss": 0.7375, "lr": 3.596488580487086e-05, "epoch": 4.199434018468871, "percentage": 41.99, "elapsed_time": "1:57:09", "remaining_time": "2:41:49", "throughput": 2313.31, "total_tokens": 16261584} {"current_steps": 28200, "total_steps": 67140, "loss": 0.6227, "lr": 3.595904502428185e-05, "epoch": 4.200178731009831, "percentage": 42.0, "elapsed_time": "1:57:10", "remaining_time": "2:41:48", "throughput": 2313.32, "total_tokens": 16264240} {"current_steps": 28205, "total_steps": 67140, "loss": 0.5593, "lr": 3.595320350312513e-05, "epoch": 4.200923443550789, "percentage": 42.01, "elapsed_time": "1:57:11", "remaining_time": "2:41:46", "throughput": 2313.33, "total_tokens": 16266864} {"current_steps": 28210, "total_steps": 67140, "loss": 0.4733, "lr": 3.594736124179546e-05, "epoch": 4.201668156091749, "percentage": 42.02, "elapsed_time": "1:57:12", "remaining_time": "2:41:45", "throughput": 2313.38, "total_tokens": 16269840} {"current_steps": 28215, "total_steps": 67140, "loss": 0.6797, "lr": 3.594151824068762e-05, "epoch": 4.202412868632708, "percentage": 42.02, "elapsed_time": "1:57:14", "remaining_time": "2:41:44", "throughput": 2313.43, "total_tokens": 16272944} {"current_steps": 28220, "total_steps": 67140, "loss": 0.5871, "lr": 3.593567450019646e-05, "epoch": 4.203157581173667, "percentage": 42.03, "elapsed_time": "1:57:15", "remaining_time": "2:41:42", "throughput": 2313.44, "total_tokens": 16275568} {"current_steps": 28225, "total_steps": 67140, "loss": 0.5865, "lr": 3.592983002071688e-05, "epoch": 4.203902293714626, "percentage": 42.04, "elapsed_time": "1:57:16", "remaining_time": "2:41:41", "throughput": 2313.52, "total_tokens": 16278832} {"current_steps": 28230, "total_steps": 67140, "loss": 0.5326, "lr": 3.5923984802643826e-05, "epoch": 4.204647006255585, "percentage": 42.05, "elapsed_time": "1:57:17", "remaining_time": "2:41:39", "throughput": 2313.55, "total_tokens": 16281648} {"current_steps": 28235, "total_steps": 67140, "loss": 0.6303, "lr": 3.59181388463723e-05, "epoch": 4.205391718796545, "percentage": 42.05, "elapsed_time": "1:57:18", "remaining_time": "2:41:38", "throughput": 2313.58, "total_tokens": 16284464} {"current_steps": 28240, "total_steps": 67140, "loss": 0.4648, "lr": 3.591229215229733e-05, "epoch": 4.206136431337503, "percentage": 42.06, "elapsed_time": "1:57:19", "remaining_time": "2:41:37", "throughput": 2313.61, "total_tokens": 16287280} {"current_steps": 28245, "total_steps": 67140, "loss": 0.8032, "lr": 3.590644472081402e-05, "epoch": 4.206881143878463, "percentage": 42.07, "elapsed_time": "1:57:20", "remaining_time": "2:41:35", "throughput": 2313.65, "total_tokens": 16290160} {"current_steps": 28250, "total_steps": 67140, "loss": 0.6741, "lr": 3.5900596552317526e-05, "epoch": 4.207625856419422, "percentage": 42.08, "elapsed_time": "1:57:22", "remaining_time": "2:41:34", "throughput": 2313.71, "total_tokens": 16293328} {"current_steps": 28255, "total_steps": 67140, "loss": 0.6308, "lr": 3.589474764720303e-05, "epoch": 4.208370568960381, "percentage": 42.08, "elapsed_time": "1:57:23", "remaining_time": "2:41:32", "throughput": 2313.75, "total_tokens": 16296272} {"current_steps": 28260, "total_steps": 67140, "loss": 0.4657, "lr": 3.588889800586579e-05, "epoch": 4.20911528150134, "percentage": 42.09, "elapsed_time": "1:57:24", "remaining_time": "2:41:31", "throughput": 2313.78, "total_tokens": 16299056} {"current_steps": 28265, "total_steps": 67140, "loss": 0.3693, "lr": 3.588304762870108e-05, "epoch": 4.2098599940423, "percentage": 42.1, "elapsed_time": "1:57:25", "remaining_time": "2:41:30", "throughput": 2313.82, "total_tokens": 16301936} {"current_steps": 28270, "total_steps": 67140, "loss": 0.4635, "lr": 3.5877196516104275e-05, "epoch": 4.210604706583259, "percentage": 42.11, "elapsed_time": "1:57:26", "remaining_time": "2:41:28", "throughput": 2313.85, "total_tokens": 16304784} {"current_steps": 28275, "total_steps": 67140, "loss": 0.5644, "lr": 3.5871344668470755e-05, "epoch": 4.211349419124218, "percentage": 42.11, "elapsed_time": "1:57:27", "remaining_time": "2:41:27", "throughput": 2313.91, "total_tokens": 16307920} {"current_steps": 28280, "total_steps": 67140, "loss": 0.5943, "lr": 3.5865492086195945e-05, "epoch": 4.212094131665177, "percentage": 42.12, "elapsed_time": "1:57:28", "remaining_time": "2:41:26", "throughput": 2313.95, "total_tokens": 16310768} {"current_steps": 28285, "total_steps": 67140, "loss": 0.9189, "lr": 3.585963876967536e-05, "epoch": 4.212838844206137, "percentage": 42.13, "elapsed_time": "1:57:30", "remaining_time": "2:41:24", "throughput": 2313.98, "total_tokens": 16313616} {"current_steps": 28290, "total_steps": 67140, "loss": 0.7329, "lr": 3.585378471930455e-05, "epoch": 4.213583556747095, "percentage": 42.14, "elapsed_time": "1:57:31", "remaining_time": "2:41:23", "throughput": 2314.01, "total_tokens": 16316464} {"current_steps": 28295, "total_steps": 67140, "loss": 0.6951, "lr": 3.584792993547908e-05, "epoch": 4.214328269288055, "percentage": 42.14, "elapsed_time": "1:57:32", "remaining_time": "2:41:21", "throughput": 2314.01, "total_tokens": 16318992} {"current_steps": 28300, "total_steps": 67140, "loss": 0.731, "lr": 3.5842074418594625e-05, "epoch": 4.215072981829014, "percentage": 42.15, "elapsed_time": "1:57:33", "remaining_time": "2:41:20", "throughput": 2314.05, "total_tokens": 16321968} {"current_steps": 28305, "total_steps": 67140, "loss": 1.0179, "lr": 3.583621816904686e-05, "epoch": 4.2158176943699734, "percentage": 42.16, "elapsed_time": "1:57:34", "remaining_time": "2:41:19", "throughput": 2314.11, "total_tokens": 16325072} {"current_steps": 28310, "total_steps": 67140, "loss": 0.6792, "lr": 3.583036118723152e-05, "epoch": 4.216562406910932, "percentage": 42.17, "elapsed_time": "1:57:35", "remaining_time": "2:41:17", "throughput": 2314.14, "total_tokens": 16327920} {"current_steps": 28315, "total_steps": 67140, "loss": 0.6001, "lr": 3.5824503473544405e-05, "epoch": 4.217307119451892, "percentage": 42.17, "elapsed_time": "1:57:36", "remaining_time": "2:41:16", "throughput": 2314.18, "total_tokens": 16330864} {"current_steps": 28320, "total_steps": 67140, "loss": 0.6771, "lr": 3.5818645028381356e-05, "epoch": 4.218051831992851, "percentage": 42.18, "elapsed_time": "1:57:37", "remaining_time": "2:41:14", "throughput": 2314.22, "total_tokens": 16333712} {"current_steps": 28325, "total_steps": 67140, "loss": 0.8169, "lr": 3.581278585213826e-05, "epoch": 4.21879654453381, "percentage": 42.19, "elapsed_time": "1:57:39", "remaining_time": "2:41:13", "throughput": 2314.29, "total_tokens": 16337072} {"current_steps": 28330, "total_steps": 67140, "loss": 0.8161, "lr": 3.5806925945211065e-05, "epoch": 4.219541257074769, "percentage": 42.2, "elapsed_time": "1:57:40", "remaining_time": "2:41:12", "throughput": 2314.32, "total_tokens": 16339888} {"current_steps": 28335, "total_steps": 67140, "loss": 0.7823, "lr": 3.580106530799575e-05, "epoch": 4.220285969615729, "percentage": 42.2, "elapsed_time": "1:57:41", "remaining_time": "2:41:10", "throughput": 2314.34, "total_tokens": 16342672} {"current_steps": 28340, "total_steps": 67140, "loss": 0.7066, "lr": 3.579520394088835e-05, "epoch": 4.221030682156687, "percentage": 42.21, "elapsed_time": "1:57:42", "remaining_time": "2:41:09", "throughput": 2314.36, "total_tokens": 16345328} {"current_steps": 28345, "total_steps": 67140, "loss": 0.7133, "lr": 3.578934184428496e-05, "epoch": 4.221775394697647, "percentage": 42.22, "elapsed_time": "1:57:43", "remaining_time": "2:41:07", "throughput": 2314.38, "total_tokens": 16348080} {"current_steps": 28350, "total_steps": 67140, "loss": 0.5823, "lr": 3.578347901858172e-05, "epoch": 4.222520107238606, "percentage": 42.23, "elapsed_time": "1:57:44", "remaining_time": "2:41:06", "throughput": 2314.41, "total_tokens": 16350896} {"current_steps": 28355, "total_steps": 67140, "loss": 0.8069, "lr": 3.57776154641748e-05, "epoch": 4.2232648197795655, "percentage": 42.23, "elapsed_time": "1:57:46", "remaining_time": "2:41:05", "throughput": 2314.48, "total_tokens": 16354160} {"current_steps": 28360, "total_steps": 67140, "loss": 0.5388, "lr": 3.577175118146045e-05, "epoch": 4.224009532320524, "percentage": 42.24, "elapsed_time": "1:57:47", "remaining_time": "2:41:03", "throughput": 2314.51, "total_tokens": 16356976} {"current_steps": 28365, "total_steps": 67140, "loss": 0.5917, "lr": 3.576588617083495e-05, "epoch": 4.224754244861484, "percentage": 42.25, "elapsed_time": "1:57:48", "remaining_time": "2:41:02", "throughput": 2314.55, "total_tokens": 16359888} {"current_steps": 28370, "total_steps": 67140, "loss": 0.658, "lr": 3.576002043269464e-05, "epoch": 4.225498957402443, "percentage": 42.25, "elapsed_time": "1:57:49", "remaining_time": "2:41:00", "throughput": 2314.58, "total_tokens": 16362640} {"current_steps": 28375, "total_steps": 67140, "loss": 0.7291, "lr": 3.575415396743589e-05, "epoch": 4.226243669943402, "percentage": 42.26, "elapsed_time": "1:57:50", "remaining_time": "2:40:59", "throughput": 2314.63, "total_tokens": 16365712} {"current_steps": 28380, "total_steps": 67140, "loss": 0.5281, "lr": 3.574828677545514e-05, "epoch": 4.226988382484361, "percentage": 42.27, "elapsed_time": "1:57:51", "remaining_time": "2:40:58", "throughput": 2314.66, "total_tokens": 16368464} {"current_steps": 28385, "total_steps": 67140, "loss": 0.7878, "lr": 3.574241885714886e-05, "epoch": 4.22773309502532, "percentage": 42.28, "elapsed_time": "1:57:52", "remaining_time": "2:40:56", "throughput": 2314.73, "total_tokens": 16371760} {"current_steps": 28390, "total_steps": 67140, "loss": 0.7883, "lr": 3.57365502129136e-05, "epoch": 4.2284778075662794, "percentage": 42.28, "elapsed_time": "1:57:53", "remaining_time": "2:40:55", "throughput": 2314.76, "total_tokens": 16374544} {"current_steps": 28395, "total_steps": 67140, "loss": 0.5691, "lr": 3.573068084314593e-05, "epoch": 4.229222520107238, "percentage": 42.29, "elapsed_time": "1:57:55", "remaining_time": "2:40:53", "throughput": 2314.78, "total_tokens": 16377264} {"current_steps": 28400, "total_steps": 67140, "loss": 0.7319, "lr": 3.572481074824247e-05, "epoch": 4.229967232648198, "percentage": 42.3, "elapsed_time": "1:57:56", "remaining_time": "2:40:52", "throughput": 2314.82, "total_tokens": 16380208} {"current_steps": 28405, "total_steps": 67140, "loss": 0.4806, "lr": 3.5718939928599904e-05, "epoch": 4.230711945189157, "percentage": 42.31, "elapsed_time": "1:57:57", "remaining_time": "2:40:51", "throughput": 2314.84, "total_tokens": 16382832} {"current_steps": 28410, "total_steps": 67140, "loss": 0.6061, "lr": 3.571306838461496e-05, "epoch": 4.231456657730116, "percentage": 42.31, "elapsed_time": "1:57:58", "remaining_time": "2:40:49", "throughput": 2314.87, "total_tokens": 16385648} {"current_steps": 28415, "total_steps": 67140, "loss": 0.6926, "lr": 3.570719611668441e-05, "epoch": 4.232201370271075, "percentage": 42.32, "elapsed_time": "1:57:59", "remaining_time": "2:40:48", "throughput": 2314.87, "total_tokens": 16388080} {"current_steps": 28420, "total_steps": 67140, "loss": 0.6007, "lr": 3.5701323125205076e-05, "epoch": 4.232946082812035, "percentage": 42.33, "elapsed_time": "1:58:00", "remaining_time": "2:40:46", "throughput": 2314.9, "total_tokens": 16390928} {"current_steps": 28425, "total_steps": 67140, "loss": 0.5403, "lr": 3.569544941057384e-05, "epoch": 4.233690795352993, "percentage": 42.34, "elapsed_time": "1:58:01", "remaining_time": "2:40:45", "throughput": 2314.92, "total_tokens": 16393648} {"current_steps": 28430, "total_steps": 67140, "loss": 0.6513, "lr": 3.568957497318761e-05, "epoch": 4.234435507893953, "percentage": 42.34, "elapsed_time": "1:58:02", "remaining_time": "2:40:43", "throughput": 2314.95, "total_tokens": 16396496} {"current_steps": 28435, "total_steps": 67140, "loss": 0.708, "lr": 3.5683699813443364e-05, "epoch": 4.235180220434912, "percentage": 42.35, "elapsed_time": "1:58:03", "remaining_time": "2:40:42", "throughput": 2314.99, "total_tokens": 16399408} {"current_steps": 28440, "total_steps": 67140, "loss": 0.494, "lr": 3.567782393173813e-05, "epoch": 4.2359249329758715, "percentage": 42.36, "elapsed_time": "1:58:05", "remaining_time": "2:40:41", "throughput": 2315.04, "total_tokens": 16402352} {"current_steps": 28445, "total_steps": 67140, "loss": 0.6471, "lr": 3.567194732846896e-05, "epoch": 4.23666964551683, "percentage": 42.37, "elapsed_time": "1:58:06", "remaining_time": "2:40:39", "throughput": 2315.07, "total_tokens": 16405200} {"current_steps": 28450, "total_steps": 67140, "loss": 0.7112, "lr": 3.566607000403298e-05, "epoch": 4.23741435805779, "percentage": 42.37, "elapsed_time": "1:58:07", "remaining_time": "2:40:38", "throughput": 2315.1, "total_tokens": 16407984} {"current_steps": 28455, "total_steps": 67140, "loss": 0.8348, "lr": 3.5660191958827354e-05, "epoch": 4.238159070598749, "percentage": 42.38, "elapsed_time": "1:58:08", "remaining_time": "2:40:36", "throughput": 2315.13, "total_tokens": 16410768} {"current_steps": 28460, "total_steps": 67140, "loss": 0.5229, "lr": 3.56543131932493e-05, "epoch": 4.238903783139708, "percentage": 42.39, "elapsed_time": "1:58:09", "remaining_time": "2:40:35", "throughput": 2315.15, "total_tokens": 16413456} {"current_steps": 28465, "total_steps": 67140, "loss": 0.6219, "lr": 3.5648433707696074e-05, "epoch": 4.239648495680667, "percentage": 42.4, "elapsed_time": "1:58:10", "remaining_time": "2:40:34", "throughput": 2315.16, "total_tokens": 16416080} {"current_steps": 28470, "total_steps": 67140, "loss": 0.5007, "lr": 3.564255350256499e-05, "epoch": 4.240393208221627, "percentage": 42.4, "elapsed_time": "1:58:11", "remaining_time": "2:40:32", "throughput": 2315.2, "total_tokens": 16418992} {"current_steps": 28475, "total_steps": 67140, "loss": 0.7464, "lr": 3.5636672578253415e-05, "epoch": 4.2411379207625854, "percentage": 42.41, "elapsed_time": "1:58:12", "remaining_time": "2:40:31", "throughput": 2315.25, "total_tokens": 16422032} {"current_steps": 28480, "total_steps": 67140, "loss": 0.6224, "lr": 3.5630790935158754e-05, "epoch": 4.241882633303545, "percentage": 42.42, "elapsed_time": "1:58:14", "remaining_time": "2:40:29", "throughput": 2315.27, "total_tokens": 16424720} {"current_steps": 28485, "total_steps": 67140, "loss": 0.629, "lr": 3.562490857367845e-05, "epoch": 4.242627345844504, "percentage": 42.43, "elapsed_time": "1:58:15", "remaining_time": "2:40:28", "throughput": 2315.28, "total_tokens": 16427376} {"current_steps": 28490, "total_steps": 67140, "loss": 0.5492, "lr": 3.561902549421004e-05, "epoch": 4.2433720583854635, "percentage": 42.43, "elapsed_time": "1:58:16", "remaining_time": "2:40:26", "throughput": 2315.32, "total_tokens": 16430224} {"current_steps": 28495, "total_steps": 67140, "loss": 0.5761, "lr": 3.5613141697151055e-05, "epoch": 4.244116770926422, "percentage": 42.44, "elapsed_time": "1:58:17", "remaining_time": "2:40:25", "throughput": 2315.33, "total_tokens": 16432880} {"current_steps": 28500, "total_steps": 67140, "loss": 0.6048, "lr": 3.5607257182899095e-05, "epoch": 4.244861483467382, "percentage": 42.45, "elapsed_time": "1:58:18", "remaining_time": "2:40:24", "throughput": 2315.37, "total_tokens": 16435728} {"current_steps": 28505, "total_steps": 67140, "loss": 0.6278, "lr": 3.560137195185183e-05, "epoch": 4.245606196008341, "percentage": 42.46, "elapsed_time": "1:58:19", "remaining_time": "2:40:22", "throughput": 2315.39, "total_tokens": 16438448} {"current_steps": 28510, "total_steps": 67140, "loss": 0.703, "lr": 3.559548600440695e-05, "epoch": 4.2463509085493, "percentage": 42.46, "elapsed_time": "1:58:20", "remaining_time": "2:40:21", "throughput": 2315.43, "total_tokens": 16441424} {"current_steps": 28515, "total_steps": 67140, "loss": 0.4895, "lr": 3.5589599340962196e-05, "epoch": 4.247095621090259, "percentage": 42.47, "elapsed_time": "1:58:21", "remaining_time": "2:40:19", "throughput": 2315.46, "total_tokens": 16444240} {"current_steps": 28520, "total_steps": 67140, "loss": 0.5311, "lr": 3.5583711961915375e-05, "epoch": 4.247840333631219, "percentage": 42.48, "elapsed_time": "1:58:23", "remaining_time": "2:40:18", "throughput": 2315.48, "total_tokens": 16447024} {"current_steps": 28525, "total_steps": 67140, "loss": 0.565, "lr": 3.557782386766434e-05, "epoch": 4.2485850461721775, "percentage": 42.49, "elapsed_time": "1:58:24", "remaining_time": "2:40:17", "throughput": 2315.51, "total_tokens": 16449776} {"current_steps": 28530, "total_steps": 67140, "loss": 0.6892, "lr": 3.557193505860696e-05, "epoch": 4.249329758713137, "percentage": 42.49, "elapsed_time": "1:58:25", "remaining_time": "2:40:15", "throughput": 2315.55, "total_tokens": 16452720} {"current_steps": 28535, "total_steps": 67140, "loss": 0.6658, "lr": 3.55660455351412e-05, "epoch": 4.250074471254096, "percentage": 42.5, "elapsed_time": "1:58:26", "remaining_time": "2:40:14", "throughput": 2315.59, "total_tokens": 16455632} {"current_steps": 28540, "total_steps": 67140, "loss": 0.5434, "lr": 3.5560155297665046e-05, "epoch": 4.2508191837950555, "percentage": 42.51, "elapsed_time": "1:58:27", "remaining_time": "2:40:12", "throughput": 2315.64, "total_tokens": 16458608} {"current_steps": 28545, "total_steps": 67140, "loss": 0.7164, "lr": 3.555426434657652e-05, "epoch": 4.251563896336014, "percentage": 42.52, "elapsed_time": "1:58:28", "remaining_time": "2:40:11", "throughput": 2315.66, "total_tokens": 16461360} {"current_steps": 28550, "total_steps": 67140, "loss": 0.7188, "lr": 3.5548372682273726e-05, "epoch": 4.252308608876973, "percentage": 42.52, "elapsed_time": "1:58:29", "remaining_time": "2:40:10", "throughput": 2315.69, "total_tokens": 16464208} {"current_steps": 28555, "total_steps": 67140, "loss": 0.7088, "lr": 3.554248030515479e-05, "epoch": 4.253053321417933, "percentage": 42.53, "elapsed_time": "1:58:30", "remaining_time": "2:40:08", "throughput": 2315.74, "total_tokens": 16467152} {"current_steps": 28560, "total_steps": 67140, "loss": 0.5063, "lr": 3.55365872156179e-05, "epoch": 4.253798033958892, "percentage": 42.54, "elapsed_time": "1:58:32", "remaining_time": "2:40:07", "throughput": 2315.76, "total_tokens": 16469936} {"current_steps": 28565, "total_steps": 67140, "loss": 0.4596, "lr": 3.5530693414061285e-05, "epoch": 4.254542746499851, "percentage": 42.55, "elapsed_time": "1:58:33", "remaining_time": "2:40:05", "throughput": 2315.78, "total_tokens": 16472592} {"current_steps": 28570, "total_steps": 67140, "loss": 0.5653, "lr": 3.5524798900883226e-05, "epoch": 4.25528745904081, "percentage": 42.55, "elapsed_time": "1:58:34", "remaining_time": "2:40:04", "throughput": 2315.82, "total_tokens": 16475600} {"current_steps": 28575, "total_steps": 67140, "loss": 0.6615, "lr": 3.551890367648205e-05, "epoch": 4.2560321715817695, "percentage": 42.56, "elapsed_time": "1:58:35", "remaining_time": "2:40:03", "throughput": 2315.85, "total_tokens": 16478416} {"current_steps": 28580, "total_steps": 67140, "loss": 0.7547, "lr": 3.551300774125611e-05, "epoch": 4.256776884122728, "percentage": 42.57, "elapsed_time": "1:58:36", "remaining_time": "2:40:01", "throughput": 2315.88, "total_tokens": 16481136} {"current_steps": 28585, "total_steps": 67140, "loss": 0.6696, "lr": 3.5507111095603864e-05, "epoch": 4.257521596663688, "percentage": 42.58, "elapsed_time": "1:58:37", "remaining_time": "2:40:00", "throughput": 2315.92, "total_tokens": 16484112} {"current_steps": 28590, "total_steps": 67140, "loss": 0.7417, "lr": 3.550121373992378e-05, "epoch": 4.258266309204647, "percentage": 42.58, "elapsed_time": "1:58:38", "remaining_time": "2:39:58", "throughput": 2315.95, "total_tokens": 16486896} {"current_steps": 28595, "total_steps": 67140, "loss": 0.5161, "lr": 3.5495315674614356e-05, "epoch": 4.259011021745606, "percentage": 42.59, "elapsed_time": "1:58:39", "remaining_time": "2:39:57", "throughput": 2315.97, "total_tokens": 16489552} {"current_steps": 28600, "total_steps": 67140, "loss": 0.5066, "lr": 3.548941690007417e-05, "epoch": 4.259755734286565, "percentage": 42.6, "elapsed_time": "1:58:41", "remaining_time": "2:39:56", "throughput": 2316.02, "total_tokens": 16492560} {"current_steps": 28605, "total_steps": 67140, "loss": 0.6026, "lr": 3.5483517416701836e-05, "epoch": 4.260500446827525, "percentage": 42.61, "elapsed_time": "1:58:42", "remaining_time": "2:39:54", "throughput": 2316.04, "total_tokens": 16495248} {"current_steps": 28610, "total_steps": 67140, "loss": 0.5641, "lr": 3.547761722489602e-05, "epoch": 4.2612451593684835, "percentage": 42.61, "elapsed_time": "1:58:43", "remaining_time": "2:39:53", "throughput": 2316.07, "total_tokens": 16498096} {"current_steps": 28615, "total_steps": 67140, "loss": 0.579, "lr": 3.5471716325055424e-05, "epoch": 4.261989871909443, "percentage": 42.62, "elapsed_time": "1:58:44", "remaining_time": "2:39:51", "throughput": 2316.09, "total_tokens": 16500848} {"current_steps": 28620, "total_steps": 67140, "loss": 0.5711, "lr": 3.5465814717578815e-05, "epoch": 4.262734584450402, "percentage": 42.63, "elapsed_time": "1:58:45", "remaining_time": "2:39:50", "throughput": 2316.15, "total_tokens": 16504016} {"current_steps": 28625, "total_steps": 67140, "loss": 0.7122, "lr": 3.5459912402865006e-05, "epoch": 4.2634792969913615, "percentage": 42.63, "elapsed_time": "1:58:46", "remaining_time": "2:39:49", "throughput": 2316.17, "total_tokens": 16506704} {"current_steps": 28630, "total_steps": 67140, "loss": 0.5391, "lr": 3.545400938131284e-05, "epoch": 4.26422400953232, "percentage": 42.64, "elapsed_time": "1:58:47", "remaining_time": "2:39:47", "throughput": 2316.2, "total_tokens": 16509456} {"current_steps": 28635, "total_steps": 67140, "loss": 0.614, "lr": 3.544810565332122e-05, "epoch": 4.26496872207328, "percentage": 42.65, "elapsed_time": "1:58:48", "remaining_time": "2:39:46", "throughput": 2316.26, "total_tokens": 16512560} {"current_steps": 28640, "total_steps": 67140, "loss": 0.6144, "lr": 3.5442201219289105e-05, "epoch": 4.265713434614239, "percentage": 42.66, "elapsed_time": "1:58:50", "remaining_time": "2:39:44", "throughput": 2316.3, "total_tokens": 16515504} {"current_steps": 28645, "total_steps": 67140, "loss": 0.5335, "lr": 3.543629607961548e-05, "epoch": 4.266458147155198, "percentage": 42.66, "elapsed_time": "1:58:51", "remaining_time": "2:39:43", "throughput": 2316.37, "total_tokens": 16518832} {"current_steps": 28650, "total_steps": 67140, "loss": 0.5337, "lr": 3.5430390234699404e-05, "epoch": 4.267202859696157, "percentage": 42.67, "elapsed_time": "1:58:52", "remaining_time": "2:39:42", "throughput": 2316.39, "total_tokens": 16521552} {"current_steps": 28655, "total_steps": 67140, "loss": 0.6274, "lr": 3.542448368493996e-05, "epoch": 4.267947572237117, "percentage": 42.68, "elapsed_time": "1:58:53", "remaining_time": "2:39:40", "throughput": 2316.44, "total_tokens": 16524560} {"current_steps": 28660, "total_steps": 67140, "loss": 0.6452, "lr": 3.5418576430736285e-05, "epoch": 4.2686922847780755, "percentage": 42.69, "elapsed_time": "1:58:54", "remaining_time": "2:39:39", "throughput": 2316.5, "total_tokens": 16527696} {"current_steps": 28665, "total_steps": 67140, "loss": 0.6301, "lr": 3.5412668472487575e-05, "epoch": 4.269436997319035, "percentage": 42.69, "elapsed_time": "1:58:55", "remaining_time": "2:39:37", "throughput": 2316.54, "total_tokens": 16530512} {"current_steps": 28670, "total_steps": 67140, "loss": 0.4224, "lr": 3.540675981059307e-05, "epoch": 4.270181709859994, "percentage": 42.7, "elapsed_time": "1:58:57", "remaining_time": "2:39:36", "throughput": 2316.57, "total_tokens": 16533392} {"current_steps": 28675, "total_steps": 67140, "loss": 0.6044, "lr": 3.540085044545205e-05, "epoch": 4.2709264224009535, "percentage": 42.71, "elapsed_time": "1:58:58", "remaining_time": "2:39:35", "throughput": 2316.58, "total_tokens": 16535952} {"current_steps": 28680, "total_steps": 67140, "loss": 0.8374, "lr": 3.539494037746384e-05, "epoch": 4.271671134941912, "percentage": 42.72, "elapsed_time": "1:58:59", "remaining_time": "2:39:33", "throughput": 2316.62, "total_tokens": 16538896} {"current_steps": 28685, "total_steps": 67140, "loss": 0.8568, "lr": 3.538902960702781e-05, "epoch": 4.272415847482872, "percentage": 42.72, "elapsed_time": "1:59:00", "remaining_time": "2:39:32", "throughput": 2316.64, "total_tokens": 16541584} {"current_steps": 28690, "total_steps": 67140, "loss": 0.6526, "lr": 3.538311813454342e-05, "epoch": 4.273160560023831, "percentage": 42.73, "elapsed_time": "1:59:01", "remaining_time": "2:39:30", "throughput": 2316.67, "total_tokens": 16544368} {"current_steps": 28695, "total_steps": 67140, "loss": 0.4069, "lr": 3.537720596041011e-05, "epoch": 4.27390527256479, "percentage": 42.74, "elapsed_time": "1:59:02", "remaining_time": "2:39:29", "throughput": 2316.7, "total_tokens": 16547216} {"current_steps": 28700, "total_steps": 67140, "loss": 0.6716, "lr": 3.537129308502741e-05, "epoch": 4.274649985105749, "percentage": 42.75, "elapsed_time": "1:59:03", "remaining_time": "2:39:28", "throughput": 2316.76, "total_tokens": 16550384} {"current_steps": 28705, "total_steps": 67140, "loss": 0.5914, "lr": 3.536537950879489e-05, "epoch": 4.275394697646709, "percentage": 42.75, "elapsed_time": "1:59:04", "remaining_time": "2:39:26", "throughput": 2316.78, "total_tokens": 16553072} {"current_steps": 28710, "total_steps": 67140, "loss": 0.5157, "lr": 3.535946523211217e-05, "epoch": 4.2761394101876675, "percentage": 42.76, "elapsed_time": "1:59:05", "remaining_time": "2:39:25", "throughput": 2316.8, "total_tokens": 16555760} {"current_steps": 28715, "total_steps": 67140, "loss": 0.5689, "lr": 3.5353550255378905e-05, "epoch": 4.276884122728626, "percentage": 42.77, "elapsed_time": "1:59:07", "remaining_time": "2:39:23", "throughput": 2316.85, "total_tokens": 16558768} {"current_steps": 28720, "total_steps": 67140, "loss": 0.68, "lr": 3.5347634578994806e-05, "epoch": 4.277628835269586, "percentage": 42.78, "elapsed_time": "1:59:08", "remaining_time": "2:39:22", "throughput": 2316.9, "total_tokens": 16561904} {"current_steps": 28725, "total_steps": 67140, "loss": 0.6896, "lr": 3.534171820335964e-05, "epoch": 4.278373547810546, "percentage": 42.78, "elapsed_time": "1:59:09", "remaining_time": "2:39:21", "throughput": 2316.95, "total_tokens": 16564976} {"current_steps": 28730, "total_steps": 67140, "loss": 0.6227, "lr": 3.53358011288732e-05, "epoch": 4.279118260351504, "percentage": 42.79, "elapsed_time": "1:59:10", "remaining_time": "2:39:19", "throughput": 2316.98, "total_tokens": 16567824} {"current_steps": 28735, "total_steps": 67140, "loss": 0.6094, "lr": 3.532988335593534e-05, "epoch": 4.279862972892463, "percentage": 42.8, "elapsed_time": "1:59:11", "remaining_time": "2:39:18", "throughput": 2316.97, "total_tokens": 16570192} {"current_steps": 28740, "total_steps": 67140, "loss": 0.6469, "lr": 3.532396488494596e-05, "epoch": 4.280607685433423, "percentage": 42.81, "elapsed_time": "1:59:12", "remaining_time": "2:39:16", "throughput": 2317.01, "total_tokens": 16573104} {"current_steps": 28745, "total_steps": 67140, "loss": 0.6326, "lr": 3.531804571630501e-05, "epoch": 4.2813523979743815, "percentage": 42.81, "elapsed_time": "1:59:13", "remaining_time": "2:39:15", "throughput": 2317.06, "total_tokens": 16576144} {"current_steps": 28750, "total_steps": 67140, "loss": 0.5223, "lr": 3.531212585041248e-05, "epoch": 4.282097110515341, "percentage": 42.82, "elapsed_time": "1:59:15", "remaining_time": "2:39:14", "throughput": 2317.09, "total_tokens": 16579024} {"current_steps": 28755, "total_steps": 67140, "loss": 0.9139, "lr": 3.530620528766841e-05, "epoch": 4.2828418230563, "percentage": 42.83, "elapsed_time": "1:59:16", "remaining_time": "2:39:12", "throughput": 2317.12, "total_tokens": 16581904} {"current_steps": 28760, "total_steps": 67140, "loss": 0.5556, "lr": 3.53002840284729e-05, "epoch": 4.2835865355972595, "percentage": 42.84, "elapsed_time": "1:59:17", "remaining_time": "2:39:11", "throughput": 2317.13, "total_tokens": 16584496} {"current_steps": 28765, "total_steps": 67140, "loss": 0.6104, "lr": 3.5294362073226054e-05, "epoch": 4.284331248138218, "percentage": 42.84, "elapsed_time": "1:59:18", "remaining_time": "2:39:10", "throughput": 2317.15, "total_tokens": 16587248} {"current_steps": 28770, "total_steps": 67140, "loss": 0.665, "lr": 3.528843942232809e-05, "epoch": 4.285075960679178, "percentage": 42.85, "elapsed_time": "1:59:19", "remaining_time": "2:39:08", "throughput": 2317.18, "total_tokens": 16590032} {"current_steps": 28775, "total_steps": 67140, "loss": 0.726, "lr": 3.528251607617921e-05, "epoch": 4.285820673220137, "percentage": 42.86, "elapsed_time": "1:59:20", "remaining_time": "2:39:07", "throughput": 2317.2, "total_tokens": 16592752} {"current_steps": 28780, "total_steps": 67140, "loss": 0.645, "lr": 3.52765920351797e-05, "epoch": 4.286565385761096, "percentage": 42.87, "elapsed_time": "1:59:21", "remaining_time": "2:39:05", "throughput": 2317.23, "total_tokens": 16595568} {"current_steps": 28785, "total_steps": 67140, "loss": 0.5456, "lr": 3.5270667299729883e-05, "epoch": 4.287310098302055, "percentage": 42.87, "elapsed_time": "1:59:22", "remaining_time": "2:39:04", "throughput": 2317.25, "total_tokens": 16598320} {"current_steps": 28790, "total_steps": 67140, "loss": 0.7491, "lr": 3.526474187023013e-05, "epoch": 4.288054810843015, "percentage": 42.88, "elapsed_time": "1:59:24", "remaining_time": "2:39:02", "throughput": 2317.27, "total_tokens": 16601072} {"current_steps": 28795, "total_steps": 67140, "loss": 0.6308, "lr": 3.5258815747080853e-05, "epoch": 4.2887995233839735, "percentage": 42.89, "elapsed_time": "1:59:25", "remaining_time": "2:39:01", "throughput": 2317.3, "total_tokens": 16603856} {"current_steps": 28800, "total_steps": 67140, "loss": 0.6408, "lr": 3.5252888930682516e-05, "epoch": 4.289544235924933, "percentage": 42.9, "elapsed_time": "1:59:26", "remaining_time": "2:39:00", "throughput": 2317.34, "total_tokens": 16606832} {"current_steps": 28805, "total_steps": 67140, "loss": 0.7772, "lr": 3.524696142143563e-05, "epoch": 4.290288948465892, "percentage": 42.9, "elapsed_time": "1:59:27", "remaining_time": "2:38:58", "throughput": 2317.41, "total_tokens": 16610032} {"current_steps": 28810, "total_steps": 67140, "loss": 0.6457, "lr": 3.524103321974075e-05, "epoch": 4.291033661006852, "percentage": 42.91, "elapsed_time": "1:59:28", "remaining_time": "2:38:57", "throughput": 2317.43, "total_tokens": 16612784} {"current_steps": 28815, "total_steps": 67140, "loss": 0.7513, "lr": 3.523510432599849e-05, "epoch": 4.29177837354781, "percentage": 42.92, "elapsed_time": "1:59:29", "remaining_time": "2:38:56", "throughput": 2317.46, "total_tokens": 16615600} {"current_steps": 28820, "total_steps": 67140, "loss": 0.5474, "lr": 3.522917474060949e-05, "epoch": 4.29252308608877, "percentage": 42.93, "elapsed_time": "1:59:30", "remaining_time": "2:38:54", "throughput": 2317.5, "total_tokens": 16618544} {"current_steps": 28825, "total_steps": 67140, "loss": 0.6376, "lr": 3.522324446397444e-05, "epoch": 4.293267798629729, "percentage": 42.93, "elapsed_time": "1:59:31", "remaining_time": "2:38:53", "throughput": 2317.53, "total_tokens": 16621296} {"current_steps": 28830, "total_steps": 67140, "loss": 0.6219, "lr": 3.5217313496494096e-05, "epoch": 4.294012511170688, "percentage": 42.94, "elapsed_time": "1:59:33", "remaining_time": "2:38:51", "throughput": 2317.56, "total_tokens": 16624144} {"current_steps": 28835, "total_steps": 67140, "loss": 0.5, "lr": 3.521138183856926e-05, "epoch": 4.294757223711647, "percentage": 42.95, "elapsed_time": "1:59:34", "remaining_time": "2:38:50", "throughput": 2317.61, "total_tokens": 16627216} {"current_steps": 28840, "total_steps": 67140, "loss": 0.6372, "lr": 3.520544949060075e-05, "epoch": 4.295501936252607, "percentage": 42.96, "elapsed_time": "1:59:35", "remaining_time": "2:38:49", "throughput": 2317.65, "total_tokens": 16630160} {"current_steps": 28845, "total_steps": 67140, "loss": 0.5669, "lr": 3.5199516452989444e-05, "epoch": 4.2962466487935655, "percentage": 42.96, "elapsed_time": "1:59:36", "remaining_time": "2:38:47", "throughput": 2317.66, "total_tokens": 16632784} {"current_steps": 28850, "total_steps": 67140, "loss": 0.6625, "lr": 3.51935827261363e-05, "epoch": 4.296991361334525, "percentage": 42.97, "elapsed_time": "1:59:37", "remaining_time": "2:38:46", "throughput": 2317.69, "total_tokens": 16635600} {"current_steps": 28855, "total_steps": 67140, "loss": 0.597, "lr": 3.518764831044228e-05, "epoch": 4.297736073875484, "percentage": 42.98, "elapsed_time": "1:59:38", "remaining_time": "2:38:44", "throughput": 2317.74, "total_tokens": 16638640} {"current_steps": 28860, "total_steps": 67140, "loss": 0.5637, "lr": 3.518171320630839e-05, "epoch": 4.298480786416444, "percentage": 42.98, "elapsed_time": "1:59:39", "remaining_time": "2:38:43", "throughput": 2317.78, "total_tokens": 16641616} {"current_steps": 28865, "total_steps": 67140, "loss": 0.7196, "lr": 3.5175777414135726e-05, "epoch": 4.299225498957402, "percentage": 42.99, "elapsed_time": "1:59:41", "remaining_time": "2:38:42", "throughput": 2317.82, "total_tokens": 16644592} {"current_steps": 28870, "total_steps": 67140, "loss": 0.5855, "lr": 3.5169840934325404e-05, "epoch": 4.299970211498362, "percentage": 43.0, "elapsed_time": "1:59:42", "remaining_time": "2:38:40", "throughput": 2317.87, "total_tokens": 16647536} {"current_steps": 28875, "total_steps": 67140, "loss": 0.6959, "lr": 3.5163903767278573e-05, "epoch": 4.300714924039321, "percentage": 43.01, "elapsed_time": "1:59:43", "remaining_time": "2:38:39", "throughput": 2317.91, "total_tokens": 16650512} {"current_steps": 28880, "total_steps": 67140, "loss": 0.7681, "lr": 3.515796591339644e-05, "epoch": 4.30145963658028, "percentage": 43.01, "elapsed_time": "1:59:44", "remaining_time": "2:38:38", "throughput": 2317.92, "total_tokens": 16653200} {"current_steps": 28885, "total_steps": 67140, "loss": 0.6082, "lr": 3.515202737308028e-05, "epoch": 4.302204349121239, "percentage": 43.02, "elapsed_time": "1:59:45", "remaining_time": "2:38:36", "throughput": 2317.94, "total_tokens": 16655920} {"current_steps": 28890, "total_steps": 67140, "loss": 0.5553, "lr": 3.514608814673139e-05, "epoch": 4.302949061662199, "percentage": 43.03, "elapsed_time": "1:59:46", "remaining_time": "2:38:35", "throughput": 2317.98, "total_tokens": 16658896} {"current_steps": 28895, "total_steps": 67140, "loss": 0.6457, "lr": 3.5140148234751106e-05, "epoch": 4.303693774203158, "percentage": 43.04, "elapsed_time": "1:59:47", "remaining_time": "2:38:33", "throughput": 2318.01, "total_tokens": 16661712} {"current_steps": 28900, "total_steps": 67140, "loss": 0.5143, "lr": 3.513420763754083e-05, "epoch": 4.304438486744116, "percentage": 43.04, "elapsed_time": "1:59:49", "remaining_time": "2:38:32", "throughput": 2318.02, "total_tokens": 16664368} {"current_steps": 28905, "total_steps": 67140, "loss": 0.6092, "lr": 3.512826635550201e-05, "epoch": 4.305183199285076, "percentage": 43.05, "elapsed_time": "1:59:50", "remaining_time": "2:38:31", "throughput": 2318.05, "total_tokens": 16667184} {"current_steps": 28910, "total_steps": 67140, "loss": 0.7055, "lr": 3.512232438903612e-05, "epoch": 4.305927911826035, "percentage": 43.06, "elapsed_time": "1:59:51", "remaining_time": "2:38:29", "throughput": 2318.11, "total_tokens": 16670416} {"current_steps": 28915, "total_steps": 67140, "loss": 0.7282, "lr": 3.511638173854471e-05, "epoch": 4.306672624366994, "percentage": 43.07, "elapsed_time": "1:59:52", "remaining_time": "2:38:28", "throughput": 2318.14, "total_tokens": 16673264} {"current_steps": 28920, "total_steps": 67140, "loss": 0.64, "lr": 3.511043840442936e-05, "epoch": 4.307417336907953, "percentage": 43.07, "elapsed_time": "1:59:53", "remaining_time": "2:38:26", "throughput": 2318.17, "total_tokens": 16676112} {"current_steps": 28925, "total_steps": 67140, "loss": 0.8218, "lr": 3.510449438709167e-05, "epoch": 4.308162049448913, "percentage": 43.08, "elapsed_time": "1:59:54", "remaining_time": "2:38:25", "throughput": 2318.2, "total_tokens": 16678928} {"current_steps": 28930, "total_steps": 67140, "loss": 0.7157, "lr": 3.509854968693334e-05, "epoch": 4.3089067619898715, "percentage": 43.09, "elapsed_time": "1:59:55", "remaining_time": "2:38:24", "throughput": 2318.27, "total_tokens": 16682128} {"current_steps": 28935, "total_steps": 67140, "loss": 0.5904, "lr": 3.509260430435608e-05, "epoch": 4.309651474530831, "percentage": 43.1, "elapsed_time": "1:59:57", "remaining_time": "2:38:22", "throughput": 2318.31, "total_tokens": 16685136} {"current_steps": 28940, "total_steps": 67140, "loss": 0.6497, "lr": 3.5086658239761664e-05, "epoch": 4.31039618707179, "percentage": 43.1, "elapsed_time": "1:59:58", "remaining_time": "2:38:21", "throughput": 2318.35, "total_tokens": 16688016} {"current_steps": 28945, "total_steps": 67140, "loss": 0.6602, "lr": 3.5080711493551876e-05, "epoch": 4.31114089961275, "percentage": 43.11, "elapsed_time": "1:59:59", "remaining_time": "2:38:20", "throughput": 2318.38, "total_tokens": 16690864} {"current_steps": 28950, "total_steps": 67140, "loss": 0.7003, "lr": 3.5074764066128594e-05, "epoch": 4.311885612153708, "percentage": 43.12, "elapsed_time": "2:00:00", "remaining_time": "2:38:18", "throughput": 2318.41, "total_tokens": 16693680} {"current_steps": 28955, "total_steps": 67140, "loss": 0.6294, "lr": 3.506881595789373e-05, "epoch": 4.312630324694668, "percentage": 43.13, "elapsed_time": "2:00:01", "remaining_time": "2:38:17", "throughput": 2318.46, "total_tokens": 16696752} {"current_steps": 28960, "total_steps": 67140, "loss": 0.7671, "lr": 3.506286716924921e-05, "epoch": 4.313375037235627, "percentage": 43.13, "elapsed_time": "2:00:02", "remaining_time": "2:38:15", "throughput": 2318.48, "total_tokens": 16699536} {"current_steps": 28965, "total_steps": 67140, "loss": 0.6091, "lr": 3.505691770059704e-05, "epoch": 4.314119749776586, "percentage": 43.14, "elapsed_time": "2:00:03", "remaining_time": "2:38:14", "throughput": 2318.49, "total_tokens": 16702128} {"current_steps": 28970, "total_steps": 67140, "loss": 0.6802, "lr": 3.5050967552339265e-05, "epoch": 4.314864462317545, "percentage": 43.15, "elapsed_time": "2:00:04", "remaining_time": "2:38:13", "throughput": 2318.51, "total_tokens": 16704816} {"current_steps": 28975, "total_steps": 67140, "loss": 0.661, "lr": 3.5045016724877967e-05, "epoch": 4.315609174858505, "percentage": 43.16, "elapsed_time": "2:00:06", "remaining_time": "2:38:11", "throughput": 2318.53, "total_tokens": 16707568} {"current_steps": 28980, "total_steps": 67140, "loss": 0.6178, "lr": 3.503906521861527e-05, "epoch": 4.316353887399464, "percentage": 43.16, "elapsed_time": "2:00:07", "remaining_time": "2:38:10", "throughput": 2318.59, "total_tokens": 16710800} {"current_steps": 28985, "total_steps": 67140, "loss": 0.4587, "lr": 3.503311303395337e-05, "epoch": 4.317098599940423, "percentage": 43.17, "elapsed_time": "2:00:08", "remaining_time": "2:38:08", "throughput": 2318.61, "total_tokens": 16713456} {"current_steps": 28990, "total_steps": 67140, "loss": 0.5815, "lr": 3.5027160171294476e-05, "epoch": 4.317843312481382, "percentage": 43.18, "elapsed_time": "2:00:09", "remaining_time": "2:38:07", "throughput": 2318.61, "total_tokens": 16715984} {"current_steps": 28995, "total_steps": 67140, "loss": 0.6552, "lr": 3.502120663104087e-05, "epoch": 4.318588025022342, "percentage": 43.19, "elapsed_time": "2:00:10", "remaining_time": "2:38:06", "throughput": 2318.63, "total_tokens": 16718704} {"current_steps": 29000, "total_steps": 67140, "loss": 0.6494, "lr": 3.5015252413594864e-05, "epoch": 4.3193327375633, "percentage": 43.19, "elapsed_time": "2:00:11", "remaining_time": "2:38:04", "throughput": 2318.66, "total_tokens": 16721552} {"current_steps": 29005, "total_steps": 67140, "loss": 0.5516, "lr": 3.5009297519358816e-05, "epoch": 4.32007745010426, "percentage": 43.2, "elapsed_time": "2:00:12", "remaining_time": "2:38:03", "throughput": 2318.68, "total_tokens": 16724304} {"current_steps": 29010, "total_steps": 67140, "loss": 0.6579, "lr": 3.500334194873513e-05, "epoch": 4.320822162645219, "percentage": 43.21, "elapsed_time": "2:00:13", "remaining_time": "2:38:01", "throughput": 2318.72, "total_tokens": 16727248} {"current_steps": 29015, "total_steps": 67140, "loss": 0.5948, "lr": 3.499738570212628e-05, "epoch": 4.321566875186178, "percentage": 43.22, "elapsed_time": "2:00:15", "remaining_time": "2:38:00", "throughput": 2318.75, "total_tokens": 16730000} {"current_steps": 29020, "total_steps": 67140, "loss": 0.7431, "lr": 3.4991428779934746e-05, "epoch": 4.322311587727137, "percentage": 43.22, "elapsed_time": "2:00:16", "remaining_time": "2:37:59", "throughput": 2318.77, "total_tokens": 16732752} {"current_steps": 29025, "total_steps": 67140, "loss": 0.5287, "lr": 3.498547118256307e-05, "epoch": 4.323056300268097, "percentage": 43.23, "elapsed_time": "2:00:17", "remaining_time": "2:37:57", "throughput": 2318.83, "total_tokens": 16735984} {"current_steps": 29030, "total_steps": 67140, "loss": 0.6997, "lr": 3.497951291041386e-05, "epoch": 4.323801012809056, "percentage": 43.24, "elapsed_time": "2:00:18", "remaining_time": "2:37:56", "throughput": 2318.84, "total_tokens": 16738640} {"current_steps": 29035, "total_steps": 67140, "loss": 0.6844, "lr": 3.497355396388974e-05, "epoch": 4.324545725350015, "percentage": 43.25, "elapsed_time": "2:00:19", "remaining_time": "2:37:54", "throughput": 2318.88, "total_tokens": 16741552} {"current_steps": 29040, "total_steps": 67140, "loss": 0.6672, "lr": 3.496759434339338e-05, "epoch": 4.325290437890974, "percentage": 43.25, "elapsed_time": "2:00:20", "remaining_time": "2:37:53", "throughput": 2318.9, "total_tokens": 16744240} {"current_steps": 29045, "total_steps": 67140, "loss": 0.8169, "lr": 3.4961634049327527e-05, "epoch": 4.326035150431934, "percentage": 43.26, "elapsed_time": "2:00:21", "remaining_time": "2:37:52", "throughput": 2318.94, "total_tokens": 16747216} {"current_steps": 29050, "total_steps": 67140, "loss": 0.6759, "lr": 3.495567308209495e-05, "epoch": 4.326779862972892, "percentage": 43.27, "elapsed_time": "2:00:23", "remaining_time": "2:37:50", "throughput": 2318.99, "total_tokens": 16750256} {"current_steps": 29055, "total_steps": 67140, "loss": 0.6039, "lr": 3.4949711442098464e-05, "epoch": 4.327524575513852, "percentage": 43.28, "elapsed_time": "2:00:24", "remaining_time": "2:37:49", "throughput": 2319.02, "total_tokens": 16753072} {"current_steps": 29060, "total_steps": 67140, "loss": 0.7787, "lr": 3.494374912974093e-05, "epoch": 4.328269288054811, "percentage": 43.28, "elapsed_time": "2:00:25", "remaining_time": "2:37:48", "throughput": 2319.07, "total_tokens": 16756144} {"current_steps": 29065, "total_steps": 67140, "loss": 0.7333, "lr": 3.493778614542525e-05, "epoch": 4.32901400059577, "percentage": 43.29, "elapsed_time": "2:00:26", "remaining_time": "2:37:46", "throughput": 2319.15, "total_tokens": 16759440} {"current_steps": 29070, "total_steps": 67140, "loss": 0.5205, "lr": 3.493182248955439e-05, "epoch": 4.329758713136729, "percentage": 43.3, "elapsed_time": "2:00:27", "remaining_time": "2:37:45", "throughput": 2319.18, "total_tokens": 16762320} {"current_steps": 29075, "total_steps": 67140, "loss": 0.6136, "lr": 3.4925858162531354e-05, "epoch": 4.330503425677689, "percentage": 43.31, "elapsed_time": "2:00:28", "remaining_time": "2:37:44", "throughput": 2319.24, "total_tokens": 16765456} {"current_steps": 29080, "total_steps": 67140, "loss": 0.7193, "lr": 3.491989316475917e-05, "epoch": 4.331248138218648, "percentage": 43.31, "elapsed_time": "2:00:29", "remaining_time": "2:37:42", "throughput": 2319.28, "total_tokens": 16768368} {"current_steps": 29085, "total_steps": 67140, "loss": 0.6949, "lr": 3.491392749664094e-05, "epoch": 4.331992850759606, "percentage": 43.32, "elapsed_time": "2:00:31", "remaining_time": "2:37:41", "throughput": 2319.31, "total_tokens": 16771248} {"current_steps": 29090, "total_steps": 67140, "loss": 0.6526, "lr": 3.49079611585798e-05, "epoch": 4.332737563300566, "percentage": 43.33, "elapsed_time": "2:00:32", "remaining_time": "2:37:39", "throughput": 2319.36, "total_tokens": 16774288} {"current_steps": 29095, "total_steps": 67140, "loss": 0.5687, "lr": 3.490199415097892e-05, "epoch": 4.333482275841525, "percentage": 43.33, "elapsed_time": "2:00:33", "remaining_time": "2:37:38", "throughput": 2319.38, "total_tokens": 16777008} {"current_steps": 29100, "total_steps": 67140, "loss": 0.4832, "lr": 3.489602647424154e-05, "epoch": 4.334226988382484, "percentage": 43.34, "elapsed_time": "2:00:34", "remaining_time": "2:37:37", "throughput": 2319.4, "total_tokens": 16779760} {"current_steps": 29105, "total_steps": 67140, "loss": 0.6892, "lr": 3.489005812877093e-05, "epoch": 4.334971700923443, "percentage": 43.35, "elapsed_time": "2:00:35", "remaining_time": "2:37:35", "throughput": 2319.43, "total_tokens": 16782512} {"current_steps": 29110, "total_steps": 67140, "loss": 0.7491, "lr": 3.488408911497039e-05, "epoch": 4.335716413464403, "percentage": 43.36, "elapsed_time": "2:00:36", "remaining_time": "2:37:34", "throughput": 2319.48, "total_tokens": 16785680} {"current_steps": 29115, "total_steps": 67140, "loss": 0.6296, "lr": 3.48781194332433e-05, "epoch": 4.336461126005362, "percentage": 43.36, "elapsed_time": "2:00:37", "remaining_time": "2:37:32", "throughput": 2319.52, "total_tokens": 16788592} {"current_steps": 29120, "total_steps": 67140, "loss": 0.4884, "lr": 3.487214908399306e-05, "epoch": 4.337205838546321, "percentage": 43.37, "elapsed_time": "2:00:39", "remaining_time": "2:37:31", "throughput": 2319.57, "total_tokens": 16791632} {"current_steps": 29125, "total_steps": 67140, "loss": 0.5969, "lr": 3.486617806762312e-05, "epoch": 4.33795055108728, "percentage": 43.38, "elapsed_time": "2:00:40", "remaining_time": "2:37:30", "throughput": 2319.62, "total_tokens": 16794672} {"current_steps": 29130, "total_steps": 67140, "loss": 0.4854, "lr": 3.486020638453698e-05, "epoch": 4.33869526362824, "percentage": 43.39, "elapsed_time": "2:00:41", "remaining_time": "2:37:28", "throughput": 2319.63, "total_tokens": 16797328} {"current_steps": 29135, "total_steps": 67140, "loss": 0.636, "lr": 3.485423403513818e-05, "epoch": 4.339439976169198, "percentage": 43.39, "elapsed_time": "2:00:42", "remaining_time": "2:37:27", "throughput": 2319.65, "total_tokens": 16800048} {"current_steps": 29140, "total_steps": 67140, "loss": 0.6069, "lr": 3.484826101983031e-05, "epoch": 4.340184688710158, "percentage": 43.4, "elapsed_time": "2:00:43", "remaining_time": "2:37:26", "throughput": 2319.68, "total_tokens": 16802832} {"current_steps": 29145, "total_steps": 67140, "loss": 0.4044, "lr": 3.4842287339016997e-05, "epoch": 4.340929401251117, "percentage": 43.41, "elapsed_time": "2:00:44", "remaining_time": "2:37:24", "throughput": 2319.71, "total_tokens": 16805712} {"current_steps": 29150, "total_steps": 67140, "loss": 0.5318, "lr": 3.483631299310193e-05, "epoch": 4.3416741137920765, "percentage": 43.42, "elapsed_time": "2:00:45", "remaining_time": "2:37:23", "throughput": 2319.73, "total_tokens": 16808368} {"current_steps": 29155, "total_steps": 67140, "loss": 0.5924, "lr": 3.483033798248882e-05, "epoch": 4.342418826333035, "percentage": 43.42, "elapsed_time": "2:00:46", "remaining_time": "2:37:21", "throughput": 2319.75, "total_tokens": 16811184} {"current_steps": 29160, "total_steps": 67140, "loss": 0.8635, "lr": 3.4824362307581435e-05, "epoch": 4.343163538873995, "percentage": 43.43, "elapsed_time": "2:00:48", "remaining_time": "2:37:20", "throughput": 2319.79, "total_tokens": 16814032} {"current_steps": 29165, "total_steps": 67140, "loss": 0.8118, "lr": 3.4818385968783584e-05, "epoch": 4.343908251414954, "percentage": 43.44, "elapsed_time": "2:00:49", "remaining_time": "2:37:19", "throughput": 2319.84, "total_tokens": 16817072} {"current_steps": 29170, "total_steps": 67140, "loss": 0.5974, "lr": 3.481240896649913e-05, "epoch": 4.344652963955913, "percentage": 43.45, "elapsed_time": "2:00:50", "remaining_time": "2:37:17", "throughput": 2319.87, "total_tokens": 16819888} {"current_steps": 29175, "total_steps": 67140, "loss": 0.5137, "lr": 3.4806431301131974e-05, "epoch": 4.345397676496872, "percentage": 43.45, "elapsed_time": "2:00:51", "remaining_time": "2:37:16", "throughput": 2319.9, "total_tokens": 16822736} {"current_steps": 29180, "total_steps": 67140, "loss": 0.5444, "lr": 3.480045297308606e-05, "epoch": 4.346142389037832, "percentage": 43.46, "elapsed_time": "2:00:52", "remaining_time": "2:37:14", "throughput": 2319.91, "total_tokens": 16825328} {"current_steps": 29185, "total_steps": 67140, "loss": 0.6467, "lr": 3.479447398276538e-05, "epoch": 4.34688710157879, "percentage": 43.47, "elapsed_time": "2:00:53", "remaining_time": "2:37:13", "throughput": 2319.93, "total_tokens": 16827984} {"current_steps": 29190, "total_steps": 67140, "loss": 0.5113, "lr": 3.4788494330573965e-05, "epoch": 4.34763181411975, "percentage": 43.48, "elapsed_time": "2:00:54", "remaining_time": "2:37:11", "throughput": 2319.93, "total_tokens": 16830512} {"current_steps": 29195, "total_steps": 67140, "loss": 0.6126, "lr": 3.478251401691591e-05, "epoch": 4.348376526660709, "percentage": 43.48, "elapsed_time": "2:00:55", "remaining_time": "2:37:10", "throughput": 2319.99, "total_tokens": 16833648} {"current_steps": 29200, "total_steps": 67140, "loss": 0.6112, "lr": 3.4776533042195324e-05, "epoch": 4.3491212392016685, "percentage": 43.49, "elapsed_time": "2:00:57", "remaining_time": "2:37:09", "throughput": 2320.05, "total_tokens": 16836816} {"current_steps": 29205, "total_steps": 67140, "loss": 0.5232, "lr": 3.477055140681639e-05, "epoch": 4.349865951742627, "percentage": 43.5, "elapsed_time": "2:00:58", "remaining_time": "2:37:07", "throughput": 2320.08, "total_tokens": 16839632} {"current_steps": 29210, "total_steps": 67140, "loss": 0.5103, "lr": 3.4764569111183304e-05, "epoch": 4.350610664283587, "percentage": 43.51, "elapsed_time": "2:00:59", "remaining_time": "2:37:06", "throughput": 2320.11, "total_tokens": 16842512} {"current_steps": 29215, "total_steps": 67140, "loss": 0.4807, "lr": 3.475858615570035e-05, "epoch": 4.351355376824546, "percentage": 43.51, "elapsed_time": "2:01:00", "remaining_time": "2:37:05", "throughput": 2320.13, "total_tokens": 16845200} {"current_steps": 29220, "total_steps": 67140, "loss": 0.6999, "lr": 3.475260254077181e-05, "epoch": 4.352100089365505, "percentage": 43.52, "elapsed_time": "2:01:01", "remaining_time": "2:37:03", "throughput": 2320.16, "total_tokens": 16848016} {"current_steps": 29225, "total_steps": 67140, "loss": 0.6364, "lr": 3.474661826680204e-05, "epoch": 4.352844801906464, "percentage": 43.53, "elapsed_time": "2:01:02", "remaining_time": "2:37:02", "throughput": 2320.19, "total_tokens": 16850800} {"current_steps": 29230, "total_steps": 67140, "loss": 0.701, "lr": 3.474063333419544e-05, "epoch": 4.353589514447424, "percentage": 43.54, "elapsed_time": "2:01:03", "remaining_time": "2:37:00", "throughput": 2320.22, "total_tokens": 16853680} {"current_steps": 29235, "total_steps": 67140, "loss": 0.6618, "lr": 3.473464774335644e-05, "epoch": 4.3543342269883825, "percentage": 43.54, "elapsed_time": "2:01:04", "remaining_time": "2:36:59", "throughput": 2320.26, "total_tokens": 16856560} {"current_steps": 29240, "total_steps": 67140, "loss": 0.7022, "lr": 3.472866149468953e-05, "epoch": 4.355078939529342, "percentage": 43.55, "elapsed_time": "2:01:06", "remaining_time": "2:36:58", "throughput": 2320.29, "total_tokens": 16859440} {"current_steps": 29245, "total_steps": 67140, "loss": 0.6819, "lr": 3.472267458859922e-05, "epoch": 4.355823652070301, "percentage": 43.56, "elapsed_time": "2:01:07", "remaining_time": "2:36:56", "throughput": 2320.31, "total_tokens": 16862288} {"current_steps": 29250, "total_steps": 67140, "loss": 0.8337, "lr": 3.47166870254901e-05, "epoch": 4.35656836461126, "percentage": 43.57, "elapsed_time": "2:01:08", "remaining_time": "2:36:55", "throughput": 2320.34, "total_tokens": 16865008} {"current_steps": 29255, "total_steps": 67140, "loss": 0.5464, "lr": 3.471069880576677e-05, "epoch": 4.357313077152219, "percentage": 43.57, "elapsed_time": "2:01:09", "remaining_time": "2:36:53", "throughput": 2320.38, "total_tokens": 16867920} {"current_steps": 29260, "total_steps": 67140, "loss": 0.5573, "lr": 3.470470992983389e-05, "epoch": 4.358057789693178, "percentage": 43.58, "elapsed_time": "2:01:10", "remaining_time": "2:36:52", "throughput": 2320.41, "total_tokens": 16870736} {"current_steps": 29265, "total_steps": 67140, "loss": 0.7545, "lr": 3.4698720398096176e-05, "epoch": 4.358802502234138, "percentage": 43.59, "elapsed_time": "2:01:11", "remaining_time": "2:36:51", "throughput": 2320.43, "total_tokens": 16873552} {"current_steps": 29270, "total_steps": 67140, "loss": 0.6296, "lr": 3.4692730210958376e-05, "epoch": 4.359547214775096, "percentage": 43.6, "elapsed_time": "2:01:12", "remaining_time": "2:36:49", "throughput": 2320.49, "total_tokens": 16876720} {"current_steps": 29275, "total_steps": 67140, "loss": 0.6846, "lr": 3.468673936882527e-05, "epoch": 4.360291927316056, "percentage": 43.6, "elapsed_time": "2:01:14", "remaining_time": "2:36:48", "throughput": 2320.52, "total_tokens": 16879632} {"current_steps": 29280, "total_steps": 67140, "loss": 0.7177, "lr": 3.46807478721017e-05, "epoch": 4.361036639857015, "percentage": 43.61, "elapsed_time": "2:01:15", "remaining_time": "2:36:47", "throughput": 2320.57, "total_tokens": 16882576} {"current_steps": 29285, "total_steps": 67140, "loss": 0.7512, "lr": 3.4674755721192555e-05, "epoch": 4.3617813523979745, "percentage": 43.62, "elapsed_time": "2:01:16", "remaining_time": "2:36:45", "throughput": 2320.59, "total_tokens": 16885392} {"current_steps": 29290, "total_steps": 67140, "loss": 0.8173, "lr": 3.466876291650274e-05, "epoch": 4.362526064938933, "percentage": 43.63, "elapsed_time": "2:01:17", "remaining_time": "2:36:44", "throughput": 2320.63, "total_tokens": 16888272} {"current_steps": 29295, "total_steps": 67140, "loss": 0.7368, "lr": 3.466276945843725e-05, "epoch": 4.363270777479893, "percentage": 43.63, "elapsed_time": "2:01:18", "remaining_time": "2:36:42", "throughput": 2320.67, "total_tokens": 16891248} {"current_steps": 29300, "total_steps": 67140, "loss": 0.6744, "lr": 3.465677534740107e-05, "epoch": 4.364015490020852, "percentage": 43.64, "elapsed_time": "2:01:19", "remaining_time": "2:36:41", "throughput": 2320.72, "total_tokens": 16894320} {"current_steps": 29305, "total_steps": 67140, "loss": 0.6208, "lr": 3.4650780583799294e-05, "epoch": 4.364760202561811, "percentage": 43.65, "elapsed_time": "2:01:20", "remaining_time": "2:36:40", "throughput": 2320.75, "total_tokens": 16897072} {"current_steps": 29310, "total_steps": 67140, "loss": 0.6064, "lr": 3.464478516803699e-05, "epoch": 4.36550491510277, "percentage": 43.66, "elapsed_time": "2:01:21", "remaining_time": "2:36:38", "throughput": 2320.78, "total_tokens": 16899888} {"current_steps": 29315, "total_steps": 67140, "loss": 0.738, "lr": 3.463878910051932e-05, "epoch": 4.36624962764373, "percentage": 43.66, "elapsed_time": "2:01:23", "remaining_time": "2:36:37", "throughput": 2320.82, "total_tokens": 16902832} {"current_steps": 29320, "total_steps": 67140, "loss": 0.4932, "lr": 3.4632792381651473e-05, "epoch": 4.3669943401846885, "percentage": 43.67, "elapsed_time": "2:01:24", "remaining_time": "2:36:35", "throughput": 2320.83, "total_tokens": 16905456} {"current_steps": 29325, "total_steps": 67140, "loss": 0.6503, "lr": 3.462679501183867e-05, "epoch": 4.367739052725648, "percentage": 43.68, "elapsed_time": "2:01:25", "remaining_time": "2:36:34", "throughput": 2320.87, "total_tokens": 16908400} {"current_steps": 29330, "total_steps": 67140, "loss": 0.6919, "lr": 3.462079699148622e-05, "epoch": 4.368483765266607, "percentage": 43.68, "elapsed_time": "2:01:26", "remaining_time": "2:36:33", "throughput": 2320.9, "total_tokens": 16911248} {"current_steps": 29335, "total_steps": 67140, "loss": 0.5599, "lr": 3.4614798320999406e-05, "epoch": 4.3692284778075665, "percentage": 43.69, "elapsed_time": "2:01:27", "remaining_time": "2:36:31", "throughput": 2320.93, "total_tokens": 16914096} {"current_steps": 29340, "total_steps": 67140, "loss": 0.3906, "lr": 3.4608799000783624e-05, "epoch": 4.369973190348525, "percentage": 43.7, "elapsed_time": "2:01:28", "remaining_time": "2:36:30", "throughput": 2320.97, "total_tokens": 16917008} {"current_steps": 29345, "total_steps": 67140, "loss": 0.5151, "lr": 3.460279903124427e-05, "epoch": 4.370717902889485, "percentage": 43.71, "elapsed_time": "2:01:29", "remaining_time": "2:36:29", "throughput": 2320.99, "total_tokens": 16919728} {"current_steps": 29350, "total_steps": 67140, "loss": 0.4903, "lr": 3.45967984127868e-05, "epoch": 4.371462615430444, "percentage": 43.71, "elapsed_time": "2:01:30", "remaining_time": "2:36:27", "throughput": 2321.02, "total_tokens": 16922544} {"current_steps": 29355, "total_steps": 67140, "loss": 0.6159, "lr": 3.4590797145816714e-05, "epoch": 4.372207327971403, "percentage": 43.72, "elapsed_time": "2:01:32", "remaining_time": "2:36:26", "throughput": 2321.07, "total_tokens": 16925584} {"current_steps": 29360, "total_steps": 67140, "loss": 0.4743, "lr": 3.4584795230739535e-05, "epoch": 4.372952040512362, "percentage": 43.73, "elapsed_time": "2:01:33", "remaining_time": "2:36:24", "throughput": 2321.1, "total_tokens": 16928400} {"current_steps": 29365, "total_steps": 67140, "loss": 0.5749, "lr": 3.457879266796087e-05, "epoch": 4.373696753053322, "percentage": 43.74, "elapsed_time": "2:01:34", "remaining_time": "2:36:23", "throughput": 2321.14, "total_tokens": 16931312} {"current_steps": 29370, "total_steps": 67140, "loss": 0.6479, "lr": 3.457278945788635e-05, "epoch": 4.3744414655942805, "percentage": 43.74, "elapsed_time": "2:01:35", "remaining_time": "2:36:22", "throughput": 2321.17, "total_tokens": 16934160} {"current_steps": 29375, "total_steps": 67140, "loss": 0.6121, "lr": 3.456678560092164e-05, "epoch": 4.37518617813524, "percentage": 43.75, "elapsed_time": "2:01:36", "remaining_time": "2:36:20", "throughput": 2321.21, "total_tokens": 16937136} {"current_steps": 29380, "total_steps": 67140, "loss": 0.6755, "lr": 3.4560781097472436e-05, "epoch": 4.375930890676199, "percentage": 43.76, "elapsed_time": "2:01:37", "remaining_time": "2:36:19", "throughput": 2321.23, "total_tokens": 16939888} {"current_steps": 29385, "total_steps": 67140, "loss": 0.4338, "lr": 3.455477594794454e-05, "epoch": 4.3766756032171585, "percentage": 43.77, "elapsed_time": "2:01:38", "remaining_time": "2:36:17", "throughput": 2321.24, "total_tokens": 16942448} {"current_steps": 29390, "total_steps": 67140, "loss": 0.5165, "lr": 3.454877015274371e-05, "epoch": 4.377420315758117, "percentage": 43.77, "elapsed_time": "2:01:40", "remaining_time": "2:36:16", "throughput": 2321.29, "total_tokens": 16945552} {"current_steps": 29395, "total_steps": 67140, "loss": 0.7034, "lr": 3.4542763712275836e-05, "epoch": 4.378165028299077, "percentage": 43.78, "elapsed_time": "2:01:41", "remaining_time": "2:36:15", "throughput": 2321.32, "total_tokens": 16948400} {"current_steps": 29400, "total_steps": 67140, "loss": 0.7843, "lr": 3.453675662694677e-05, "epoch": 4.378909740840036, "percentage": 43.79, "elapsed_time": "2:01:42", "remaining_time": "2:36:13", "throughput": 2321.37, "total_tokens": 16951376} {"current_steps": 29405, "total_steps": 67140, "loss": 0.5677, "lr": 3.453074889716248e-05, "epoch": 4.379654453380995, "percentage": 43.8, "elapsed_time": "2:01:43", "remaining_time": "2:36:12", "throughput": 2321.4, "total_tokens": 16954288} {"current_steps": 29410, "total_steps": 67140, "loss": 0.6665, "lr": 3.452474052332891e-05, "epoch": 4.380399165921954, "percentage": 43.8, "elapsed_time": "2:01:44", "remaining_time": "2:36:11", "throughput": 2321.43, "total_tokens": 16957136} {"current_steps": 29415, "total_steps": 67140, "loss": 0.6167, "lr": 3.451873150585212e-05, "epoch": 4.381143878462913, "percentage": 43.81, "elapsed_time": "2:01:45", "remaining_time": "2:36:09", "throughput": 2321.48, "total_tokens": 16960208} {"current_steps": 29420, "total_steps": 67140, "loss": 0.7381, "lr": 3.451272184513815e-05, "epoch": 4.3818885910038725, "percentage": 43.82, "elapsed_time": "2:01:46", "remaining_time": "2:36:08", "throughput": 2321.54, "total_tokens": 16963312} {"current_steps": 29425, "total_steps": 67140, "loss": 0.5426, "lr": 3.4506711541593107e-05, "epoch": 4.382633303544832, "percentage": 43.83, "elapsed_time": "2:01:48", "remaining_time": "2:36:06", "throughput": 2321.56, "total_tokens": 16966032} {"current_steps": 29430, "total_steps": 67140, "loss": 0.7846, "lr": 3.450070059562315e-05, "epoch": 4.383378016085791, "percentage": 43.83, "elapsed_time": "2:01:49", "remaining_time": "2:36:05", "throughput": 2321.59, "total_tokens": 16968880} {"current_steps": 29435, "total_steps": 67140, "loss": 0.7626, "lr": 3.449468900763448e-05, "epoch": 4.38412272862675, "percentage": 43.84, "elapsed_time": "2:01:50", "remaining_time": "2:36:04", "throughput": 2321.6, "total_tokens": 16971536} {"current_steps": 29440, "total_steps": 67140, "loss": 0.5185, "lr": 3.448867677803333e-05, "epoch": 4.384867441167709, "percentage": 43.85, "elapsed_time": "2:01:51", "remaining_time": "2:36:02", "throughput": 2321.63, "total_tokens": 16974480} {"current_steps": 29445, "total_steps": 67140, "loss": 0.6385, "lr": 3.4482663907225975e-05, "epoch": 4.385612153708668, "percentage": 43.86, "elapsed_time": "2:01:52", "remaining_time": "2:36:01", "throughput": 2321.69, "total_tokens": 16977584} {"current_steps": 29450, "total_steps": 67140, "loss": 0.7506, "lr": 3.447665039561875e-05, "epoch": 4.386356866249628, "percentage": 43.86, "elapsed_time": "2:01:53", "remaining_time": "2:36:00", "throughput": 2321.73, "total_tokens": 16980592} {"current_steps": 29455, "total_steps": 67140, "loss": 0.6819, "lr": 3.4470636243618026e-05, "epoch": 4.3871015787905865, "percentage": 43.87, "elapsed_time": "2:01:54", "remaining_time": "2:35:58", "throughput": 2321.76, "total_tokens": 16983408} {"current_steps": 29460, "total_steps": 67140, "loss": 0.7028, "lr": 3.44646214516302e-05, "epoch": 4.387846291331546, "percentage": 43.88, "elapsed_time": "2:01:56", "remaining_time": "2:35:57", "throughput": 2321.8, "total_tokens": 16986384} {"current_steps": 29465, "total_steps": 67140, "loss": 0.6029, "lr": 3.4458606020061744e-05, "epoch": 4.388591003872505, "percentage": 43.89, "elapsed_time": "2:01:57", "remaining_time": "2:35:55", "throughput": 2321.83, "total_tokens": 16989200} {"current_steps": 29470, "total_steps": 67140, "loss": 0.4749, "lr": 3.445258994931915e-05, "epoch": 4.3893357164134645, "percentage": 43.89, "elapsed_time": "2:01:58", "remaining_time": "2:35:54", "throughput": 2321.84, "total_tokens": 16991760} {"current_steps": 29475, "total_steps": 67140, "loss": 0.6674, "lr": 3.444657323980895e-05, "epoch": 4.390080428954423, "percentage": 43.9, "elapsed_time": "2:01:59", "remaining_time": "2:35:53", "throughput": 2321.87, "total_tokens": 16994576} {"current_steps": 29480, "total_steps": 67140, "loss": 0.6033, "lr": 3.444055589193774e-05, "epoch": 4.390825141495383, "percentage": 43.91, "elapsed_time": "2:02:00", "remaining_time": "2:35:51", "throughput": 2321.89, "total_tokens": 16997296} {"current_steps": 29485, "total_steps": 67140, "loss": 0.5264, "lr": 3.443453790611215e-05, "epoch": 4.391569854036342, "percentage": 43.92, "elapsed_time": "2:02:01", "remaining_time": "2:35:50", "throughput": 2321.92, "total_tokens": 17000112} {"current_steps": 29490, "total_steps": 67140, "loss": 0.746, "lr": 3.442851928273884e-05, "epoch": 4.392314566577301, "percentage": 43.92, "elapsed_time": "2:02:02", "remaining_time": "2:35:49", "throughput": 2321.98, "total_tokens": 17003280} {"current_steps": 29495, "total_steps": 67140, "loss": 0.6559, "lr": 3.4422500022224536e-05, "epoch": 4.39305927911826, "percentage": 43.93, "elapsed_time": "2:02:03", "remaining_time": "2:35:47", "throughput": 2322.0, "total_tokens": 17006096} {"current_steps": 29500, "total_steps": 67140, "loss": 0.8191, "lr": 3.4416480124975995e-05, "epoch": 4.39380399165922, "percentage": 43.94, "elapsed_time": "2:02:05", "remaining_time": "2:35:46", "throughput": 2322.05, "total_tokens": 17009136} {"current_steps": 29505, "total_steps": 67140, "loss": 0.6571, "lr": 3.44104595914e-05, "epoch": 4.3945487042001785, "percentage": 43.95, "elapsed_time": "2:02:06", "remaining_time": "2:35:44", "throughput": 2322.11, "total_tokens": 17012272} {"current_steps": 29510, "total_steps": 67140, "loss": 0.7353, "lr": 3.440443842190341e-05, "epoch": 4.395293416741138, "percentage": 43.95, "elapsed_time": "2:02:07", "remaining_time": "2:35:43", "throughput": 2322.11, "total_tokens": 17014832} {"current_steps": 29515, "total_steps": 67140, "loss": 0.6134, "lr": 3.439841661689311e-05, "epoch": 4.396038129282097, "percentage": 43.96, "elapsed_time": "2:02:08", "remaining_time": "2:35:42", "throughput": 2322.13, "total_tokens": 17017456} {"current_steps": 29520, "total_steps": 67140, "loss": 0.5911, "lr": 3.439239417677602e-05, "epoch": 4.396782841823057, "percentage": 43.97, "elapsed_time": "2:02:09", "remaining_time": "2:35:40", "throughput": 2322.16, "total_tokens": 17020400} {"current_steps": 29525, "total_steps": 67140, "loss": 0.6878, "lr": 3.4386371101959125e-05, "epoch": 4.397527554364015, "percentage": 43.98, "elapsed_time": "2:02:10", "remaining_time": "2:35:39", "throughput": 2322.19, "total_tokens": 17023248} {"current_steps": 29530, "total_steps": 67140, "loss": 0.6914, "lr": 3.4380347392849424e-05, "epoch": 4.398272266904975, "percentage": 43.98, "elapsed_time": "2:02:11", "remaining_time": "2:35:37", "throughput": 2322.23, "total_tokens": 17026128} {"current_steps": 29535, "total_steps": 67140, "loss": 0.6387, "lr": 3.4374323049854e-05, "epoch": 4.399016979445934, "percentage": 43.99, "elapsed_time": "2:02:12", "remaining_time": "2:35:36", "throughput": 2322.25, "total_tokens": 17028880} {"current_steps": 29540, "total_steps": 67140, "loss": 0.6897, "lr": 3.436829807337992e-05, "epoch": 4.399761691986893, "percentage": 44.0, "elapsed_time": "2:02:14", "remaining_time": "2:35:35", "throughput": 2322.29, "total_tokens": 17031792} {"current_steps": 29545, "total_steps": 67140, "loss": 0.5788, "lr": 3.436227246383435e-05, "epoch": 4.400506404527852, "percentage": 44.01, "elapsed_time": "2:02:15", "remaining_time": "2:35:33", "throughput": 2322.31, "total_tokens": 17034576} {"current_steps": 29550, "total_steps": 67140, "loss": 0.5971, "lr": 3.435624622162448e-05, "epoch": 4.401251117068812, "percentage": 44.01, "elapsed_time": "2:02:16", "remaining_time": "2:35:32", "throughput": 2322.35, "total_tokens": 17037552} {"current_steps": 29555, "total_steps": 67140, "loss": 0.6369, "lr": 3.435021934715752e-05, "epoch": 4.4019958296097705, "percentage": 44.02, "elapsed_time": "2:02:17", "remaining_time": "2:35:31", "throughput": 2322.38, "total_tokens": 17040400} {"current_steps": 29560, "total_steps": 67140, "loss": 0.5033, "lr": 3.4344191840840755e-05, "epoch": 4.40274054215073, "percentage": 44.03, "elapsed_time": "2:02:18", "remaining_time": "2:35:29", "throughput": 2322.4, "total_tokens": 17043120} {"current_steps": 29565, "total_steps": 67140, "loss": 0.6519, "lr": 3.4338163703081495e-05, "epoch": 4.403485254691689, "percentage": 44.03, "elapsed_time": "2:02:19", "remaining_time": "2:35:28", "throughput": 2322.44, "total_tokens": 17046064} {"current_steps": 29570, "total_steps": 67140, "loss": 0.5726, "lr": 3.43321349342871e-05, "epoch": 4.404229967232649, "percentage": 44.04, "elapsed_time": "2:02:20", "remaining_time": "2:35:26", "throughput": 2322.48, "total_tokens": 17048976} {"current_steps": 29575, "total_steps": 67140, "loss": 0.563, "lr": 3.432610553486497e-05, "epoch": 4.404974679773607, "percentage": 44.05, "elapsed_time": "2:02:21", "remaining_time": "2:35:25", "throughput": 2322.49, "total_tokens": 17051600} {"current_steps": 29580, "total_steps": 67140, "loss": 0.7037, "lr": 3.432007550522254e-05, "epoch": 4.405719392314566, "percentage": 44.06, "elapsed_time": "2:02:23", "remaining_time": "2:35:24", "throughput": 2322.53, "total_tokens": 17054512} {"current_steps": 29585, "total_steps": 67140, "loss": 0.6137, "lr": 3.431404484576731e-05, "epoch": 4.406464104855526, "percentage": 44.06, "elapsed_time": "2:02:24", "remaining_time": "2:35:22", "throughput": 2322.54, "total_tokens": 17057168} {"current_steps": 29590, "total_steps": 67140, "loss": 0.6111, "lr": 3.430801355690679e-05, "epoch": 4.407208817396485, "percentage": 44.07, "elapsed_time": "2:02:25", "remaining_time": "2:35:21", "throughput": 2322.57, "total_tokens": 17060016} {"current_steps": 29595, "total_steps": 67140, "loss": 0.6116, "lr": 3.430198163904855e-05, "epoch": 4.407953529937444, "percentage": 44.08, "elapsed_time": "2:02:26", "remaining_time": "2:35:19", "throughput": 2322.59, "total_tokens": 17062736} {"current_steps": 29600, "total_steps": 67140, "loss": 0.712, "lr": 3.429594909260023e-05, "epoch": 4.408698242478403, "percentage": 44.09, "elapsed_time": "2:02:27", "remaining_time": "2:35:18", "throughput": 2322.6, "total_tokens": 17065456} {"current_steps": 29605, "total_steps": 67140, "loss": 0.719, "lr": 3.428991591796944e-05, "epoch": 4.409442955019363, "percentage": 44.09, "elapsed_time": "2:02:28", "remaining_time": "2:35:17", "throughput": 2322.65, "total_tokens": 17068560} {"current_steps": 29610, "total_steps": 67140, "loss": 0.5054, "lr": 3.428388211556391e-05, "epoch": 4.410187667560321, "percentage": 44.1, "elapsed_time": "2:02:29", "remaining_time": "2:35:15", "throughput": 2322.69, "total_tokens": 17071472} {"current_steps": 29615, "total_steps": 67140, "loss": 0.6928, "lr": 3.4277847685791384e-05, "epoch": 4.410932380101281, "percentage": 44.11, "elapsed_time": "2:02:31", "remaining_time": "2:35:14", "throughput": 2322.74, "total_tokens": 17074480} {"current_steps": 29620, "total_steps": 67140, "loss": 0.5924, "lr": 3.427181262905963e-05, "epoch": 4.41167709264224, "percentage": 44.12, "elapsed_time": "2:02:32", "remaining_time": "2:35:13", "throughput": 2322.76, "total_tokens": 17077328} {"current_steps": 29625, "total_steps": 67140, "loss": 0.623, "lr": 3.4265776945776464e-05, "epoch": 4.412421805183199, "percentage": 44.12, "elapsed_time": "2:02:33", "remaining_time": "2:35:11", "throughput": 2322.8, "total_tokens": 17080368} {"current_steps": 29630, "total_steps": 67140, "loss": 0.5262, "lr": 3.425974063634977e-05, "epoch": 4.413166517724158, "percentage": 44.13, "elapsed_time": "2:02:34", "remaining_time": "2:35:10", "throughput": 2322.82, "total_tokens": 17083088} {"current_steps": 29635, "total_steps": 67140, "loss": 0.7615, "lr": 3.4253703701187455e-05, "epoch": 4.413911230265118, "percentage": 44.14, "elapsed_time": "2:02:35", "remaining_time": "2:35:09", "throughput": 2322.87, "total_tokens": 17086160} {"current_steps": 29640, "total_steps": 67140, "loss": 0.6589, "lr": 3.4247666140697466e-05, "epoch": 4.4146559428060765, "percentage": 44.15, "elapsed_time": "2:02:36", "remaining_time": "2:35:07", "throughput": 2322.9, "total_tokens": 17089008} {"current_steps": 29645, "total_steps": 67140, "loss": 0.7997, "lr": 3.424162795528779e-05, "epoch": 4.415400655347036, "percentage": 44.15, "elapsed_time": "2:02:37", "remaining_time": "2:35:06", "throughput": 2322.94, "total_tokens": 17091888} {"current_steps": 29650, "total_steps": 67140, "loss": 0.7523, "lr": 3.423558914536648e-05, "epoch": 4.416145367887995, "percentage": 44.16, "elapsed_time": "2:02:39", "remaining_time": "2:35:04", "throughput": 2322.97, "total_tokens": 17094768} {"current_steps": 29655, "total_steps": 67140, "loss": 0.5216, "lr": 3.42295497113416e-05, "epoch": 4.416890080428955, "percentage": 44.17, "elapsed_time": "2:02:40", "remaining_time": "2:35:03", "throughput": 2323.0, "total_tokens": 17097616} {"current_steps": 29660, "total_steps": 67140, "loss": 0.7173, "lr": 3.4223509653621275e-05, "epoch": 4.417634792969913, "percentage": 44.18, "elapsed_time": "2:02:41", "remaining_time": "2:35:02", "throughput": 2323.03, "total_tokens": 17100432} {"current_steps": 29665, "total_steps": 67140, "loss": 0.6831, "lr": 3.421746897261367e-05, "epoch": 4.418379505510873, "percentage": 44.18, "elapsed_time": "2:02:42", "remaining_time": "2:35:00", "throughput": 2323.05, "total_tokens": 17103248} {"current_steps": 29670, "total_steps": 67140, "loss": 0.5916, "lr": 3.421142766872698e-05, "epoch": 4.419124218051832, "percentage": 44.19, "elapsed_time": "2:02:43", "remaining_time": "2:34:59", "throughput": 2323.1, "total_tokens": 17106256} {"current_steps": 29675, "total_steps": 67140, "loss": 0.4979, "lr": 3.420538574236946e-05, "epoch": 4.419868930592791, "percentage": 44.2, "elapsed_time": "2:02:44", "remaining_time": "2:34:58", "throughput": 2323.13, "total_tokens": 17109168} {"current_steps": 29680, "total_steps": 67140, "loss": 0.5009, "lr": 3.4199343193949404e-05, "epoch": 4.42061364313375, "percentage": 44.21, "elapsed_time": "2:02:45", "remaining_time": "2:34:56", "throughput": 2323.16, "total_tokens": 17112048} {"current_steps": 29685, "total_steps": 67140, "loss": 0.69, "lr": 3.419330002387514e-05, "epoch": 4.42135835567471, "percentage": 44.21, "elapsed_time": "2:02:46", "remaining_time": "2:34:55", "throughput": 2323.18, "total_tokens": 17114832} {"current_steps": 29690, "total_steps": 67140, "loss": 0.5326, "lr": 3.418725623255503e-05, "epoch": 4.422103068215669, "percentage": 44.22, "elapsed_time": "2:02:48", "remaining_time": "2:34:53", "throughput": 2323.19, "total_tokens": 17117360} {"current_steps": 29695, "total_steps": 67140, "loss": 0.7524, "lr": 3.418121182039749e-05, "epoch": 4.422847780756628, "percentage": 44.23, "elapsed_time": "2:02:49", "remaining_time": "2:34:52", "throughput": 2323.24, "total_tokens": 17120464} {"current_steps": 29700, "total_steps": 67140, "loss": 0.6243, "lr": 3.4175166787811004e-05, "epoch": 4.423592493297587, "percentage": 44.24, "elapsed_time": "2:02:50", "remaining_time": "2:34:51", "throughput": 2323.27, "total_tokens": 17123312} {"current_steps": 29705, "total_steps": 67140, "loss": 0.6117, "lr": 3.416912113520403e-05, "epoch": 4.424337205838547, "percentage": 44.24, "elapsed_time": "2:02:51", "remaining_time": "2:34:49", "throughput": 2323.3, "total_tokens": 17126192} {"current_steps": 29710, "total_steps": 67140, "loss": 0.6212, "lr": 3.416307486298513e-05, "epoch": 4.425081918379505, "percentage": 44.25, "elapsed_time": "2:02:52", "remaining_time": "2:34:48", "throughput": 2323.31, "total_tokens": 17128848} {"current_steps": 29715, "total_steps": 67140, "loss": 0.5282, "lr": 3.4157027971562897e-05, "epoch": 4.425826630920465, "percentage": 44.26, "elapsed_time": "2:02:53", "remaining_time": "2:34:46", "throughput": 2323.35, "total_tokens": 17131792} {"current_steps": 29720, "total_steps": 67140, "loss": 0.5202, "lr": 3.4150980461345945e-05, "epoch": 4.426571343461424, "percentage": 44.27, "elapsed_time": "2:02:54", "remaining_time": "2:34:45", "throughput": 2323.36, "total_tokens": 17134416} {"current_steps": 29725, "total_steps": 67140, "loss": 0.569, "lr": 3.414493233274293e-05, "epoch": 4.427316056002383, "percentage": 44.27, "elapsed_time": "2:02:56", "remaining_time": "2:34:44", "throughput": 2323.44, "total_tokens": 17137712} {"current_steps": 29730, "total_steps": 67140, "loss": 0.6108, "lr": 3.413888358616256e-05, "epoch": 4.428060768543342, "percentage": 44.28, "elapsed_time": "2:02:57", "remaining_time": "2:34:42", "throughput": 2323.47, "total_tokens": 17140528} {"current_steps": 29735, "total_steps": 67140, "loss": 0.5899, "lr": 3.413283422201361e-05, "epoch": 4.428805481084302, "percentage": 44.29, "elapsed_time": "2:02:58", "remaining_time": "2:34:41", "throughput": 2323.52, "total_tokens": 17143568} {"current_steps": 29740, "total_steps": 67140, "loss": 0.6362, "lr": 3.412678424070485e-05, "epoch": 4.429550193625261, "percentage": 44.3, "elapsed_time": "2:02:59", "remaining_time": "2:34:40", "throughput": 2323.55, "total_tokens": 17146480} {"current_steps": 29745, "total_steps": 67140, "loss": 0.5479, "lr": 3.4120733642645114e-05, "epoch": 4.43029490616622, "percentage": 44.3, "elapsed_time": "2:03:00", "remaining_time": "2:34:38", "throughput": 2323.59, "total_tokens": 17149424} {"current_steps": 29750, "total_steps": 67140, "loss": 0.5536, "lr": 3.411468242824328e-05, "epoch": 4.431039618707179, "percentage": 44.31, "elapsed_time": "2:03:01", "remaining_time": "2:34:37", "throughput": 2323.63, "total_tokens": 17152336} {"current_steps": 29755, "total_steps": 67140, "loss": 0.5773, "lr": 3.410863059790827e-05, "epoch": 4.431784331248139, "percentage": 44.32, "elapsed_time": "2:03:02", "remaining_time": "2:34:35", "throughput": 2323.65, "total_tokens": 17155152} {"current_steps": 29760, "total_steps": 67140, "loss": 0.5171, "lr": 3.4102578152049035e-05, "epoch": 4.432529043789097, "percentage": 44.33, "elapsed_time": "2:03:03", "remaining_time": "2:34:34", "throughput": 2323.68, "total_tokens": 17157936} {"current_steps": 29765, "total_steps": 67140, "loss": 0.5719, "lr": 3.4096525091074585e-05, "epoch": 4.433273756330056, "percentage": 44.33, "elapsed_time": "2:03:05", "remaining_time": "2:34:33", "throughput": 2323.72, "total_tokens": 17160880} {"current_steps": 29770, "total_steps": 67140, "loss": 0.5889, "lr": 3.409047141539394e-05, "epoch": 4.434018468871016, "percentage": 44.34, "elapsed_time": "2:03:06", "remaining_time": "2:34:31", "throughput": 2323.75, "total_tokens": 17163664} {"current_steps": 29775, "total_steps": 67140, "loss": 0.5192, "lr": 3.40844171254162e-05, "epoch": 4.434763181411975, "percentage": 44.35, "elapsed_time": "2:03:07", "remaining_time": "2:34:30", "throughput": 2323.79, "total_tokens": 17166640} {"current_steps": 29780, "total_steps": 67140, "loss": 0.6761, "lr": 3.4078362221550485e-05, "epoch": 4.435507893952934, "percentage": 44.36, "elapsed_time": "2:03:08", "remaining_time": "2:34:29", "throughput": 2323.84, "total_tokens": 17169712} {"current_steps": 29785, "total_steps": 67140, "loss": 0.52, "lr": 3.4072306704205966e-05, "epoch": 4.436252606493893, "percentage": 44.36, "elapsed_time": "2:03:09", "remaining_time": "2:34:27", "throughput": 2323.88, "total_tokens": 17172752} {"current_steps": 29790, "total_steps": 67140, "loss": 0.9299, "lr": 3.4066250573791834e-05, "epoch": 4.436997319034853, "percentage": 44.37, "elapsed_time": "2:03:10", "remaining_time": "2:34:26", "throughput": 2323.88, "total_tokens": 17175216} {"current_steps": 29795, "total_steps": 67140, "loss": 0.7296, "lr": 3.4060193830717355e-05, "epoch": 4.437742031575811, "percentage": 44.38, "elapsed_time": "2:03:11", "remaining_time": "2:34:24", "throughput": 2323.9, "total_tokens": 17177936} {"current_steps": 29800, "total_steps": 67140, "loss": 0.6115, "lr": 3.405413647539182e-05, "epoch": 4.438486744116771, "percentage": 44.38, "elapsed_time": "2:03:12", "remaining_time": "2:34:23", "throughput": 2323.93, "total_tokens": 17180784} {"current_steps": 29805, "total_steps": 67140, "loss": 0.7405, "lr": 3.404807850822455e-05, "epoch": 4.43923145665773, "percentage": 44.39, "elapsed_time": "2:03:14", "remaining_time": "2:34:22", "throughput": 2323.99, "total_tokens": 17184016} {"current_steps": 29810, "total_steps": 67140, "loss": 0.4528, "lr": 3.4042019929624916e-05, "epoch": 4.439976169198689, "percentage": 44.4, "elapsed_time": "2:03:15", "remaining_time": "2:34:20", "throughput": 2324.03, "total_tokens": 17186992} {"current_steps": 29815, "total_steps": 67140, "loss": 0.853, "lr": 3.403596074000234e-05, "epoch": 4.440720881739648, "percentage": 44.41, "elapsed_time": "2:03:16", "remaining_time": "2:34:19", "throughput": 2324.08, "total_tokens": 17190096} {"current_steps": 29820, "total_steps": 67140, "loss": 0.6689, "lr": 3.402990093976628e-05, "epoch": 4.441465594280608, "percentage": 44.41, "elapsed_time": "2:03:17", "remaining_time": "2:34:18", "throughput": 2324.12, "total_tokens": 17193040} {"current_steps": 29825, "total_steps": 67140, "loss": 0.6833, "lr": 3.402384052932622e-05, "epoch": 4.442210306821567, "percentage": 44.42, "elapsed_time": "2:03:18", "remaining_time": "2:34:16", "throughput": 2324.15, "total_tokens": 17195856} {"current_steps": 29830, "total_steps": 67140, "loss": 0.7742, "lr": 3.4017779509091705e-05, "epoch": 4.442955019362526, "percentage": 44.43, "elapsed_time": "2:03:19", "remaining_time": "2:34:15", "throughput": 2324.19, "total_tokens": 17198800} {"current_steps": 29835, "total_steps": 67140, "loss": 0.6537, "lr": 3.4011717879472315e-05, "epoch": 4.443699731903485, "percentage": 44.44, "elapsed_time": "2:03:21", "remaining_time": "2:34:14", "throughput": 2324.23, "total_tokens": 17201776} {"current_steps": 29840, "total_steps": 67140, "loss": 0.8067, "lr": 3.400565564087767e-05, "epoch": 4.444444444444445, "percentage": 44.44, "elapsed_time": "2:03:22", "remaining_time": "2:34:12", "throughput": 2324.25, "total_tokens": 17204464} {"current_steps": 29845, "total_steps": 67140, "loss": 0.6989, "lr": 3.399959279371743e-05, "epoch": 4.445189156985403, "percentage": 44.45, "elapsed_time": "2:03:23", "remaining_time": "2:34:11", "throughput": 2324.27, "total_tokens": 17207280} {"current_steps": 29850, "total_steps": 67140, "loss": 0.6915, "lr": 3.399352933840131e-05, "epoch": 4.445933869526363, "percentage": 44.46, "elapsed_time": "2:03:24", "remaining_time": "2:34:09", "throughput": 2324.29, "total_tokens": 17210032} {"current_steps": 29855, "total_steps": 67140, "loss": 0.4804, "lr": 3.3987465275339034e-05, "epoch": 4.446678582067322, "percentage": 44.47, "elapsed_time": "2:03:25", "remaining_time": "2:34:08", "throughput": 2324.31, "total_tokens": 17212720} {"current_steps": 29860, "total_steps": 67140, "loss": 0.6498, "lr": 3.3981400604940393e-05, "epoch": 4.4474232946082815, "percentage": 44.47, "elapsed_time": "2:03:26", "remaining_time": "2:34:07", "throughput": 2324.32, "total_tokens": 17215344} {"current_steps": 29865, "total_steps": 67140, "loss": 0.5714, "lr": 3.397533532761522e-05, "epoch": 4.44816800714924, "percentage": 44.48, "elapsed_time": "2:03:27", "remaining_time": "2:34:05", "throughput": 2324.37, "total_tokens": 17218320} {"current_steps": 29870, "total_steps": 67140, "loss": 0.8035, "lr": 3.3969269443773364e-05, "epoch": 4.4489127196902, "percentage": 44.49, "elapsed_time": "2:03:28", "remaining_time": "2:34:04", "throughput": 2324.4, "total_tokens": 17221264} {"current_steps": 29875, "total_steps": 67140, "loss": 0.6323, "lr": 3.396320295382476e-05, "epoch": 4.449657432231159, "percentage": 44.5, "elapsed_time": "2:03:30", "remaining_time": "2:34:03", "throughput": 2324.45, "total_tokens": 17224304} {"current_steps": 29880, "total_steps": 67140, "loss": 0.5994, "lr": 3.3957135858179335e-05, "epoch": 4.450402144772118, "percentage": 44.5, "elapsed_time": "2:03:31", "remaining_time": "2:34:01", "throughput": 2324.47, "total_tokens": 17227088} {"current_steps": 29885, "total_steps": 67140, "loss": 0.498, "lr": 3.395106815724709e-05, "epoch": 4.451146857313077, "percentage": 44.51, "elapsed_time": "2:03:32", "remaining_time": "2:34:00", "throughput": 2324.49, "total_tokens": 17229776} {"current_steps": 29890, "total_steps": 67140, "loss": 0.5698, "lr": 3.3944999851438045e-05, "epoch": 4.451891569854037, "percentage": 44.52, "elapsed_time": "2:03:33", "remaining_time": "2:33:58", "throughput": 2324.53, "total_tokens": 17232752} {"current_steps": 29895, "total_steps": 67140, "loss": 0.6002, "lr": 3.3938930941162285e-05, "epoch": 4.452636282394995, "percentage": 44.53, "elapsed_time": "2:03:34", "remaining_time": "2:33:57", "throughput": 2324.58, "total_tokens": 17235856} {"current_steps": 29900, "total_steps": 67140, "loss": 0.6628, "lr": 3.393286142682991e-05, "epoch": 4.453380994935955, "percentage": 44.53, "elapsed_time": "2:03:35", "remaining_time": "2:33:56", "throughput": 2324.63, "total_tokens": 17238992} {"current_steps": 29905, "total_steps": 67140, "loss": 0.621, "lr": 3.392679130885108e-05, "epoch": 4.454125707476914, "percentage": 44.54, "elapsed_time": "2:03:36", "remaining_time": "2:33:54", "throughput": 2324.68, "total_tokens": 17242064} {"current_steps": 29910, "total_steps": 67140, "loss": 0.7097, "lr": 3.392072058763598e-05, "epoch": 4.4548704200178735, "percentage": 44.55, "elapsed_time": "2:03:38", "remaining_time": "2:33:53", "throughput": 2324.7, "total_tokens": 17244816} {"current_steps": 29915, "total_steps": 67140, "loss": 0.6064, "lr": 3.391464926359487e-05, "epoch": 4.455615132558832, "percentage": 44.56, "elapsed_time": "2:03:39", "remaining_time": "2:33:52", "throughput": 2324.76, "total_tokens": 17247984} {"current_steps": 29920, "total_steps": 67140, "loss": 0.5862, "lr": 3.390857733713799e-05, "epoch": 4.456359845099792, "percentage": 44.56, "elapsed_time": "2:03:40", "remaining_time": "2:33:50", "throughput": 2324.8, "total_tokens": 17250992} {"current_steps": 29925, "total_steps": 67140, "loss": 0.4937, "lr": 3.3902504808675684e-05, "epoch": 4.457104557640751, "percentage": 44.57, "elapsed_time": "2:03:41", "remaining_time": "2:33:49", "throughput": 2324.86, "total_tokens": 17254128} {"current_steps": 29930, "total_steps": 67140, "loss": 0.5249, "lr": 3.389643167861829e-05, "epoch": 4.457849270181709, "percentage": 44.58, "elapsed_time": "2:03:42", "remaining_time": "2:33:48", "throughput": 2324.91, "total_tokens": 17257200} {"current_steps": 29935, "total_steps": 67140, "loss": 0.803, "lr": 3.3890357947376216e-05, "epoch": 4.458593982722669, "percentage": 44.59, "elapsed_time": "2:03:43", "remaining_time": "2:33:46", "throughput": 2324.95, "total_tokens": 17260112} {"current_steps": 29940, "total_steps": 67140, "loss": 0.5105, "lr": 3.38842836153599e-05, "epoch": 4.459338695263629, "percentage": 44.59, "elapsed_time": "2:03:45", "remaining_time": "2:33:45", "throughput": 2324.98, "total_tokens": 17263024} {"current_steps": 29945, "total_steps": 67140, "loss": 0.5213, "lr": 3.3878208682979815e-05, "epoch": 4.4600834078045875, "percentage": 44.6, "elapsed_time": "2:03:46", "remaining_time": "2:33:44", "throughput": 2325.0, "total_tokens": 17265712} {"current_steps": 29950, "total_steps": 67140, "loss": 0.7408, "lr": 3.3872133150646484e-05, "epoch": 4.460828120345546, "percentage": 44.61, "elapsed_time": "2:03:47", "remaining_time": "2:33:42", "throughput": 2325.04, "total_tokens": 17268688} {"current_steps": 29955, "total_steps": 67140, "loss": 0.647, "lr": 3.386605701877047e-05, "epoch": 4.461572832886506, "percentage": 44.62, "elapsed_time": "2:03:48", "remaining_time": "2:33:41", "throughput": 2325.09, "total_tokens": 17271824} {"current_steps": 29960, "total_steps": 67140, "loss": 0.6444, "lr": 3.3859980287762364e-05, "epoch": 4.462317545427465, "percentage": 44.62, "elapsed_time": "2:03:49", "remaining_time": "2:33:40", "throughput": 2325.13, "total_tokens": 17274832} {"current_steps": 29965, "total_steps": 67140, "loss": 0.6635, "lr": 3.385390295803281e-05, "epoch": 4.463062257968424, "percentage": 44.63, "elapsed_time": "2:03:50", "remaining_time": "2:33:38", "throughput": 2325.16, "total_tokens": 17277776} {"current_steps": 29970, "total_steps": 67140, "loss": 0.5981, "lr": 3.3847825029992495e-05, "epoch": 4.463806970509383, "percentage": 44.64, "elapsed_time": "2:03:51", "remaining_time": "2:33:37", "throughput": 2325.16, "total_tokens": 17280240} {"current_steps": 29975, "total_steps": 67140, "loss": 0.7339, "lr": 3.384174650405213e-05, "epoch": 4.464551683050343, "percentage": 44.65, "elapsed_time": "2:03:53", "remaining_time": "2:33:35", "throughput": 2325.2, "total_tokens": 17283184} {"current_steps": 29980, "total_steps": 67140, "loss": 0.613, "lr": 3.3835667380622497e-05, "epoch": 4.465296395591301, "percentage": 44.65, "elapsed_time": "2:03:54", "remaining_time": "2:33:34", "throughput": 2325.22, "total_tokens": 17285936} {"current_steps": 29985, "total_steps": 67140, "loss": 0.5972, "lr": 3.382958766011439e-05, "epoch": 4.466041108132261, "percentage": 44.66, "elapsed_time": "2:03:55", "remaining_time": "2:33:33", "throughput": 2325.26, "total_tokens": 17289008} {"current_steps": 29990, "total_steps": 67140, "loss": 0.5784, "lr": 3.3823507342938634e-05, "epoch": 4.46678582067322, "percentage": 44.67, "elapsed_time": "2:03:56", "remaining_time": "2:33:31", "throughput": 2325.31, "total_tokens": 17292080} {"current_steps": 29995, "total_steps": 67140, "loss": 0.6601, "lr": 3.381742642950612e-05, "epoch": 4.4675305332141795, "percentage": 44.68, "elapsed_time": "2:03:57", "remaining_time": "2:33:30", "throughput": 2325.35, "total_tokens": 17295056} {"current_steps": 30000, "total_steps": 67140, "loss": 0.5502, "lr": 3.3811344920227795e-05, "epoch": 4.468275245755138, "percentage": 44.68, "elapsed_time": "2:03:58", "remaining_time": "2:33:29", "throughput": 2325.41, "total_tokens": 17298224} {"current_steps": 30005, "total_steps": 67140, "loss": 0.6928, "lr": 3.3805262815514596e-05, "epoch": 4.469019958296098, "percentage": 44.69, "elapsed_time": "2:03:59", "remaining_time": "2:33:27", "throughput": 2325.43, "total_tokens": 17300976} {"current_steps": 30010, "total_steps": 67140, "loss": 0.5634, "lr": 3.379918011577753e-05, "epoch": 4.469764670837057, "percentage": 44.7, "elapsed_time": "2:04:01", "remaining_time": "2:33:26", "throughput": 2325.48, "total_tokens": 17304048} {"current_steps": 30015, "total_steps": 67140, "loss": 0.6148, "lr": 3.379309682142766e-05, "epoch": 4.470509383378016, "percentage": 44.71, "elapsed_time": "2:04:02", "remaining_time": "2:33:25", "throughput": 2325.51, "total_tokens": 17306896} {"current_steps": 30020, "total_steps": 67140, "loss": 0.544, "lr": 3.3787012932876036e-05, "epoch": 4.471254095918975, "percentage": 44.71, "elapsed_time": "2:04:03", "remaining_time": "2:33:23", "throughput": 2325.54, "total_tokens": 17309776} {"current_steps": 30025, "total_steps": 67140, "loss": 0.4779, "lr": 3.378092845053382e-05, "epoch": 4.471998808459935, "percentage": 44.72, "elapsed_time": "2:04:04", "remaining_time": "2:33:22", "throughput": 2325.58, "total_tokens": 17312784} {"current_steps": 30030, "total_steps": 67140, "loss": 0.8078, "lr": 3.377484337481216e-05, "epoch": 4.4727435210008935, "percentage": 44.73, "elapsed_time": "2:04:05", "remaining_time": "2:33:20", "throughput": 2325.6, "total_tokens": 17315440} {"current_steps": 30035, "total_steps": 67140, "loss": 0.5303, "lr": 3.376875770612226e-05, "epoch": 4.473488233541853, "percentage": 44.73, "elapsed_time": "2:04:06", "remaining_time": "2:33:19", "throughput": 2325.62, "total_tokens": 17318256} {"current_steps": 30040, "total_steps": 67140, "loss": 0.7207, "lr": 3.376267144487535e-05, "epoch": 4.474232946082812, "percentage": 44.74, "elapsed_time": "2:04:07", "remaining_time": "2:33:18", "throughput": 2325.66, "total_tokens": 17321168} {"current_steps": 30045, "total_steps": 67140, "loss": 0.6616, "lr": 3.375658459148275e-05, "epoch": 4.4749776586237715, "percentage": 44.75, "elapsed_time": "2:04:09", "remaining_time": "2:33:16", "throughput": 2325.7, "total_tokens": 17324112} {"current_steps": 30050, "total_steps": 67140, "loss": 0.672, "lr": 3.375049714635577e-05, "epoch": 4.47572237116473, "percentage": 44.76, "elapsed_time": "2:04:10", "remaining_time": "2:33:15", "throughput": 2325.74, "total_tokens": 17327152} {"current_steps": 30055, "total_steps": 67140, "loss": 0.6239, "lr": 3.374440910990574e-05, "epoch": 4.47646708370569, "percentage": 44.76, "elapsed_time": "2:04:11", "remaining_time": "2:33:14", "throughput": 2325.79, "total_tokens": 17330224} {"current_steps": 30060, "total_steps": 67140, "loss": 0.6272, "lr": 3.3738320482544116e-05, "epoch": 4.477211796246649, "percentage": 44.77, "elapsed_time": "2:04:12", "remaining_time": "2:33:12", "throughput": 2325.82, "total_tokens": 17333104} {"current_steps": 30065, "total_steps": 67140, "loss": 0.6888, "lr": 3.3732231264682326e-05, "epoch": 4.477956508787608, "percentage": 44.78, "elapsed_time": "2:04:13", "remaining_time": "2:33:11", "throughput": 2325.84, "total_tokens": 17335824} {"current_steps": 30070, "total_steps": 67140, "loss": 0.546, "lr": 3.3726141456731835e-05, "epoch": 4.478701221328567, "percentage": 44.79, "elapsed_time": "2:04:14", "remaining_time": "2:33:10", "throughput": 2325.86, "total_tokens": 17338544} {"current_steps": 30075, "total_steps": 67140, "loss": 0.532, "lr": 3.3720051059104186e-05, "epoch": 4.479445933869527, "percentage": 44.79, "elapsed_time": "2:04:15", "remaining_time": "2:33:08", "throughput": 2325.9, "total_tokens": 17341488} {"current_steps": 30080, "total_steps": 67140, "loss": 0.5864, "lr": 3.371396007221094e-05, "epoch": 4.4801906464104855, "percentage": 44.8, "elapsed_time": "2:04:17", "remaining_time": "2:33:07", "throughput": 2325.96, "total_tokens": 17344688} {"current_steps": 30085, "total_steps": 67140, "loss": 0.6577, "lr": 3.3707868496463705e-05, "epoch": 4.480935358951445, "percentage": 44.81, "elapsed_time": "2:04:18", "remaining_time": "2:33:06", "throughput": 2325.98, "total_tokens": 17347472} {"current_steps": 30090, "total_steps": 67140, "loss": 0.6907, "lr": 3.3701776332274116e-05, "epoch": 4.481680071492404, "percentage": 44.82, "elapsed_time": "2:04:19", "remaining_time": "2:33:04", "throughput": 2326.02, "total_tokens": 17350448} {"current_steps": 30095, "total_steps": 67140, "loss": 0.7012, "lr": 3.3695683580053865e-05, "epoch": 4.4824247840333635, "percentage": 44.82, "elapsed_time": "2:04:20", "remaining_time": "2:33:03", "throughput": 2326.05, "total_tokens": 17353328} {"current_steps": 30100, "total_steps": 67140, "loss": 0.6231, "lr": 3.368959024021467e-05, "epoch": 4.483169496574322, "percentage": 44.83, "elapsed_time": "2:04:21", "remaining_time": "2:33:01", "throughput": 2326.08, "total_tokens": 17356112} {"current_steps": 30105, "total_steps": 67140, "loss": 0.7139, "lr": 3.3683496313168294e-05, "epoch": 4.483914209115282, "percentage": 44.84, "elapsed_time": "2:04:22", "remaining_time": "2:33:00", "throughput": 2326.1, "total_tokens": 17358896} {"current_steps": 30110, "total_steps": 67140, "loss": 0.7087, "lr": 3.367740179932655e-05, "epoch": 4.484658921656241, "percentage": 44.85, "elapsed_time": "2:04:23", "remaining_time": "2:32:59", "throughput": 2326.12, "total_tokens": 17361680} {"current_steps": 30115, "total_steps": 67140, "loss": 0.607, "lr": 3.3671306699101266e-05, "epoch": 4.4854036341971995, "percentage": 44.85, "elapsed_time": "2:04:24", "remaining_time": "2:32:57", "throughput": 2326.14, "total_tokens": 17364432} {"current_steps": 30120, "total_steps": 67140, "loss": 0.7231, "lr": 3.3665211012904324e-05, "epoch": 4.486148346738159, "percentage": 44.86, "elapsed_time": "2:04:26", "remaining_time": "2:32:56", "throughput": 2326.15, "total_tokens": 17367152} {"current_steps": 30125, "total_steps": 67140, "loss": 0.5611, "lr": 3.365911474114766e-05, "epoch": 4.486893059279118, "percentage": 44.87, "elapsed_time": "2:04:27", "remaining_time": "2:32:55", "throughput": 2326.2, "total_tokens": 17370192} {"current_steps": 30130, "total_steps": 67140, "loss": 0.5897, "lr": 3.3653017884243224e-05, "epoch": 4.4876377718200775, "percentage": 44.88, "elapsed_time": "2:04:28", "remaining_time": "2:32:53", "throughput": 2326.24, "total_tokens": 17373136} {"current_steps": 30135, "total_steps": 67140, "loss": 0.5394, "lr": 3.364692044260302e-05, "epoch": 4.488382484361036, "percentage": 44.88, "elapsed_time": "2:04:29", "remaining_time": "2:32:52", "throughput": 2326.27, "total_tokens": 17375920} {"current_steps": 30140, "total_steps": 67140, "loss": 0.4892, "lr": 3.3640822416639086e-05, "epoch": 4.489127196901996, "percentage": 44.89, "elapsed_time": "2:04:30", "remaining_time": "2:32:50", "throughput": 2326.29, "total_tokens": 17378672} {"current_steps": 30145, "total_steps": 67140, "loss": 0.6237, "lr": 3.363472380676351e-05, "epoch": 4.489871909442955, "percentage": 44.9, "elapsed_time": "2:04:31", "remaining_time": "2:32:49", "throughput": 2326.33, "total_tokens": 17381552} {"current_steps": 30150, "total_steps": 67140, "loss": 0.6153, "lr": 3.3628624613388407e-05, "epoch": 4.490616621983914, "percentage": 44.91, "elapsed_time": "2:04:32", "remaining_time": "2:32:48", "throughput": 2326.36, "total_tokens": 17384400} {"current_steps": 30155, "total_steps": 67140, "loss": 0.598, "lr": 3.362252483692593e-05, "epoch": 4.491361334524873, "percentage": 44.91, "elapsed_time": "2:04:33", "remaining_time": "2:32:46", "throughput": 2326.38, "total_tokens": 17387152} {"current_steps": 30160, "total_steps": 67140, "loss": 0.5036, "lr": 3.361642447778828e-05, "epoch": 4.492106047065833, "percentage": 44.92, "elapsed_time": "2:04:34", "remaining_time": "2:32:45", "throughput": 2326.38, "total_tokens": 17389680} {"current_steps": 30165, "total_steps": 67140, "loss": 0.4774, "lr": 3.36103235363877e-05, "epoch": 4.4928507596067915, "percentage": 44.93, "elapsed_time": "2:04:36", "remaining_time": "2:32:43", "throughput": 2326.4, "total_tokens": 17392304} {"current_steps": 30170, "total_steps": 67140, "loss": 0.6263, "lr": 3.360422201313646e-05, "epoch": 4.493595472147751, "percentage": 44.94, "elapsed_time": "2:04:37", "remaining_time": "2:32:42", "throughput": 2326.43, "total_tokens": 17395184} {"current_steps": 30175, "total_steps": 67140, "loss": 0.4619, "lr": 3.3598119908446866e-05, "epoch": 4.49434018468871, "percentage": 44.94, "elapsed_time": "2:04:38", "remaining_time": "2:32:41", "throughput": 2326.49, "total_tokens": 17398320} {"current_steps": 30180, "total_steps": 67140, "loss": 0.8168, "lr": 3.3592017222731304e-05, "epoch": 4.4950848972296695, "percentage": 44.95, "elapsed_time": "2:04:39", "remaining_time": "2:32:39", "throughput": 2326.54, "total_tokens": 17401520} {"current_steps": 30185, "total_steps": 67140, "loss": 0.6596, "lr": 3.358591395640215e-05, "epoch": 4.495829609770628, "percentage": 44.96, "elapsed_time": "2:04:40", "remaining_time": "2:32:38", "throughput": 2326.58, "total_tokens": 17404496} {"current_steps": 30190, "total_steps": 67140, "loss": 0.6613, "lr": 3.357981010987183e-05, "epoch": 4.496574322311588, "percentage": 44.97, "elapsed_time": "2:04:41", "remaining_time": "2:32:37", "throughput": 2326.65, "total_tokens": 17407728} {"current_steps": 30195, "total_steps": 67140, "loss": 0.6607, "lr": 3.3573705683552824e-05, "epoch": 4.497319034852547, "percentage": 44.97, "elapsed_time": "2:04:43", "remaining_time": "2:32:35", "throughput": 2326.7, "total_tokens": 17410832} {"current_steps": 30200, "total_steps": 67140, "loss": 0.8879, "lr": 3.356760067785765e-05, "epoch": 4.498063747393506, "percentage": 44.98, "elapsed_time": "2:04:44", "remaining_time": "2:32:34", "throughput": 2326.71, "total_tokens": 17413552} {"current_steps": 30205, "total_steps": 67140, "loss": 0.5839, "lr": 3.356149509319886e-05, "epoch": 4.498808459934465, "percentage": 44.99, "elapsed_time": "2:04:45", "remaining_time": "2:32:33", "throughput": 2326.75, "total_tokens": 17416464} {"current_steps": 30210, "total_steps": 67140, "loss": 0.6846, "lr": 3.355538892998904e-05, "epoch": 4.499553172475425, "percentage": 45.0, "elapsed_time": "2:04:46", "remaining_time": "2:32:31", "throughput": 2326.76, "total_tokens": 17419088} {"current_steps": 30213, "total_steps": 67140, "eval_loss": 0.6573360562324524, "epoch": 4.5, "percentage": 45.0, "elapsed_time": "2:06:01", "remaining_time": "2:34:01", "throughput": 2303.91, "total_tokens": 17420720} {"current_steps": 30215, "total_steps": 67140, "loss": 0.5492, "lr": 3.3549282188640815e-05, "epoch": 4.5002978850163835, "percentage": 45.0, "elapsed_time": "2:06:03", "remaining_time": "2:34:02", "throughput": 2303.47, "total_tokens": 17421968} {"current_steps": 30220, "total_steps": 67140, "loss": 0.6098, "lr": 3.354317486956685e-05, "epoch": 4.501042597557343, "percentage": 45.01, "elapsed_time": "2:06:04", "remaining_time": "2:34:01", "throughput": 2303.5, "total_tokens": 17424752} {"current_steps": 30225, "total_steps": 67140, "loss": 0.5951, "lr": 3.353706697317988e-05, "epoch": 4.501787310098302, "percentage": 45.02, "elapsed_time": "2:06:05", "remaining_time": "2:34:00", "throughput": 2303.55, "total_tokens": 17427728} {"current_steps": 30230, "total_steps": 67140, "loss": 0.6315, "lr": 3.353095849989262e-05, "epoch": 4.5025320226392616, "percentage": 45.03, "elapsed_time": "2:06:06", "remaining_time": "2:33:58", "throughput": 2303.6, "total_tokens": 17430800} {"current_steps": 30235, "total_steps": 67140, "loss": 0.6495, "lr": 3.352484945011787e-05, "epoch": 4.50327673518022, "percentage": 45.03, "elapsed_time": "2:06:07", "remaining_time": "2:33:57", "throughput": 2303.64, "total_tokens": 17433776} {"current_steps": 30240, "total_steps": 67140, "loss": 0.6105, "lr": 3.351873982426846e-05, "epoch": 4.50402144772118, "percentage": 45.04, "elapsed_time": "2:06:09", "remaining_time": "2:33:56", "throughput": 2303.68, "total_tokens": 17436752} {"current_steps": 30245, "total_steps": 67140, "loss": 0.5802, "lr": 3.3512629622757245e-05, "epoch": 4.504766160262139, "percentage": 45.05, "elapsed_time": "2:06:10", "remaining_time": "2:33:54", "throughput": 2303.75, "total_tokens": 17439952} {"current_steps": 30250, "total_steps": 67140, "loss": 0.7294, "lr": 3.350651884599713e-05, "epoch": 4.505510872803098, "percentage": 45.06, "elapsed_time": "2:06:11", "remaining_time": "2:33:53", "throughput": 2303.77, "total_tokens": 17442768} {"current_steps": 30255, "total_steps": 67140, "loss": 0.5106, "lr": 3.350040749440105e-05, "epoch": 4.506255585344057, "percentage": 45.06, "elapsed_time": "2:06:12", "remaining_time": "2:33:51", "throughput": 2303.82, "total_tokens": 17445712} {"current_steps": 30260, "total_steps": 67140, "loss": 0.5679, "lr": 3.3494295568382006e-05, "epoch": 4.507000297885017, "percentage": 45.07, "elapsed_time": "2:06:13", "remaining_time": "2:33:50", "throughput": 2303.87, "total_tokens": 17448816} {"current_steps": 30265, "total_steps": 67140, "loss": 0.5659, "lr": 3.348818306835299e-05, "epoch": 4.5077450104259755, "percentage": 45.08, "elapsed_time": "2:06:14", "remaining_time": "2:33:49", "throughput": 2303.91, "total_tokens": 17451728} {"current_steps": 30270, "total_steps": 67140, "loss": 0.8028, "lr": 3.348206999472708e-05, "epoch": 4.508489722966935, "percentage": 45.08, "elapsed_time": "2:06:16", "remaining_time": "2:33:47", "throughput": 2303.96, "total_tokens": 17454832} {"current_steps": 30275, "total_steps": 67140, "loss": 0.5074, "lr": 3.3475956347917356e-05, "epoch": 4.509234435507894, "percentage": 45.09, "elapsed_time": "2:06:17", "remaining_time": "2:33:46", "throughput": 2304.0, "total_tokens": 17457744} {"current_steps": 30280, "total_steps": 67140, "loss": 0.7424, "lr": 3.346984212833697e-05, "epoch": 4.509979148048853, "percentage": 45.1, "elapsed_time": "2:06:18", "remaining_time": "2:33:45", "throughput": 2304.03, "total_tokens": 17460624} {"current_steps": 30285, "total_steps": 67140, "loss": 0.7297, "lr": 3.346372733639909e-05, "epoch": 4.510723860589812, "percentage": 45.11, "elapsed_time": "2:06:19", "remaining_time": "2:33:43", "throughput": 2304.09, "total_tokens": 17463792} {"current_steps": 30290, "total_steps": 67140, "loss": 0.713, "lr": 3.345761197251692e-05, "epoch": 4.511468573130772, "percentage": 45.11, "elapsed_time": "2:06:20", "remaining_time": "2:33:42", "throughput": 2304.11, "total_tokens": 17466480} {"current_steps": 30295, "total_steps": 67140, "loss": 0.6295, "lr": 3.345149603710373e-05, "epoch": 4.512213285671731, "percentage": 45.12, "elapsed_time": "2:06:21", "remaining_time": "2:33:40", "throughput": 2304.12, "total_tokens": 17469040} {"current_steps": 30300, "total_steps": 67140, "loss": 0.6475, "lr": 3.344537953057279e-05, "epoch": 4.5129579982126895, "percentage": 45.13, "elapsed_time": "2:06:22", "remaining_time": "2:33:39", "throughput": 2304.15, "total_tokens": 17471920} {"current_steps": 30305, "total_steps": 67140, "loss": 0.6576, "lr": 3.343926245333745e-05, "epoch": 4.513702710753649, "percentage": 45.14, "elapsed_time": "2:06:24", "remaining_time": "2:33:38", "throughput": 2304.15, "total_tokens": 17474800} {"current_steps": 30310, "total_steps": 67140, "loss": 0.5654, "lr": 3.343314480581104e-05, "epoch": 4.514447423294608, "percentage": 45.14, "elapsed_time": "2:06:25", "remaining_time": "2:33:36", "throughput": 2304.18, "total_tokens": 17477616} {"current_steps": 30315, "total_steps": 67140, "loss": 0.5231, "lr": 3.342702658840702e-05, "epoch": 4.5151921358355676, "percentage": 45.15, "elapsed_time": "2:06:26", "remaining_time": "2:33:35", "throughput": 2304.19, "total_tokens": 17480208} {"current_steps": 30320, "total_steps": 67140, "loss": 0.7121, "lr": 3.3420907801538784e-05, "epoch": 4.515936848376526, "percentage": 45.16, "elapsed_time": "2:06:27", "remaining_time": "2:33:33", "throughput": 2304.22, "total_tokens": 17483056} {"current_steps": 30325, "total_steps": 67140, "loss": 0.6727, "lr": 3.3414788445619844e-05, "epoch": 4.516681560917486, "percentage": 45.17, "elapsed_time": "2:06:28", "remaining_time": "2:33:32", "throughput": 2304.27, "total_tokens": 17486032} {"current_steps": 30330, "total_steps": 67140, "loss": 0.7872, "lr": 3.340866852106371e-05, "epoch": 4.517426273458445, "percentage": 45.17, "elapsed_time": "2:06:29", "remaining_time": "2:33:31", "throughput": 2304.3, "total_tokens": 17488880} {"current_steps": 30335, "total_steps": 67140, "loss": 0.7155, "lr": 3.340254802828395e-05, "epoch": 4.518170985999404, "percentage": 45.18, "elapsed_time": "2:06:30", "remaining_time": "2:33:29", "throughput": 2304.31, "total_tokens": 17491600} {"current_steps": 30340, "total_steps": 67140, "loss": 0.6872, "lr": 3.339642696769415e-05, "epoch": 4.518915698540363, "percentage": 45.19, "elapsed_time": "2:06:31", "remaining_time": "2:33:28", "throughput": 2304.36, "total_tokens": 17494576} {"current_steps": 30345, "total_steps": 67140, "loss": 0.7464, "lr": 3.339030533970796e-05, "epoch": 4.519660411081323, "percentage": 45.2, "elapsed_time": "2:06:33", "remaining_time": "2:33:27", "throughput": 2304.4, "total_tokens": 17497456} {"current_steps": 30350, "total_steps": 67140, "loss": 0.705, "lr": 3.338418314473904e-05, "epoch": 4.5204051236222815, "percentage": 45.2, "elapsed_time": "2:06:34", "remaining_time": "2:33:25", "throughput": 2304.45, "total_tokens": 17500592} {"current_steps": 30355, "total_steps": 67140, "loss": 0.6107, "lr": 3.3378060383201116e-05, "epoch": 4.521149836163241, "percentage": 45.21, "elapsed_time": "2:06:35", "remaining_time": "2:33:24", "throughput": 2304.48, "total_tokens": 17503440} {"current_steps": 30360, "total_steps": 67140, "loss": 0.653, "lr": 3.337193705550793e-05, "epoch": 4.5218945487042, "percentage": 45.22, "elapsed_time": "2:06:36", "remaining_time": "2:33:22", "throughput": 2304.53, "total_tokens": 17506544} {"current_steps": 30365, "total_steps": 67140, "loss": 0.7836, "lr": 3.3365813162073284e-05, "epoch": 4.52263926124516, "percentage": 45.23, "elapsed_time": "2:06:37", "remaining_time": "2:33:21", "throughput": 2304.59, "total_tokens": 17509680} {"current_steps": 30370, "total_steps": 67140, "loss": 0.5728, "lr": 3.3359688703310984e-05, "epoch": 4.523383973786118, "percentage": 45.23, "elapsed_time": "2:06:38", "remaining_time": "2:33:20", "throughput": 2304.65, "total_tokens": 17512848} {"current_steps": 30375, "total_steps": 67140, "loss": 0.7004, "lr": 3.335356367963492e-05, "epoch": 4.524128686327078, "percentage": 45.24, "elapsed_time": "2:06:40", "remaining_time": "2:33:18", "throughput": 2304.68, "total_tokens": 17515696} {"current_steps": 30380, "total_steps": 67140, "loss": 0.6786, "lr": 3.334743809145898e-05, "epoch": 4.524873398868037, "percentage": 45.25, "elapsed_time": "2:06:41", "remaining_time": "2:33:17", "throughput": 2304.7, "total_tokens": 17518352} {"current_steps": 30385, "total_steps": 67140, "loss": 0.5579, "lr": 3.334131193919712e-05, "epoch": 4.525618111408996, "percentage": 45.26, "elapsed_time": "2:06:42", "remaining_time": "2:33:16", "throughput": 2304.72, "total_tokens": 17521072} {"current_steps": 30390, "total_steps": 67140, "loss": 0.523, "lr": 3.333518522326331e-05, "epoch": 4.526362823949955, "percentage": 45.26, "elapsed_time": "2:06:43", "remaining_time": "2:33:14", "throughput": 2304.74, "total_tokens": 17523824} {"current_steps": 30395, "total_steps": 67140, "loss": 0.5702, "lr": 3.3329057944071564e-05, "epoch": 4.527107536490915, "percentage": 45.27, "elapsed_time": "2:06:44", "remaining_time": "2:33:13", "throughput": 2304.81, "total_tokens": 17527120} {"current_steps": 30400, "total_steps": 67140, "loss": 0.7366, "lr": 3.332293010203595e-05, "epoch": 4.5278522490318736, "percentage": 45.28, "elapsed_time": "2:06:45", "remaining_time": "2:33:11", "throughput": 2304.86, "total_tokens": 17530224} {"current_steps": 30405, "total_steps": 67140, "loss": 0.631, "lr": 3.331680169757056e-05, "epoch": 4.528596961572833, "percentage": 45.29, "elapsed_time": "2:06:46", "remaining_time": "2:33:10", "throughput": 2304.88, "total_tokens": 17532944} {"current_steps": 30410, "total_steps": 67140, "loss": 0.6157, "lr": 3.331067273108952e-05, "epoch": 4.529341674113792, "percentage": 45.29, "elapsed_time": "2:06:48", "remaining_time": "2:33:09", "throughput": 2304.91, "total_tokens": 17535760} {"current_steps": 30415, "total_steps": 67140, "loss": 0.5731, "lr": 3.330454320300701e-05, "epoch": 4.530086386654752, "percentage": 45.3, "elapsed_time": "2:06:49", "remaining_time": "2:33:07", "throughput": 2304.94, "total_tokens": 17538608} {"current_steps": 30420, "total_steps": 67140, "loss": 0.6219, "lr": 3.329841311373723e-05, "epoch": 4.53083109919571, "percentage": 45.31, "elapsed_time": "2:06:50", "remaining_time": "2:33:06", "throughput": 2304.97, "total_tokens": 17541360} {"current_steps": 30425, "total_steps": 67140, "loss": 0.6042, "lr": 3.3292282463694435e-05, "epoch": 4.53157581173667, "percentage": 45.32, "elapsed_time": "2:06:51", "remaining_time": "2:33:04", "throughput": 2304.99, "total_tokens": 17544112} {"current_steps": 30430, "total_steps": 67140, "loss": 0.5911, "lr": 3.328615125329291e-05, "epoch": 4.532320524277629, "percentage": 45.32, "elapsed_time": "2:06:52", "remaining_time": "2:33:03", "throughput": 2305.06, "total_tokens": 17547344} {"current_steps": 30435, "total_steps": 67140, "loss": 0.6683, "lr": 3.328001948294695e-05, "epoch": 4.533065236818588, "percentage": 45.33, "elapsed_time": "2:06:53", "remaining_time": "2:33:02", "throughput": 2305.08, "total_tokens": 17550096} {"current_steps": 30440, "total_steps": 67140, "loss": 0.6495, "lr": 3.327388715307096e-05, "epoch": 4.533809949359547, "percentage": 45.34, "elapsed_time": "2:06:54", "remaining_time": "2:33:00", "throughput": 2305.13, "total_tokens": 17553136} {"current_steps": 30445, "total_steps": 67140, "loss": 0.6069, "lr": 3.3267754264079314e-05, "epoch": 4.534554661900506, "percentage": 45.35, "elapsed_time": "2:06:55", "remaining_time": "2:32:59", "throughput": 2305.17, "total_tokens": 17556016} {"current_steps": 30450, "total_steps": 67140, "loss": 0.7444, "lr": 3.326162081638644e-05, "epoch": 4.535299374441466, "percentage": 45.35, "elapsed_time": "2:06:57", "remaining_time": "2:32:58", "throughput": 2305.22, "total_tokens": 17559056} {"current_steps": 30455, "total_steps": 67140, "loss": 0.4694, "lr": 3.3255486810406825e-05, "epoch": 4.536044086982425, "percentage": 45.36, "elapsed_time": "2:06:58", "remaining_time": "2:32:56", "throughput": 2305.23, "total_tokens": 17561712} {"current_steps": 30460, "total_steps": 67140, "loss": 0.7125, "lr": 3.324935224655497e-05, "epoch": 4.536788799523384, "percentage": 45.37, "elapsed_time": "2:06:59", "remaining_time": "2:32:55", "throughput": 2305.27, "total_tokens": 17564656} {"current_steps": 30465, "total_steps": 67140, "loss": 0.6952, "lr": 3.324321712524544e-05, "epoch": 4.537533512064343, "percentage": 45.38, "elapsed_time": "2:07:00", "remaining_time": "2:32:53", "throughput": 2305.34, "total_tokens": 17567920} {"current_steps": 30470, "total_steps": 67140, "loss": 0.7329, "lr": 3.32370814468928e-05, "epoch": 4.538278224605302, "percentage": 45.38, "elapsed_time": "2:07:01", "remaining_time": "2:32:52", "throughput": 2305.39, "total_tokens": 17570928} {"current_steps": 30475, "total_steps": 67140, "loss": 0.5492, "lr": 3.323094521191169e-05, "epoch": 4.539022937146262, "percentage": 45.39, "elapsed_time": "2:07:02", "remaining_time": "2:32:51", "throughput": 2305.42, "total_tokens": 17573840} {"current_steps": 30480, "total_steps": 67140, "loss": 0.795, "lr": 3.322480842071677e-05, "epoch": 4.539767649687221, "percentage": 45.4, "elapsed_time": "2:07:03", "remaining_time": "2:32:49", "throughput": 2305.46, "total_tokens": 17576688} {"current_steps": 30485, "total_steps": 67140, "loss": 0.7578, "lr": 3.321867107372274e-05, "epoch": 4.5405123622281796, "percentage": 45.41, "elapsed_time": "2:07:05", "remaining_time": "2:32:48", "throughput": 2305.49, "total_tokens": 17579568} {"current_steps": 30490, "total_steps": 67140, "loss": 0.4681, "lr": 3.321253317134432e-05, "epoch": 4.541257074769139, "percentage": 45.41, "elapsed_time": "2:07:06", "remaining_time": "2:32:46", "throughput": 2305.52, "total_tokens": 17582384} {"current_steps": 30495, "total_steps": 67140, "loss": 0.7313, "lr": 3.320639471399631e-05, "epoch": 4.542001787310098, "percentage": 45.42, "elapsed_time": "2:07:07", "remaining_time": "2:32:45", "throughput": 2305.56, "total_tokens": 17585328} {"current_steps": 30500, "total_steps": 67140, "loss": 0.5647, "lr": 3.3200255702093506e-05, "epoch": 4.542746499851058, "percentage": 45.43, "elapsed_time": "2:07:08", "remaining_time": "2:32:44", "throughput": 2305.59, "total_tokens": 17588112} {"current_steps": 30505, "total_steps": 67140, "loss": 0.5533, "lr": 3.319411613605076e-05, "epoch": 4.543491212392016, "percentage": 45.43, "elapsed_time": "2:07:09", "remaining_time": "2:32:42", "throughput": 2305.62, "total_tokens": 17590928} {"current_steps": 30510, "total_steps": 67140, "loss": 0.5402, "lr": 3.3187976016282964e-05, "epoch": 4.544235924932976, "percentage": 45.44, "elapsed_time": "2:07:10", "remaining_time": "2:32:41", "throughput": 2305.66, "total_tokens": 17593904} {"current_steps": 30515, "total_steps": 67140, "loss": 0.4526, "lr": 3.3181835343205035e-05, "epoch": 4.544980637473935, "percentage": 45.45, "elapsed_time": "2:07:11", "remaining_time": "2:32:40", "throughput": 2305.69, "total_tokens": 17596752} {"current_steps": 30520, "total_steps": 67140, "loss": 0.7465, "lr": 3.317569411723194e-05, "epoch": 4.545725350014894, "percentage": 45.46, "elapsed_time": "2:07:12", "remaining_time": "2:32:38", "throughput": 2305.71, "total_tokens": 17599472} {"current_steps": 30525, "total_steps": 67140, "loss": 0.7274, "lr": 3.316955233877868e-05, "epoch": 4.546470062555853, "percentage": 45.46, "elapsed_time": "2:07:14", "remaining_time": "2:32:37", "throughput": 2305.74, "total_tokens": 17602320} {"current_steps": 30530, "total_steps": 67140, "loss": 0.6378, "lr": 3.316341000826029e-05, "epoch": 4.547214775096813, "percentage": 45.47, "elapsed_time": "2:07:15", "remaining_time": "2:32:35", "throughput": 2305.79, "total_tokens": 17605328} {"current_steps": 30535, "total_steps": 67140, "loss": 0.8051, "lr": 3.315726712609183e-05, "epoch": 4.547959487637772, "percentage": 45.48, "elapsed_time": "2:07:16", "remaining_time": "2:32:34", "throughput": 2305.82, "total_tokens": 17608240} {"current_steps": 30540, "total_steps": 67140, "loss": 0.5922, "lr": 3.3151123692688424e-05, "epoch": 4.548704200178731, "percentage": 45.49, "elapsed_time": "2:07:17", "remaining_time": "2:32:33", "throughput": 2305.85, "total_tokens": 17610992} {"current_steps": 30545, "total_steps": 67140, "loss": 0.5777, "lr": 3.3144979708465226e-05, "epoch": 4.54944891271969, "percentage": 45.49, "elapsed_time": "2:07:18", "remaining_time": "2:32:31", "throughput": 2305.87, "total_tokens": 17613712} {"current_steps": 30550, "total_steps": 67140, "loss": 0.5461, "lr": 3.313883517383741e-05, "epoch": 4.55019362526065, "percentage": 45.5, "elapsed_time": "2:07:19", "remaining_time": "2:32:30", "throughput": 2305.9, "total_tokens": 17616592} {"current_steps": 30555, "total_steps": 67140, "loss": 0.5897, "lr": 3.313269008922021e-05, "epoch": 4.550938337801608, "percentage": 45.51, "elapsed_time": "2:07:20", "remaining_time": "2:32:28", "throughput": 2305.96, "total_tokens": 17619728} {"current_steps": 30560, "total_steps": 67140, "loss": 0.5529, "lr": 3.312654445502887e-05, "epoch": 4.551683050342568, "percentage": 45.52, "elapsed_time": "2:07:22", "remaining_time": "2:32:27", "throughput": 2305.99, "total_tokens": 17622576} {"current_steps": 30565, "total_steps": 67140, "loss": 0.712, "lr": 3.3120398271678706e-05, "epoch": 4.552427762883527, "percentage": 45.52, "elapsed_time": "2:07:23", "remaining_time": "2:32:26", "throughput": 2306.02, "total_tokens": 17625360} {"current_steps": 30570, "total_steps": 67140, "loss": 0.6931, "lr": 3.311425153958503e-05, "epoch": 4.553172475424486, "percentage": 45.53, "elapsed_time": "2:07:24", "remaining_time": "2:32:24", "throughput": 2306.06, "total_tokens": 17628368} {"current_steps": 30575, "total_steps": 67140, "loss": 0.5909, "lr": 3.310810425916323e-05, "epoch": 4.553917187965445, "percentage": 45.54, "elapsed_time": "2:07:25", "remaining_time": "2:32:23", "throughput": 2306.1, "total_tokens": 17631312} {"current_steps": 30580, "total_steps": 67140, "loss": 0.6534, "lr": 3.3101956430828715e-05, "epoch": 4.554661900506405, "percentage": 45.55, "elapsed_time": "2:07:26", "remaining_time": "2:32:21", "throughput": 2306.13, "total_tokens": 17634160} {"current_steps": 30585, "total_steps": 67140, "loss": 0.6289, "lr": 3.309580805499692e-05, "epoch": 4.555406613047364, "percentage": 45.55, "elapsed_time": "2:07:27", "remaining_time": "2:32:20", "throughput": 2306.18, "total_tokens": 17637168} {"current_steps": 30590, "total_steps": 67140, "loss": 0.6931, "lr": 3.3089659132083327e-05, "epoch": 4.556151325588323, "percentage": 45.56, "elapsed_time": "2:07:28", "remaining_time": "2:32:19", "throughput": 2306.22, "total_tokens": 17640144} {"current_steps": 30595, "total_steps": 67140, "loss": 0.6186, "lr": 3.3083509662503466e-05, "epoch": 4.556896038129282, "percentage": 45.57, "elapsed_time": "2:07:30", "remaining_time": "2:32:17", "throughput": 2306.26, "total_tokens": 17643088} {"current_steps": 30600, "total_steps": 67140, "loss": 0.6606, "lr": 3.3077359646672884e-05, "epoch": 4.557640750670242, "percentage": 45.58, "elapsed_time": "2:07:31", "remaining_time": "2:32:16", "throughput": 2306.28, "total_tokens": 17645904} {"current_steps": 30605, "total_steps": 67140, "loss": 0.5661, "lr": 3.307120908500718e-05, "epoch": 4.5583854632112, "percentage": 45.58, "elapsed_time": "2:07:32", "remaining_time": "2:32:15", "throughput": 2306.34, "total_tokens": 17649040} {"current_steps": 30610, "total_steps": 67140, "loss": 0.7688, "lr": 3.3065057977921986e-05, "epoch": 4.559130175752159, "percentage": 45.59, "elapsed_time": "2:07:33", "remaining_time": "2:32:13", "throughput": 2306.4, "total_tokens": 17652240} {"current_steps": 30615, "total_steps": 67140, "loss": 0.5865, "lr": 3.305890632583295e-05, "epoch": 4.559874888293119, "percentage": 45.6, "elapsed_time": "2:07:34", "remaining_time": "2:32:12", "throughput": 2306.4, "total_tokens": 17654800} {"current_steps": 30620, "total_steps": 67140, "loss": 0.7488, "lr": 3.30527541291558e-05, "epoch": 4.5606196008340785, "percentage": 45.61, "elapsed_time": "2:07:35", "remaining_time": "2:32:10", "throughput": 2306.44, "total_tokens": 17657744} {"current_steps": 30625, "total_steps": 67140, "loss": 0.8042, "lr": 3.304660138830626e-05, "epoch": 4.561364313375037, "percentage": 45.61, "elapsed_time": "2:07:36", "remaining_time": "2:32:09", "throughput": 2306.49, "total_tokens": 17660784} {"current_steps": 30630, "total_steps": 67140, "loss": 0.6932, "lr": 3.3040448103700124e-05, "epoch": 4.562109025915996, "percentage": 45.62, "elapsed_time": "2:07:38", "remaining_time": "2:32:08", "throughput": 2306.51, "total_tokens": 17663504} {"current_steps": 30635, "total_steps": 67140, "loss": 0.5687, "lr": 3.303429427575319e-05, "epoch": 4.562853738456956, "percentage": 45.63, "elapsed_time": "2:07:39", "remaining_time": "2:32:06", "throughput": 2306.52, "total_tokens": 17666128} {"current_steps": 30640, "total_steps": 67140, "loss": 0.6273, "lr": 3.30281399048813e-05, "epoch": 4.563598450997915, "percentage": 45.64, "elapsed_time": "2:07:40", "remaining_time": "2:32:05", "throughput": 2306.58, "total_tokens": 17669296} {"current_steps": 30645, "total_steps": 67140, "loss": 0.5068, "lr": 3.302198499150038e-05, "epoch": 4.564343163538874, "percentage": 45.64, "elapsed_time": "2:07:41", "remaining_time": "2:32:04", "throughput": 2306.61, "total_tokens": 17672144} {"current_steps": 30650, "total_steps": 67140, "loss": 0.4376, "lr": 3.301582953602631e-05, "epoch": 4.565087876079833, "percentage": 45.65, "elapsed_time": "2:07:42", "remaining_time": "2:32:02", "throughput": 2306.63, "total_tokens": 17674864} {"current_steps": 30655, "total_steps": 67140, "loss": 0.6308, "lr": 3.300967353887507e-05, "epoch": 4.565832588620792, "percentage": 45.66, "elapsed_time": "2:07:43", "remaining_time": "2:32:01", "throughput": 2306.66, "total_tokens": 17677712} {"current_steps": 30660, "total_steps": 67140, "loss": 0.6755, "lr": 3.300351700046267e-05, "epoch": 4.566577301161751, "percentage": 45.67, "elapsed_time": "2:07:44", "remaining_time": "2:31:59", "throughput": 2306.66, "total_tokens": 17680176} {"current_steps": 30665, "total_steps": 67140, "loss": 0.7003, "lr": 3.299735992120513e-05, "epoch": 4.567322013702711, "percentage": 45.67, "elapsed_time": "2:07:45", "remaining_time": "2:31:58", "throughput": 2306.7, "total_tokens": 17683088} {"current_steps": 30670, "total_steps": 67140, "loss": 0.901, "lr": 3.299120230151852e-05, "epoch": 4.56806672624367, "percentage": 45.68, "elapsed_time": "2:07:47", "remaining_time": "2:31:57", "throughput": 2306.76, "total_tokens": 17686256} {"current_steps": 30675, "total_steps": 67140, "loss": 0.7258, "lr": 3.298504414181894e-05, "epoch": 4.568811438784629, "percentage": 45.69, "elapsed_time": "2:07:48", "remaining_time": "2:31:55", "throughput": 2306.78, "total_tokens": 17688976} {"current_steps": 30680, "total_steps": 67140, "loss": 0.6207, "lr": 3.297888544252255e-05, "epoch": 4.569556151325588, "percentage": 45.7, "elapsed_time": "2:07:49", "remaining_time": "2:31:54", "throughput": 2306.8, "total_tokens": 17691728} {"current_steps": 30685, "total_steps": 67140, "loss": 0.6805, "lr": 3.2972726204045515e-05, "epoch": 4.570300863866548, "percentage": 45.7, "elapsed_time": "2:07:50", "remaining_time": "2:31:52", "throughput": 2306.81, "total_tokens": 17694224} {"current_steps": 30690, "total_steps": 67140, "loss": 0.7214, "lr": 3.2966566426804057e-05, "epoch": 4.571045576407506, "percentage": 45.71, "elapsed_time": "2:07:51", "remaining_time": "2:31:51", "throughput": 2306.83, "total_tokens": 17696944} {"current_steps": 30695, "total_steps": 67140, "loss": 0.5531, "lr": 3.296040611121444e-05, "epoch": 4.571790288948466, "percentage": 45.72, "elapsed_time": "2:07:52", "remaining_time": "2:31:49", "throughput": 2306.84, "total_tokens": 17699632} {"current_steps": 30700, "total_steps": 67140, "loss": 0.6578, "lr": 3.295424525769293e-05, "epoch": 4.572535001489425, "percentage": 45.73, "elapsed_time": "2:07:53", "remaining_time": "2:31:48", "throughput": 2306.87, "total_tokens": 17702384} {"current_steps": 30705, "total_steps": 67140, "loss": 0.6771, "lr": 3.2948083866655865e-05, "epoch": 4.5732797140303845, "percentage": 45.73, "elapsed_time": "2:07:54", "remaining_time": "2:31:47", "throughput": 2306.88, "total_tokens": 17705008} {"current_steps": 30710, "total_steps": 67140, "loss": 0.5122, "lr": 3.294192193851963e-05, "epoch": 4.574024426571343, "percentage": 45.74, "elapsed_time": "2:07:56", "remaining_time": "2:31:45", "throughput": 2306.91, "total_tokens": 17707952} {"current_steps": 30715, "total_steps": 67140, "loss": 0.7142, "lr": 3.293575947370057e-05, "epoch": 4.574769139112303, "percentage": 45.75, "elapsed_time": "2:07:57", "remaining_time": "2:31:44", "throughput": 2306.94, "total_tokens": 17710768} {"current_steps": 30720, "total_steps": 67140, "loss": 0.582, "lr": 3.2929596472615165e-05, "epoch": 4.575513851653262, "percentage": 45.76, "elapsed_time": "2:07:58", "remaining_time": "2:31:42", "throughput": 2306.96, "total_tokens": 17713456} {"current_steps": 30725, "total_steps": 67140, "loss": 0.5695, "lr": 3.292343293567986e-05, "epoch": 4.576258564194221, "percentage": 45.76, "elapsed_time": "2:07:59", "remaining_time": "2:31:41", "throughput": 2306.99, "total_tokens": 17716208} {"current_steps": 30730, "total_steps": 67140, "loss": 0.4637, "lr": 3.291726886331119e-05, "epoch": 4.57700327673518, "percentage": 45.77, "elapsed_time": "2:08:00", "remaining_time": "2:31:40", "throughput": 2307.04, "total_tokens": 17719312} {"current_steps": 30735, "total_steps": 67140, "loss": 0.7308, "lr": 3.291110425592566e-05, "epoch": 4.57774798927614, "percentage": 45.78, "elapsed_time": "2:08:01", "remaining_time": "2:31:38", "throughput": 2307.07, "total_tokens": 17722160} {"current_steps": 30740, "total_steps": 67140, "loss": 0.5533, "lr": 3.290493911393988e-05, "epoch": 4.578492701817098, "percentage": 45.78, "elapsed_time": "2:08:02", "remaining_time": "2:31:37", "throughput": 2307.11, "total_tokens": 17725008} {"current_steps": 30745, "total_steps": 67140, "loss": 0.5233, "lr": 3.289877343777045e-05, "epoch": 4.579237414358058, "percentage": 45.79, "elapsed_time": "2:08:03", "remaining_time": "2:31:35", "throughput": 2307.13, "total_tokens": 17727824} {"current_steps": 30750, "total_steps": 67140, "loss": 0.6215, "lr": 3.2892607227834024e-05, "epoch": 4.579982126899017, "percentage": 45.8, "elapsed_time": "2:08:05", "remaining_time": "2:31:34", "throughput": 2307.22, "total_tokens": 17731312} {"current_steps": 30755, "total_steps": 67140, "loss": 0.7049, "lr": 3.288644048454729e-05, "epoch": 4.5807268394399765, "percentage": 45.81, "elapsed_time": "2:08:06", "remaining_time": "2:31:33", "throughput": 2307.24, "total_tokens": 17734032} {"current_steps": 30760, "total_steps": 67140, "loss": 0.7521, "lr": 3.288027320832698e-05, "epoch": 4.581471551980935, "percentage": 45.81, "elapsed_time": "2:08:07", "remaining_time": "2:31:31", "throughput": 2307.27, "total_tokens": 17736848} {"current_steps": 30765, "total_steps": 67140, "loss": 0.525, "lr": 3.287410539958984e-05, "epoch": 4.582216264521895, "percentage": 45.82, "elapsed_time": "2:08:08", "remaining_time": "2:31:30", "throughput": 2307.31, "total_tokens": 17739792} {"current_steps": 30770, "total_steps": 67140, "loss": 0.6458, "lr": 3.286793705875267e-05, "epoch": 4.582960977062854, "percentage": 45.83, "elapsed_time": "2:08:09", "remaining_time": "2:31:29", "throughput": 2307.33, "total_tokens": 17742480} {"current_steps": 30775, "total_steps": 67140, "loss": 0.6505, "lr": 3.2861768186232306e-05, "epoch": 4.583705689603813, "percentage": 45.84, "elapsed_time": "2:08:10", "remaining_time": "2:31:27", "throughput": 2307.36, "total_tokens": 17745328} {"current_steps": 30780, "total_steps": 67140, "loss": 0.6815, "lr": 3.2855598782445606e-05, "epoch": 4.584450402144772, "percentage": 45.84, "elapsed_time": "2:08:11", "remaining_time": "2:31:26", "throughput": 2307.4, "total_tokens": 17748240} {"current_steps": 30785, "total_steps": 67140, "loss": 0.6779, "lr": 3.2849428847809474e-05, "epoch": 4.585195114685732, "percentage": 45.85, "elapsed_time": "2:08:12", "remaining_time": "2:31:24", "throughput": 2307.42, "total_tokens": 17750928} {"current_steps": 30790, "total_steps": 67140, "loss": 0.7863, "lr": 3.2843258382740866e-05, "epoch": 4.5859398272266905, "percentage": 45.86, "elapsed_time": "2:08:14", "remaining_time": "2:31:23", "throughput": 2307.46, "total_tokens": 17753840} {"current_steps": 30795, "total_steps": 67140, "loss": 0.6951, "lr": 3.283708738765674e-05, "epoch": 4.586684539767649, "percentage": 45.87, "elapsed_time": "2:08:15", "remaining_time": "2:31:22", "throughput": 2307.47, "total_tokens": 17756496} {"current_steps": 30800, "total_steps": 67140, "loss": 0.548, "lr": 3.283091586297411e-05, "epoch": 4.587429252308609, "percentage": 45.87, "elapsed_time": "2:08:16", "remaining_time": "2:31:20", "throughput": 2307.49, "total_tokens": 17759184} {"current_steps": 30805, "total_steps": 67140, "loss": 0.5438, "lr": 3.2824743809110024e-05, "epoch": 4.5881739648495685, "percentage": 45.88, "elapsed_time": "2:08:17", "remaining_time": "2:31:19", "throughput": 2307.52, "total_tokens": 17761936} {"current_steps": 30810, "total_steps": 67140, "loss": 0.6053, "lr": 3.281857122648157e-05, "epoch": 4.588918677390527, "percentage": 45.89, "elapsed_time": "2:08:18", "remaining_time": "2:31:17", "throughput": 2307.55, "total_tokens": 17764880} {"current_steps": 30815, "total_steps": 67140, "loss": 0.7027, "lr": 3.281239811550586e-05, "epoch": 4.589663389931486, "percentage": 45.9, "elapsed_time": "2:08:19", "remaining_time": "2:31:16", "throughput": 2307.57, "total_tokens": 17767536} {"current_steps": 30820, "total_steps": 67140, "loss": 0.6872, "lr": 3.280622447660004e-05, "epoch": 4.590408102472446, "percentage": 45.9, "elapsed_time": "2:08:20", "remaining_time": "2:31:15", "throughput": 2307.6, "total_tokens": 17770384} {"current_steps": 30825, "total_steps": 67140, "loss": 0.6831, "lr": 3.280005031018131e-05, "epoch": 4.591152815013404, "percentage": 45.91, "elapsed_time": "2:08:21", "remaining_time": "2:31:13", "throughput": 2307.63, "total_tokens": 17773296} {"current_steps": 30830, "total_steps": 67140, "loss": 0.5484, "lr": 3.2793875616666904e-05, "epoch": 4.591897527554364, "percentage": 45.92, "elapsed_time": "2:08:23", "remaining_time": "2:31:12", "throughput": 2307.65, "total_tokens": 17775984} {"current_steps": 30835, "total_steps": 67140, "loss": 0.6395, "lr": 3.278770039647406e-05, "epoch": 4.592642240095323, "percentage": 45.93, "elapsed_time": "2:08:24", "remaining_time": "2:31:10", "throughput": 2307.67, "total_tokens": 17778736} {"current_steps": 30840, "total_steps": 67140, "loss": 0.5877, "lr": 3.278152465002008e-05, "epoch": 4.5933869526362825, "percentage": 45.93, "elapsed_time": "2:08:25", "remaining_time": "2:31:09", "throughput": 2307.71, "total_tokens": 17781584} {"current_steps": 30845, "total_steps": 67140, "loss": 0.6476, "lr": 3.277534837772232e-05, "epoch": 4.594131665177241, "percentage": 45.94, "elapsed_time": "2:08:26", "remaining_time": "2:31:08", "throughput": 2307.73, "total_tokens": 17784304} {"current_steps": 30850, "total_steps": 67140, "loss": 0.7029, "lr": 3.276917157999811e-05, "epoch": 4.594876377718201, "percentage": 45.95, "elapsed_time": "2:08:27", "remaining_time": "2:31:06", "throughput": 2307.78, "total_tokens": 17787376} {"current_steps": 30855, "total_steps": 67140, "loss": 0.6073, "lr": 3.276299425726489e-05, "epoch": 4.59562109025916, "percentage": 45.96, "elapsed_time": "2:08:28", "remaining_time": "2:31:05", "throughput": 2307.8, "total_tokens": 17790128} {"current_steps": 30860, "total_steps": 67140, "loss": 0.6499, "lr": 3.275681640994007e-05, "epoch": 4.596365802800119, "percentage": 45.96, "elapsed_time": "2:08:29", "remaining_time": "2:31:03", "throughput": 2307.82, "total_tokens": 17792848} {"current_steps": 30865, "total_steps": 67140, "loss": 0.547, "lr": 3.275063803844113e-05, "epoch": 4.597110515341078, "percentage": 45.97, "elapsed_time": "2:08:30", "remaining_time": "2:31:02", "throughput": 2307.84, "total_tokens": 17795600} {"current_steps": 30870, "total_steps": 67140, "loss": 0.5845, "lr": 3.274445914318559e-05, "epoch": 4.597855227882038, "percentage": 45.98, "elapsed_time": "2:08:32", "remaining_time": "2:31:01", "throughput": 2307.84, "total_tokens": 17798096} {"current_steps": 30875, "total_steps": 67140, "loss": 0.8024, "lr": 3.273827972459099e-05, "epoch": 4.5985999404229965, "percentage": 45.99, "elapsed_time": "2:08:33", "remaining_time": "2:30:59", "throughput": 2307.88, "total_tokens": 17801072} {"current_steps": 30880, "total_steps": 67140, "loss": 0.6241, "lr": 3.27320997830749e-05, "epoch": 4.599344652963956, "percentage": 45.99, "elapsed_time": "2:08:34", "remaining_time": "2:30:58", "throughput": 2307.92, "total_tokens": 17804016} {"current_steps": 30885, "total_steps": 67140, "loss": 0.5784, "lr": 3.2725919319054946e-05, "epoch": 4.600089365504915, "percentage": 46.0, "elapsed_time": "2:08:35", "remaining_time": "2:30:56", "throughput": 2307.93, "total_tokens": 17806672} {"current_steps": 30890, "total_steps": 67140, "loss": 0.7917, "lr": 3.271973833294877e-05, "epoch": 4.6008340780458745, "percentage": 46.01, "elapsed_time": "2:08:36", "remaining_time": "2:30:55", "throughput": 2307.99, "total_tokens": 17809840} {"current_steps": 30895, "total_steps": 67140, "loss": 0.5958, "lr": 3.2713556825174074e-05, "epoch": 4.601578790586833, "percentage": 46.02, "elapsed_time": "2:08:37", "remaining_time": "2:30:54", "throughput": 2308.03, "total_tokens": 17812816} {"current_steps": 30900, "total_steps": 67140, "loss": 0.4211, "lr": 3.270737479614856e-05, "epoch": 4.602323503127793, "percentage": 46.02, "elapsed_time": "2:08:38", "remaining_time": "2:30:52", "throughput": 2308.06, "total_tokens": 17815664} {"current_steps": 30905, "total_steps": 67140, "loss": 0.6068, "lr": 3.270119224629e-05, "epoch": 4.603068215668752, "percentage": 46.03, "elapsed_time": "2:08:39", "remaining_time": "2:30:51", "throughput": 2308.07, "total_tokens": 17818224} {"current_steps": 30910, "total_steps": 67140, "loss": 0.412, "lr": 3.269500917601618e-05, "epoch": 4.603812928209711, "percentage": 46.04, "elapsed_time": "2:08:41", "remaining_time": "2:30:49", "throughput": 2308.09, "total_tokens": 17821008} {"current_steps": 30915, "total_steps": 67140, "loss": 0.8391, "lr": 3.268882558574492e-05, "epoch": 4.60455764075067, "percentage": 46.05, "elapsed_time": "2:08:42", "remaining_time": "2:30:48", "throughput": 2308.12, "total_tokens": 17823792} {"current_steps": 30920, "total_steps": 67140, "loss": 0.7195, "lr": 3.268264147589409e-05, "epoch": 4.60530235329163, "percentage": 46.05, "elapsed_time": "2:08:43", "remaining_time": "2:30:47", "throughput": 2308.16, "total_tokens": 17826704} {"current_steps": 30925, "total_steps": 67140, "loss": 0.764, "lr": 3.2676456846881583e-05, "epoch": 4.6060470658325885, "percentage": 46.06, "elapsed_time": "2:08:44", "remaining_time": "2:30:45", "throughput": 2308.22, "total_tokens": 17829936} {"current_steps": 30930, "total_steps": 67140, "loss": 0.8109, "lr": 3.267027169912533e-05, "epoch": 4.606791778373548, "percentage": 46.07, "elapsed_time": "2:08:45", "remaining_time": "2:30:44", "throughput": 2308.26, "total_tokens": 17832976} {"current_steps": 30935, "total_steps": 67140, "loss": 0.722, "lr": 3.2664086033043304e-05, "epoch": 4.607536490914507, "percentage": 46.08, "elapsed_time": "2:08:46", "remaining_time": "2:30:43", "throughput": 2308.31, "total_tokens": 17835952} {"current_steps": 30940, "total_steps": 67140, "loss": 0.5882, "lr": 3.265789984905351e-05, "epoch": 4.6082812034554665, "percentage": 46.08, "elapsed_time": "2:08:48", "remaining_time": "2:30:41", "throughput": 2308.36, "total_tokens": 17839056} {"current_steps": 30945, "total_steps": 67140, "loss": 0.6903, "lr": 3.265171314757397e-05, "epoch": 4.609025915996425, "percentage": 46.09, "elapsed_time": "2:08:49", "remaining_time": "2:30:40", "throughput": 2308.4, "total_tokens": 17841968} {"current_steps": 30950, "total_steps": 67140, "loss": 0.7566, "lr": 3.264552592902277e-05, "epoch": 4.609770628537385, "percentage": 46.1, "elapsed_time": "2:08:50", "remaining_time": "2:30:39", "throughput": 2308.44, "total_tokens": 17844912} {"current_steps": 30955, "total_steps": 67140, "loss": 0.7416, "lr": 3.2639338193818006e-05, "epoch": 4.610515341078344, "percentage": 46.11, "elapsed_time": "2:08:51", "remaining_time": "2:30:37", "throughput": 2308.48, "total_tokens": 17847888} {"current_steps": 30960, "total_steps": 67140, "loss": 0.6059, "lr": 3.2633149942377834e-05, "epoch": 4.6112600536193025, "percentage": 46.11, "elapsed_time": "2:08:52", "remaining_time": "2:30:36", "throughput": 2308.53, "total_tokens": 17850960} {"current_steps": 30965, "total_steps": 67140, "loss": 0.5528, "lr": 3.2626961175120414e-05, "epoch": 4.612004766160262, "percentage": 46.12, "elapsed_time": "2:08:53", "remaining_time": "2:30:34", "throughput": 2308.57, "total_tokens": 17853872} {"current_steps": 30970, "total_steps": 67140, "loss": 0.598, "lr": 3.262077189246398e-05, "epoch": 4.612749478701222, "percentage": 46.13, "elapsed_time": "2:08:54", "remaining_time": "2:30:33", "throughput": 2308.61, "total_tokens": 17856816} {"current_steps": 30975, "total_steps": 67140, "loss": 0.6048, "lr": 3.261458209482675e-05, "epoch": 4.6134941912421805, "percentage": 46.13, "elapsed_time": "2:08:56", "remaining_time": "2:30:32", "throughput": 2308.66, "total_tokens": 17859984} {"current_steps": 30980, "total_steps": 67140, "loss": 0.5744, "lr": 3.260839178262703e-05, "epoch": 4.614238903783139, "percentage": 46.14, "elapsed_time": "2:08:57", "remaining_time": "2:30:30", "throughput": 2308.68, "total_tokens": 17862640} {"current_steps": 30985, "total_steps": 67140, "loss": 0.5551, "lr": 3.260220095628312e-05, "epoch": 4.614983616324099, "percentage": 46.15, "elapsed_time": "2:08:58", "remaining_time": "2:30:29", "throughput": 2308.71, "total_tokens": 17865456} {"current_steps": 30990, "total_steps": 67140, "loss": 0.5769, "lr": 3.259600961621339e-05, "epoch": 4.615728328865059, "percentage": 46.16, "elapsed_time": "2:08:59", "remaining_time": "2:30:28", "throughput": 2308.72, "total_tokens": 17868048} {"current_steps": 30995, "total_steps": 67140, "loss": 0.6437, "lr": 3.25898177628362e-05, "epoch": 4.616473041406017, "percentage": 46.16, "elapsed_time": "2:09:00", "remaining_time": "2:30:26", "throughput": 2308.76, "total_tokens": 17870960} {"current_steps": 31000, "total_steps": 67140, "loss": 0.9059, "lr": 3.258362539656999e-05, "epoch": 4.617217753946976, "percentage": 46.17, "elapsed_time": "2:09:01", "remaining_time": "2:30:25", "throughput": 2308.81, "total_tokens": 17874032} {"current_steps": 31005, "total_steps": 67140, "loss": 0.6059, "lr": 3.2577432517833204e-05, "epoch": 4.617962466487936, "percentage": 46.18, "elapsed_time": "2:09:02", "remaining_time": "2:30:23", "throughput": 2308.84, "total_tokens": 17876944} {"current_steps": 31010, "total_steps": 67140, "loss": 0.5954, "lr": 3.257123912704435e-05, "epoch": 4.6187071790288945, "percentage": 46.19, "elapsed_time": "2:09:03", "remaining_time": "2:30:22", "throughput": 2308.86, "total_tokens": 17879728} {"current_steps": 31015, "total_steps": 67140, "loss": 0.7343, "lr": 3.2565045224621923e-05, "epoch": 4.619451891569854, "percentage": 46.19, "elapsed_time": "2:09:05", "remaining_time": "2:30:21", "throughput": 2308.9, "total_tokens": 17882640} {"current_steps": 31020, "total_steps": 67140, "loss": 0.5262, "lr": 3.25588508109845e-05, "epoch": 4.620196604110813, "percentage": 46.2, "elapsed_time": "2:09:06", "remaining_time": "2:30:19", "throughput": 2308.95, "total_tokens": 17885744} {"current_steps": 31025, "total_steps": 67140, "loss": 0.7437, "lr": 3.2552655886550674e-05, "epoch": 4.6209413166517725, "percentage": 46.21, "elapsed_time": "2:09:07", "remaining_time": "2:30:18", "throughput": 2308.94, "total_tokens": 17888080} {"current_steps": 31030, "total_steps": 67140, "loss": 0.6599, "lr": 3.254646045173907e-05, "epoch": 4.621686029192731, "percentage": 46.22, "elapsed_time": "2:09:08", "remaining_time": "2:30:16", "throughput": 2308.97, "total_tokens": 17890896} {"current_steps": 31035, "total_steps": 67140, "loss": 0.6455, "lr": 3.254026450696835e-05, "epoch": 4.622430741733691, "percentage": 46.22, "elapsed_time": "2:09:09", "remaining_time": "2:30:15", "throughput": 2309.0, "total_tokens": 17893712} {"current_steps": 31040, "total_steps": 67140, "loss": 0.6264, "lr": 3.253406805265721e-05, "epoch": 4.62317545427465, "percentage": 46.23, "elapsed_time": "2:09:10", "remaining_time": "2:30:14", "throughput": 2309.03, "total_tokens": 17896528} {"current_steps": 31045, "total_steps": 67140, "loss": 0.7361, "lr": 3.252787108922438e-05, "epoch": 4.623920166815609, "percentage": 46.24, "elapsed_time": "2:09:11", "remaining_time": "2:30:12", "throughput": 2309.05, "total_tokens": 17899312} {"current_steps": 31050, "total_steps": 67140, "loss": 0.6318, "lr": 3.252167361708863e-05, "epoch": 4.624664879356568, "percentage": 46.25, "elapsed_time": "2:09:12", "remaining_time": "2:30:11", "throughput": 2309.11, "total_tokens": 17902480} {"current_steps": 31055, "total_steps": 67140, "loss": 0.7142, "lr": 3.251547563666876e-05, "epoch": 4.625409591897528, "percentage": 46.25, "elapsed_time": "2:09:14", "remaining_time": "2:30:10", "throughput": 2309.14, "total_tokens": 17905392} {"current_steps": 31060, "total_steps": 67140, "loss": 0.5548, "lr": 3.25092771483836e-05, "epoch": 4.6261543044384865, "percentage": 46.26, "elapsed_time": "2:09:15", "remaining_time": "2:30:08", "throughput": 2309.18, "total_tokens": 17908272} {"current_steps": 31065, "total_steps": 67140, "loss": 0.7472, "lr": 3.2503078152652024e-05, "epoch": 4.626899016979446, "percentage": 46.27, "elapsed_time": "2:09:16", "remaining_time": "2:30:07", "throughput": 2309.21, "total_tokens": 17911152} {"current_steps": 31070, "total_steps": 67140, "loss": 0.5491, "lr": 3.2496878649892924e-05, "epoch": 4.627643729520405, "percentage": 46.28, "elapsed_time": "2:09:17", "remaining_time": "2:30:05", "throughput": 2309.23, "total_tokens": 17913872} {"current_steps": 31075, "total_steps": 67140, "loss": 0.5069, "lr": 3.2490678640525255e-05, "epoch": 4.628388442061365, "percentage": 46.28, "elapsed_time": "2:09:18", "remaining_time": "2:30:04", "throughput": 2309.24, "total_tokens": 17916464} {"current_steps": 31080, "total_steps": 67140, "loss": 0.6208, "lr": 3.248447812496797e-05, "epoch": 4.629133154602323, "percentage": 46.29, "elapsed_time": "2:09:19", "remaining_time": "2:30:03", "throughput": 2309.28, "total_tokens": 17919376} {"current_steps": 31085, "total_steps": 67140, "loss": 0.8341, "lr": 3.2478277103640086e-05, "epoch": 4.629877867143283, "percentage": 46.3, "elapsed_time": "2:09:20", "remaining_time": "2:30:01", "throughput": 2309.3, "total_tokens": 17922128} {"current_steps": 31090, "total_steps": 67140, "loss": 0.4389, "lr": 3.247207557696064e-05, "epoch": 4.630622579684242, "percentage": 46.31, "elapsed_time": "2:09:21", "remaining_time": "2:30:00", "throughput": 2309.33, "total_tokens": 17924880} {"current_steps": 31095, "total_steps": 67140, "loss": 0.7798, "lr": 3.2465873545348715e-05, "epoch": 4.631367292225201, "percentage": 46.31, "elapsed_time": "2:09:23", "remaining_time": "2:29:58", "throughput": 2309.4, "total_tokens": 17928208} {"current_steps": 31100, "total_steps": 67140, "loss": 0.7477, "lr": 3.2459671009223394e-05, "epoch": 4.63211200476616, "percentage": 46.32, "elapsed_time": "2:09:24", "remaining_time": "2:29:57", "throughput": 2309.48, "total_tokens": 17931760} {"current_steps": 31105, "total_steps": 67140, "loss": 0.7781, "lr": 3.245346796900384e-05, "epoch": 4.63285671730712, "percentage": 46.33, "elapsed_time": "2:09:25", "remaining_time": "2:29:56", "throughput": 2309.52, "total_tokens": 17934672} {"current_steps": 31110, "total_steps": 67140, "loss": 0.7357, "lr": 3.244726442510923e-05, "epoch": 4.6336014298480785, "percentage": 46.34, "elapsed_time": "2:09:26", "remaining_time": "2:29:54", "throughput": 2309.54, "total_tokens": 17937488} {"current_steps": 31115, "total_steps": 67140, "loss": 0.494, "lr": 3.244106037795877e-05, "epoch": 4.634346142389038, "percentage": 46.34, "elapsed_time": "2:09:27", "remaining_time": "2:29:53", "throughput": 2309.57, "total_tokens": 17940272} {"current_steps": 31120, "total_steps": 67140, "loss": 0.6002, "lr": 3.243485582797169e-05, "epoch": 4.635090854929997, "percentage": 46.35, "elapsed_time": "2:09:28", "remaining_time": "2:29:52", "throughput": 2309.62, "total_tokens": 17943312} {"current_steps": 31125, "total_steps": 67140, "loss": 0.6191, "lr": 3.242865077556729e-05, "epoch": 4.635835567470957, "percentage": 46.36, "elapsed_time": "2:09:30", "remaining_time": "2:29:50", "throughput": 2309.67, "total_tokens": 17946448} {"current_steps": 31130, "total_steps": 67140, "loss": 0.745, "lr": 3.2422445221164876e-05, "epoch": 4.636580280011915, "percentage": 46.37, "elapsed_time": "2:09:31", "remaining_time": "2:29:49", "throughput": 2309.71, "total_tokens": 17949328} {"current_steps": 31135, "total_steps": 67140, "loss": 0.5494, "lr": 3.241623916518378e-05, "epoch": 4.637324992552875, "percentage": 46.37, "elapsed_time": "2:09:32", "remaining_time": "2:29:48", "throughput": 2309.74, "total_tokens": 17952112} {"current_steps": 31140, "total_steps": 67140, "loss": 0.6612, "lr": 3.2410032608043405e-05, "epoch": 4.638069705093834, "percentage": 46.38, "elapsed_time": "2:09:33", "remaining_time": "2:29:46", "throughput": 2309.74, "total_tokens": 17954608} {"current_steps": 31145, "total_steps": 67140, "loss": 0.5924, "lr": 3.2403825550163144e-05, "epoch": 4.6388144176347925, "percentage": 46.39, "elapsed_time": "2:09:34", "remaining_time": "2:29:45", "throughput": 2309.78, "total_tokens": 17957680} {"current_steps": 31150, "total_steps": 67140, "loss": 0.5407, "lr": 3.239761799196246e-05, "epoch": 4.639559130175752, "percentage": 46.4, "elapsed_time": "2:09:35", "remaining_time": "2:29:43", "throughput": 2309.82, "total_tokens": 17960560} {"current_steps": 31155, "total_steps": 67140, "loss": 0.6333, "lr": 3.2391409933860825e-05, "epoch": 4.640303842716712, "percentage": 46.4, "elapsed_time": "2:09:36", "remaining_time": "2:29:42", "throughput": 2309.84, "total_tokens": 17963408} {"current_steps": 31160, "total_steps": 67140, "loss": 0.6269, "lr": 3.238520137627777e-05, "epoch": 4.641048555257671, "percentage": 46.41, "elapsed_time": "2:09:38", "remaining_time": "2:29:41", "throughput": 2309.87, "total_tokens": 17966160} {"current_steps": 31165, "total_steps": 67140, "loss": 0.5807, "lr": 3.237899231963282e-05, "epoch": 4.641793267798629, "percentage": 46.42, "elapsed_time": "2:09:39", "remaining_time": "2:29:39", "throughput": 2309.92, "total_tokens": 17969296} {"current_steps": 31170, "total_steps": 67140, "loss": 0.5315, "lr": 3.237278276434557e-05, "epoch": 4.642537980339589, "percentage": 46.43, "elapsed_time": "2:09:40", "remaining_time": "2:29:38", "throughput": 2309.96, "total_tokens": 17972272} {"current_steps": 31175, "total_steps": 67140, "loss": 0.6273, "lr": 3.236657271083564e-05, "epoch": 4.643282692880548, "percentage": 46.43, "elapsed_time": "2:09:41", "remaining_time": "2:29:37", "throughput": 2309.98, "total_tokens": 17975024} {"current_steps": 31180, "total_steps": 67140, "loss": 0.6139, "lr": 3.236036215952267e-05, "epoch": 4.644027405421507, "percentage": 46.44, "elapsed_time": "2:09:42", "remaining_time": "2:29:35", "throughput": 2310.03, "total_tokens": 17978064} {"current_steps": 31185, "total_steps": 67140, "loss": 0.7332, "lr": 3.2354151110826355e-05, "epoch": 4.644772117962466, "percentage": 46.45, "elapsed_time": "2:09:43", "remaining_time": "2:29:34", "throughput": 2310.06, "total_tokens": 17980944} {"current_steps": 31190, "total_steps": 67140, "loss": 0.8485, "lr": 3.234793956516641e-05, "epoch": 4.645516830503426, "percentage": 46.46, "elapsed_time": "2:09:44", "remaining_time": "2:29:32", "throughput": 2310.08, "total_tokens": 17983664} {"current_steps": 31195, "total_steps": 67140, "loss": 0.6543, "lr": 3.234172752296259e-05, "epoch": 4.6462615430443845, "percentage": 46.46, "elapsed_time": "2:09:46", "remaining_time": "2:29:31", "throughput": 2310.11, "total_tokens": 17986544} {"current_steps": 31200, "total_steps": 67140, "loss": 0.5541, "lr": 3.233551498463466e-05, "epoch": 4.647006255585344, "percentage": 46.47, "elapsed_time": "2:09:47", "remaining_time": "2:29:30", "throughput": 2310.15, "total_tokens": 17989456} {"current_steps": 31205, "total_steps": 67140, "loss": 0.6034, "lr": 3.2329301950602456e-05, "epoch": 4.647750968126303, "percentage": 46.48, "elapsed_time": "2:09:48", "remaining_time": "2:29:28", "throughput": 2310.19, "total_tokens": 17992496} {"current_steps": 31210, "total_steps": 67140, "loss": 0.6789, "lr": 3.232308842128583e-05, "epoch": 4.648495680667263, "percentage": 46.48, "elapsed_time": "2:09:49", "remaining_time": "2:29:27", "throughput": 2310.22, "total_tokens": 17995344} {"current_steps": 31215, "total_steps": 67140, "loss": 0.6108, "lr": 3.2316874397104656e-05, "epoch": 4.649240393208221, "percentage": 46.49, "elapsed_time": "2:09:50", "remaining_time": "2:29:26", "throughput": 2310.26, "total_tokens": 17998256} {"current_steps": 31220, "total_steps": 67140, "loss": 0.6227, "lr": 3.231065987847885e-05, "epoch": 4.649985105749181, "percentage": 46.5, "elapsed_time": "2:09:51", "remaining_time": "2:29:24", "throughput": 2310.31, "total_tokens": 18001360} {"current_steps": 31225, "total_steps": 67140, "loss": 0.6869, "lr": 3.2304444865828394e-05, "epoch": 4.65072981829014, "percentage": 46.51, "elapsed_time": "2:09:52", "remaining_time": "2:29:23", "throughput": 2310.35, "total_tokens": 18004304} {"current_steps": 31230, "total_steps": 67140, "loss": 0.6197, "lr": 3.229822935957324e-05, "epoch": 4.651474530831099, "percentage": 46.51, "elapsed_time": "2:09:54", "remaining_time": "2:29:21", "throughput": 2310.38, "total_tokens": 18007120} {"current_steps": 31235, "total_steps": 67140, "loss": 0.5909, "lr": 3.2292013360133416e-05, "epoch": 4.652219243372058, "percentage": 46.52, "elapsed_time": "2:09:55", "remaining_time": "2:29:20", "throughput": 2310.4, "total_tokens": 18009808} {"current_steps": 31240, "total_steps": 67140, "loss": 0.6435, "lr": 3.228579686792898e-05, "epoch": 4.652963955913018, "percentage": 46.53, "elapsed_time": "2:09:56", "remaining_time": "2:29:19", "throughput": 2310.42, "total_tokens": 18012592} {"current_steps": 31245, "total_steps": 67140, "loss": 0.7385, "lr": 3.227957988338001e-05, "epoch": 4.653708668453977, "percentage": 46.54, "elapsed_time": "2:09:57", "remaining_time": "2:29:17", "throughput": 2310.46, "total_tokens": 18015568} {"current_steps": 31250, "total_steps": 67140, "loss": 0.7058, "lr": 3.227336240690663e-05, "epoch": 4.654453380994936, "percentage": 46.54, "elapsed_time": "2:09:58", "remaining_time": "2:29:16", "throughput": 2310.49, "total_tokens": 18018384} {"current_steps": 31255, "total_steps": 67140, "loss": 0.608, "lr": 3.226714443892899e-05, "epoch": 4.655198093535895, "percentage": 46.55, "elapsed_time": "2:09:59", "remaining_time": "2:29:15", "throughput": 2310.51, "total_tokens": 18021104} {"current_steps": 31260, "total_steps": 67140, "loss": 0.5332, "lr": 3.226092597986728e-05, "epoch": 4.655942806076855, "percentage": 46.56, "elapsed_time": "2:10:00", "remaining_time": "2:29:13", "throughput": 2310.53, "total_tokens": 18023824} {"current_steps": 31265, "total_steps": 67140, "loss": 0.5952, "lr": 3.225470703014171e-05, "epoch": 4.656687518617813, "percentage": 46.57, "elapsed_time": "2:10:01", "remaining_time": "2:29:12", "throughput": 2310.56, "total_tokens": 18026704} {"current_steps": 31270, "total_steps": 67140, "loss": 0.5399, "lr": 3.224848759017253e-05, "epoch": 4.657432231158773, "percentage": 46.57, "elapsed_time": "2:10:02", "remaining_time": "2:29:10", "throughput": 2310.59, "total_tokens": 18029520} {"current_steps": 31275, "total_steps": 67140, "loss": 0.5321, "lr": 3.224226766038004e-05, "epoch": 4.658176943699732, "percentage": 46.58, "elapsed_time": "2:10:04", "remaining_time": "2:29:09", "throughput": 2310.61, "total_tokens": 18032176} {"current_steps": 31280, "total_steps": 67140, "loss": 0.6914, "lr": 3.223604724118453e-05, "epoch": 4.658921656240691, "percentage": 46.59, "elapsed_time": "2:10:05", "remaining_time": "2:29:08", "throughput": 2310.66, "total_tokens": 18035248} {"current_steps": 31285, "total_steps": 67140, "loss": 0.561, "lr": 3.2229826333006374e-05, "epoch": 4.65966636878165, "percentage": 46.6, "elapsed_time": "2:10:06", "remaining_time": "2:29:06", "throughput": 2310.67, "total_tokens": 18037936} {"current_steps": 31290, "total_steps": 67140, "loss": 0.5405, "lr": 3.222360493626595e-05, "epoch": 4.66041108132261, "percentage": 46.6, "elapsed_time": "2:10:07", "remaining_time": "2:29:05", "throughput": 2310.69, "total_tokens": 18040624} {"current_steps": 31295, "total_steps": 67140, "loss": 0.765, "lr": 3.2217383051383676e-05, "epoch": 4.661155793863569, "percentage": 46.61, "elapsed_time": "2:10:08", "remaining_time": "2:29:03", "throughput": 2310.72, "total_tokens": 18043536} {"current_steps": 31300, "total_steps": 67140, "loss": 0.6622, "lr": 3.2211160678779994e-05, "epoch": 4.661900506404528, "percentage": 46.62, "elapsed_time": "2:10:09", "remaining_time": "2:29:02", "throughput": 2310.76, "total_tokens": 18046480} {"current_steps": 31305, "total_steps": 67140, "loss": 0.6703, "lr": 3.22049378188754e-05, "epoch": 4.662645218945487, "percentage": 46.63, "elapsed_time": "2:10:10", "remaining_time": "2:29:01", "throughput": 2310.79, "total_tokens": 18049328} {"current_steps": 31310, "total_steps": 67140, "loss": 0.5668, "lr": 3.219871447209039e-05, "epoch": 4.663389931486446, "percentage": 46.63, "elapsed_time": "2:10:12", "remaining_time": "2:28:59", "throughput": 2310.84, "total_tokens": 18052368} {"current_steps": 31315, "total_steps": 67140, "loss": 0.6795, "lr": 3.219249063884553e-05, "epoch": 4.664134644027405, "percentage": 46.64, "elapsed_time": "2:10:13", "remaining_time": "2:28:58", "throughput": 2310.87, "total_tokens": 18055280} {"current_steps": 31320, "total_steps": 67140, "loss": 0.8229, "lr": 3.2186266319561395e-05, "epoch": 4.664879356568365, "percentage": 46.65, "elapsed_time": "2:10:14", "remaining_time": "2:28:57", "throughput": 2310.93, "total_tokens": 18058416} {"current_steps": 31325, "total_steps": 67140, "loss": 0.6237, "lr": 3.21800415146586e-05, "epoch": 4.665624069109324, "percentage": 46.66, "elapsed_time": "2:10:15", "remaining_time": "2:28:55", "throughput": 2310.94, "total_tokens": 18061008} {"current_steps": 31330, "total_steps": 67140, "loss": 0.5716, "lr": 3.217381622455778e-05, "epoch": 4.666368781650283, "percentage": 46.66, "elapsed_time": "2:10:16", "remaining_time": "2:28:54", "throughput": 2310.98, "total_tokens": 18064080} {"current_steps": 31335, "total_steps": 67140, "loss": 0.5853, "lr": 3.216759044967965e-05, "epoch": 4.667113494191242, "percentage": 46.67, "elapsed_time": "2:10:17", "remaining_time": "2:28:53", "throughput": 2311.03, "total_tokens": 18067120} {"current_steps": 31340, "total_steps": 67140, "loss": 0.7301, "lr": 3.2161364190444884e-05, "epoch": 4.667858206732202, "percentage": 46.68, "elapsed_time": "2:10:18", "remaining_time": "2:28:51", "throughput": 2311.04, "total_tokens": 18069808} {"current_steps": 31345, "total_steps": 67140, "loss": 0.5542, "lr": 3.2155137447274245e-05, "epoch": 4.668602919273161, "percentage": 46.69, "elapsed_time": "2:10:20", "remaining_time": "2:28:50", "throughput": 2311.07, "total_tokens": 18072688} {"current_steps": 31350, "total_steps": 67140, "loss": 0.6824, "lr": 3.2148910220588495e-05, "epoch": 4.669347631814119, "percentage": 46.69, "elapsed_time": "2:10:21", "remaining_time": "2:28:48", "throughput": 2311.1, "total_tokens": 18075440} {"current_steps": 31355, "total_steps": 67140, "loss": 0.7617, "lr": 3.2142682510808474e-05, "epoch": 4.670092344355079, "percentage": 46.7, "elapsed_time": "2:10:22", "remaining_time": "2:28:47", "throughput": 2311.16, "total_tokens": 18078672} {"current_steps": 31360, "total_steps": 67140, "loss": 0.6532, "lr": 3.213645431835501e-05, "epoch": 4.670837056896038, "percentage": 46.71, "elapsed_time": "2:10:23", "remaining_time": "2:28:46", "throughput": 2311.21, "total_tokens": 18081680} {"current_steps": 31365, "total_steps": 67140, "loss": 0.5026, "lr": 3.213022564364897e-05, "epoch": 4.671581769436997, "percentage": 46.72, "elapsed_time": "2:10:24", "remaining_time": "2:28:44", "throughput": 2311.25, "total_tokens": 18084656} {"current_steps": 31370, "total_steps": 67140, "loss": 0.6001, "lr": 3.212399648711127e-05, "epoch": 4.672326481977956, "percentage": 46.72, "elapsed_time": "2:10:25", "remaining_time": "2:28:43", "throughput": 2311.27, "total_tokens": 18087472} {"current_steps": 31375, "total_steps": 67140, "loss": 0.6656, "lr": 3.2117766849162855e-05, "epoch": 4.673071194518916, "percentage": 46.73, "elapsed_time": "2:10:26", "remaining_time": "2:28:42", "throughput": 2311.33, "total_tokens": 18090640} {"current_steps": 31380, "total_steps": 67140, "loss": 0.5255, "lr": 3.211153673022469e-05, "epoch": 4.673815907059875, "percentage": 46.74, "elapsed_time": "2:10:28", "remaining_time": "2:28:40", "throughput": 2311.36, "total_tokens": 18093456} {"current_steps": 31385, "total_steps": 67140, "loss": 0.5523, "lr": 3.2105306130717786e-05, "epoch": 4.674560619600834, "percentage": 46.75, "elapsed_time": "2:10:29", "remaining_time": "2:28:39", "throughput": 2311.39, "total_tokens": 18096304} {"current_steps": 31390, "total_steps": 67140, "loss": 0.6897, "lr": 3.209907505106319e-05, "epoch": 4.675305332141793, "percentage": 46.75, "elapsed_time": "2:10:30", "remaining_time": "2:28:37", "throughput": 2311.42, "total_tokens": 18099184} {"current_steps": 31395, "total_steps": 67140, "loss": 0.6665, "lr": 3.209284349168196e-05, "epoch": 4.676050044682753, "percentage": 46.76, "elapsed_time": "2:10:31", "remaining_time": "2:28:36", "throughput": 2311.48, "total_tokens": 18102352} {"current_steps": 31400, "total_steps": 67140, "loss": 0.5866, "lr": 3.20866114529952e-05, "epoch": 4.676794757223711, "percentage": 46.77, "elapsed_time": "2:10:32", "remaining_time": "2:28:35", "throughput": 2311.5, "total_tokens": 18104976} {"current_steps": 31405, "total_steps": 67140, "loss": 0.7121, "lr": 3.208037893542406e-05, "epoch": 4.677539469764671, "percentage": 46.78, "elapsed_time": "2:10:33", "remaining_time": "2:28:33", "throughput": 2311.53, "total_tokens": 18107792} {"current_steps": 31410, "total_steps": 67140, "loss": 0.5846, "lr": 3.207414593938969e-05, "epoch": 4.67828418230563, "percentage": 46.78, "elapsed_time": "2:10:34", "remaining_time": "2:28:32", "throughput": 2311.55, "total_tokens": 18110608} {"current_steps": 31415, "total_steps": 67140, "loss": 0.4592, "lr": 3.2067912465313305e-05, "epoch": 4.6790288948465895, "percentage": 46.79, "elapsed_time": "2:10:35", "remaining_time": "2:28:31", "throughput": 2311.57, "total_tokens": 18113392} {"current_steps": 31420, "total_steps": 67140, "loss": 0.6491, "lr": 3.2061678513616125e-05, "epoch": 4.679773607387548, "percentage": 46.8, "elapsed_time": "2:10:37", "remaining_time": "2:28:29", "throughput": 2311.6, "total_tokens": 18116176} {"current_steps": 31425, "total_steps": 67140, "loss": 0.7462, "lr": 3.205544408471943e-05, "epoch": 4.680518319928508, "percentage": 46.81, "elapsed_time": "2:10:38", "remaining_time": "2:28:28", "throughput": 2311.62, "total_tokens": 18118960} {"current_steps": 31430, "total_steps": 67140, "loss": 0.6664, "lr": 3.20492091790445e-05, "epoch": 4.681263032469467, "percentage": 46.81, "elapsed_time": "2:10:39", "remaining_time": "2:28:26", "throughput": 2311.63, "total_tokens": 18121616} {"current_steps": 31435, "total_steps": 67140, "loss": 0.5801, "lr": 3.2042973797012674e-05, "epoch": 4.682007745010426, "percentage": 46.82, "elapsed_time": "2:10:40", "remaining_time": "2:28:25", "throughput": 2311.64, "total_tokens": 18124176} {"current_steps": 31440, "total_steps": 67140, "loss": 0.4862, "lr": 3.203673793904532e-05, "epoch": 4.682752457551385, "percentage": 46.83, "elapsed_time": "2:10:41", "remaining_time": "2:28:24", "throughput": 2311.67, "total_tokens": 18126992} {"current_steps": 31445, "total_steps": 67140, "loss": 0.586, "lr": 3.2030501605563824e-05, "epoch": 4.683497170092345, "percentage": 46.83, "elapsed_time": "2:10:42", "remaining_time": "2:28:22", "throughput": 2311.72, "total_tokens": 18130064} {"current_steps": 31450, "total_steps": 67140, "loss": 0.729, "lr": 3.202426479698961e-05, "epoch": 4.684241882633303, "percentage": 46.84, "elapsed_time": "2:10:43", "remaining_time": "2:28:21", "throughput": 2311.77, "total_tokens": 18133072} {"current_steps": 31455, "total_steps": 67140, "loss": 0.7873, "lr": 3.201802751374415e-05, "epoch": 4.684986595174263, "percentage": 46.85, "elapsed_time": "2:10:44", "remaining_time": "2:28:19", "throughput": 2311.79, "total_tokens": 18135856} {"current_steps": 31460, "total_steps": 67140, "loss": 0.6646, "lr": 3.201178975624891e-05, "epoch": 4.685731307715222, "percentage": 46.86, "elapsed_time": "2:10:46", "remaining_time": "2:28:18", "throughput": 2311.82, "total_tokens": 18138768} {"current_steps": 31465, "total_steps": 67140, "loss": 0.7157, "lr": 3.200555152492543e-05, "epoch": 4.6864760202561815, "percentage": 46.86, "elapsed_time": "2:10:47", "remaining_time": "2:28:17", "throughput": 2311.87, "total_tokens": 18141744} {"current_steps": 31470, "total_steps": 67140, "loss": 0.6816, "lr": 3.199931282019527e-05, "epoch": 4.68722073279714, "percentage": 46.87, "elapsed_time": "2:10:48", "remaining_time": "2:28:15", "throughput": 2311.9, "total_tokens": 18144720} {"current_steps": 31475, "total_steps": 67140, "loss": 0.55, "lr": 3.1993073642479996e-05, "epoch": 4.687965445338099, "percentage": 46.88, "elapsed_time": "2:10:49", "remaining_time": "2:28:14", "throughput": 2311.92, "total_tokens": 18147472} {"current_steps": 31480, "total_steps": 67140, "loss": 0.8765, "lr": 3.1986833992201235e-05, "epoch": 4.688710157879059, "percentage": 46.89, "elapsed_time": "2:10:50", "remaining_time": "2:28:13", "throughput": 2311.96, "total_tokens": 18150384} {"current_steps": 31485, "total_steps": 67140, "loss": 0.6225, "lr": 3.198059386978064e-05, "epoch": 4.689454870420018, "percentage": 46.89, "elapsed_time": "2:10:51", "remaining_time": "2:28:11", "throughput": 2312.02, "total_tokens": 18153488} {"current_steps": 31490, "total_steps": 67140, "loss": 0.8289, "lr": 3.19743532756399e-05, "epoch": 4.690199582960977, "percentage": 46.9, "elapsed_time": "2:10:52", "remaining_time": "2:28:10", "throughput": 2312.05, "total_tokens": 18156368} {"current_steps": 31495, "total_steps": 67140, "loss": 0.5425, "lr": 3.1968112210200715e-05, "epoch": 4.690944295501936, "percentage": 46.91, "elapsed_time": "2:10:54", "remaining_time": "2:28:08", "throughput": 2312.09, "total_tokens": 18159344} {"current_steps": 31500, "total_steps": 67140, "loss": 0.5918, "lr": 3.1961870673884845e-05, "epoch": 4.6916890080428955, "percentage": 46.92, "elapsed_time": "2:10:55", "remaining_time": "2:28:07", "throughput": 2312.13, "total_tokens": 18162320} {"current_steps": 31505, "total_steps": 67140, "loss": 0.6079, "lr": 3.1955628667114055e-05, "epoch": 4.692433720583855, "percentage": 46.92, "elapsed_time": "2:10:56", "remaining_time": "2:28:06", "throughput": 2312.16, "total_tokens": 18165136} {"current_steps": 31510, "total_steps": 67140, "loss": 0.7323, "lr": 3.1949386190310154e-05, "epoch": 4.693178433124814, "percentage": 46.93, "elapsed_time": "2:10:57", "remaining_time": "2:28:04", "throughput": 2312.2, "total_tokens": 18168112} {"current_steps": 31515, "total_steps": 67140, "loss": 0.7106, "lr": 3.1943143243895e-05, "epoch": 4.693923145665773, "percentage": 46.94, "elapsed_time": "2:10:58", "remaining_time": "2:28:03", "throughput": 2312.24, "total_tokens": 18171088} {"current_steps": 31520, "total_steps": 67140, "loss": 0.5173, "lr": 3.193689982829044e-05, "epoch": 4.694667858206732, "percentage": 46.95, "elapsed_time": "2:10:59", "remaining_time": "2:28:02", "throughput": 2312.3, "total_tokens": 18174288} {"current_steps": 31525, "total_steps": 67140, "loss": 0.7377, "lr": 3.1930655943918405e-05, "epoch": 4.695412570747691, "percentage": 46.95, "elapsed_time": "2:11:00", "remaining_time": "2:28:00", "throughput": 2312.34, "total_tokens": 18177296} {"current_steps": 31530, "total_steps": 67140, "loss": 0.6489, "lr": 3.192441159120081e-05, "epoch": 4.696157283288651, "percentage": 46.96, "elapsed_time": "2:11:02", "remaining_time": "2:27:59", "throughput": 2312.35, "total_tokens": 18179888} {"current_steps": 31535, "total_steps": 67140, "loss": 0.6767, "lr": 3.1918166770559644e-05, "epoch": 4.696901995829609, "percentage": 46.97, "elapsed_time": "2:11:03", "remaining_time": "2:27:58", "throughput": 2312.41, "total_tokens": 18182992} {"current_steps": 31540, "total_steps": 67140, "loss": 0.7528, "lr": 3.191192148241689e-05, "epoch": 4.697646708370569, "percentage": 46.98, "elapsed_time": "2:11:04", "remaining_time": "2:27:56", "throughput": 2312.45, "total_tokens": 18185968} {"current_steps": 31545, "total_steps": 67140, "loss": 0.6664, "lr": 3.190567572719457e-05, "epoch": 4.698391420911528, "percentage": 46.98, "elapsed_time": "2:11:05", "remaining_time": "2:27:55", "throughput": 2312.45, "total_tokens": 18188560} {"current_steps": 31550, "total_steps": 67140, "loss": 0.7474, "lr": 3.189942950531478e-05, "epoch": 4.6991361334524875, "percentage": 46.99, "elapsed_time": "2:11:06", "remaining_time": "2:27:54", "throughput": 2312.5, "total_tokens": 18191696} {"current_steps": 31555, "total_steps": 67140, "loss": 0.5143, "lr": 3.189318281719959e-05, "epoch": 4.699880845993446, "percentage": 47.0, "elapsed_time": "2:11:07", "remaining_time": "2:27:52", "throughput": 2312.53, "total_tokens": 18194480} {"current_steps": 31560, "total_steps": 67140, "loss": 0.5707, "lr": 3.1886935663271125e-05, "epoch": 4.700625558534406, "percentage": 47.01, "elapsed_time": "2:11:08", "remaining_time": "2:27:51", "throughput": 2312.58, "total_tokens": 18197552} {"current_steps": 31565, "total_steps": 67140, "loss": 0.7068, "lr": 3.188068804395155e-05, "epoch": 4.701370271075365, "percentage": 47.01, "elapsed_time": "2:11:10", "remaining_time": "2:27:49", "throughput": 2312.62, "total_tokens": 18200528} {"current_steps": 31570, "total_steps": 67140, "loss": 0.6471, "lr": 3.1874439959663055e-05, "epoch": 4.702114983616324, "percentage": 47.02, "elapsed_time": "2:11:11", "remaining_time": "2:27:48", "throughput": 2312.64, "total_tokens": 18203216} {"current_steps": 31575, "total_steps": 67140, "loss": 0.5376, "lr": 3.1868191410827855e-05, "epoch": 4.702859696157283, "percentage": 47.03, "elapsed_time": "2:11:12", "remaining_time": "2:27:47", "throughput": 2312.68, "total_tokens": 18206192} {"current_steps": 31580, "total_steps": 67140, "loss": 0.7033, "lr": 3.18619423978682e-05, "epoch": 4.703604408698243, "percentage": 47.04, "elapsed_time": "2:11:13", "remaining_time": "2:27:45", "throughput": 2312.7, "total_tokens": 18209040} {"current_steps": 31585, "total_steps": 67140, "loss": 0.6432, "lr": 3.185569292120638e-05, "epoch": 4.7043491212392015, "percentage": 47.04, "elapsed_time": "2:11:14", "remaining_time": "2:27:44", "throughput": 2312.73, "total_tokens": 18211856} {"current_steps": 31590, "total_steps": 67140, "loss": 0.579, "lr": 3.1849442981264707e-05, "epoch": 4.705093833780161, "percentage": 47.05, "elapsed_time": "2:11:15", "remaining_time": "2:27:43", "throughput": 2312.78, "total_tokens": 18214960} {"current_steps": 31595, "total_steps": 67140, "loss": 0.6198, "lr": 3.184319257846553e-05, "epoch": 4.70583854632112, "percentage": 47.06, "elapsed_time": "2:11:16", "remaining_time": "2:27:41", "throughput": 2312.81, "total_tokens": 18217744} {"current_steps": 31600, "total_steps": 67140, "loss": 0.4536, "lr": 3.183694171323121e-05, "epoch": 4.7065832588620795, "percentage": 47.07, "elapsed_time": "2:11:18", "remaining_time": "2:27:40", "throughput": 2312.83, "total_tokens": 18220464} {"current_steps": 31605, "total_steps": 67140, "loss": 0.6554, "lr": 3.183069038598417e-05, "epoch": 4.707327971403038, "percentage": 47.07, "elapsed_time": "2:11:19", "remaining_time": "2:27:38", "throughput": 2312.87, "total_tokens": 18223408} {"current_steps": 31610, "total_steps": 67140, "loss": 0.7415, "lr": 3.182443859714685e-05, "epoch": 4.708072683943998, "percentage": 47.08, "elapsed_time": "2:11:20", "remaining_time": "2:27:37", "throughput": 2312.91, "total_tokens": 18226416} {"current_steps": 31615, "total_steps": 67140, "loss": 0.6384, "lr": 3.181818634714171e-05, "epoch": 4.708817396484957, "percentage": 47.09, "elapsed_time": "2:11:21", "remaining_time": "2:27:36", "throughput": 2312.93, "total_tokens": 18229072} {"current_steps": 31620, "total_steps": 67140, "loss": 0.6883, "lr": 3.1811933636391266e-05, "epoch": 4.709562109025916, "percentage": 47.1, "elapsed_time": "2:11:22", "remaining_time": "2:27:34", "throughput": 2312.95, "total_tokens": 18231824} {"current_steps": 31625, "total_steps": 67140, "loss": 0.553, "lr": 3.1805680465318035e-05, "epoch": 4.710306821566875, "percentage": 47.1, "elapsed_time": "2:11:23", "remaining_time": "2:27:33", "throughput": 2312.97, "total_tokens": 18234576} {"current_steps": 31630, "total_steps": 67140, "loss": 0.6932, "lr": 3.179942683434458e-05, "epoch": 4.711051534107835, "percentage": 47.11, "elapsed_time": "2:11:24", "remaining_time": "2:27:31", "throughput": 2312.99, "total_tokens": 18237360} {"current_steps": 31635, "total_steps": 67140, "loss": 0.8463, "lr": 3.1793172743893515e-05, "epoch": 4.7117962466487935, "percentage": 47.12, "elapsed_time": "2:11:25", "remaining_time": "2:27:30", "throughput": 2313.02, "total_tokens": 18240176} {"current_steps": 31640, "total_steps": 67140, "loss": 0.7988, "lr": 3.178691819438746e-05, "epoch": 4.712540959189753, "percentage": 47.13, "elapsed_time": "2:11:27", "remaining_time": "2:27:29", "throughput": 2313.07, "total_tokens": 18243344} {"current_steps": 31645, "total_steps": 67140, "loss": 0.7307, "lr": 3.178066318624905e-05, "epoch": 4.713285671730712, "percentage": 47.13, "elapsed_time": "2:11:28", "remaining_time": "2:27:27", "throughput": 2313.11, "total_tokens": 18246256} {"current_steps": 31650, "total_steps": 67140, "loss": 0.6676, "lr": 3.1774407719901e-05, "epoch": 4.7140303842716715, "percentage": 47.14, "elapsed_time": "2:11:29", "remaining_time": "2:27:26", "throughput": 2313.16, "total_tokens": 18249328} {"current_steps": 31655, "total_steps": 67140, "loss": 0.6047, "lr": 3.1768151795766025e-05, "epoch": 4.71477509681263, "percentage": 47.15, "elapsed_time": "2:11:30", "remaining_time": "2:27:25", "throughput": 2313.2, "total_tokens": 18252304} {"current_steps": 31660, "total_steps": 67140, "loss": 0.4656, "lr": 3.1761895414266865e-05, "epoch": 4.715519809353589, "percentage": 47.16, "elapsed_time": "2:11:31", "remaining_time": "2:27:23", "throughput": 2313.22, "total_tokens": 18255120} {"current_steps": 31665, "total_steps": 67140, "loss": 0.6345, "lr": 3.1755638575826295e-05, "epoch": 4.716264521894549, "percentage": 47.16, "elapsed_time": "2:11:32", "remaining_time": "2:27:22", "throughput": 2313.26, "total_tokens": 18258096} {"current_steps": 31670, "total_steps": 67140, "loss": 0.8339, "lr": 3.1749381280867146e-05, "epoch": 4.717009234435508, "percentage": 47.17, "elapsed_time": "2:11:33", "remaining_time": "2:27:21", "throughput": 2313.27, "total_tokens": 18260720} {"current_steps": 31675, "total_steps": 67140, "loss": 0.5795, "lr": 3.174312352981225e-05, "epoch": 4.717753946976467, "percentage": 47.18, "elapsed_time": "2:11:35", "remaining_time": "2:27:19", "throughput": 2313.29, "total_tokens": 18263440} {"current_steps": 31680, "total_steps": 67140, "loss": 0.8423, "lr": 3.173686532308448e-05, "epoch": 4.718498659517426, "percentage": 47.18, "elapsed_time": "2:11:36", "remaining_time": "2:27:18", "throughput": 2313.31, "total_tokens": 18266192} {"current_steps": 31685, "total_steps": 67140, "loss": 0.6868, "lr": 3.1730606661106736e-05, "epoch": 4.7192433720583855, "percentage": 47.19, "elapsed_time": "2:11:37", "remaining_time": "2:27:16", "throughput": 2313.37, "total_tokens": 18269392} {"current_steps": 31690, "total_steps": 67140, "loss": 0.5431, "lr": 3.172434754430197e-05, "epoch": 4.719988084599344, "percentage": 47.2, "elapsed_time": "2:11:38", "remaining_time": "2:27:15", "throughput": 2313.4, "total_tokens": 18272272} {"current_steps": 31695, "total_steps": 67140, "loss": 0.5167, "lr": 3.1718087973093135e-05, "epoch": 4.720732797140304, "percentage": 47.21, "elapsed_time": "2:11:39", "remaining_time": "2:27:14", "throughput": 2313.45, "total_tokens": 18275408} {"current_steps": 31700, "total_steps": 67140, "loss": 0.657, "lr": 3.171182794790322e-05, "epoch": 4.721477509681263, "percentage": 47.21, "elapsed_time": "2:11:40", "remaining_time": "2:27:12", "throughput": 2313.5, "total_tokens": 18278448} {"current_steps": 31705, "total_steps": 67140, "loss": 0.5501, "lr": 3.1705567469155266e-05, "epoch": 4.722222222222222, "percentage": 47.22, "elapsed_time": "2:11:41", "remaining_time": "2:27:11", "throughput": 2313.52, "total_tokens": 18281136} {"current_steps": 31710, "total_steps": 67140, "loss": 0.592, "lr": 3.169930653727232e-05, "epoch": 4.722966934763181, "percentage": 47.23, "elapsed_time": "2:11:43", "remaining_time": "2:27:10", "throughput": 2313.56, "total_tokens": 18284080} {"current_steps": 31715, "total_steps": 67140, "loss": 0.6273, "lr": 3.169304515267748e-05, "epoch": 4.723711647304141, "percentage": 47.24, "elapsed_time": "2:11:44", "remaining_time": "2:27:08", "throughput": 2313.59, "total_tokens": 18286992} {"current_steps": 31720, "total_steps": 67140, "loss": 0.6286, "lr": 3.168678331579387e-05, "epoch": 4.7244563598450995, "percentage": 47.24, "elapsed_time": "2:11:45", "remaining_time": "2:27:07", "throughput": 2313.62, "total_tokens": 18289936} {"current_steps": 31725, "total_steps": 67140, "loss": 0.4882, "lr": 3.168052102704461e-05, "epoch": 4.725201072386059, "percentage": 47.25, "elapsed_time": "2:11:46", "remaining_time": "2:27:06", "throughput": 2313.65, "total_tokens": 18292752} {"current_steps": 31730, "total_steps": 67140, "loss": 0.6014, "lr": 3.1674258286852906e-05, "epoch": 4.725945784927018, "percentage": 47.26, "elapsed_time": "2:11:47", "remaining_time": "2:27:04", "throughput": 2313.69, "total_tokens": 18295728} {"current_steps": 31735, "total_steps": 67140, "loss": 0.6147, "lr": 3.1667995095641975e-05, "epoch": 4.7266904974679775, "percentage": 47.27, "elapsed_time": "2:11:48", "remaining_time": "2:27:03", "throughput": 2313.72, "total_tokens": 18298576} {"current_steps": 31740, "total_steps": 67140, "loss": 0.6775, "lr": 3.1661731453835036e-05, "epoch": 4.727435210008936, "percentage": 47.27, "elapsed_time": "2:11:49", "remaining_time": "2:27:01", "throughput": 2313.74, "total_tokens": 18301360} {"current_steps": 31745, "total_steps": 67140, "loss": 0.7092, "lr": 3.165546736185537e-05, "epoch": 4.728179922549896, "percentage": 47.28, "elapsed_time": "2:11:51", "remaining_time": "2:27:00", "throughput": 2313.82, "total_tokens": 18304880} {"current_steps": 31750, "total_steps": 67140, "loss": 0.599, "lr": 3.1649202820126275e-05, "epoch": 4.728924635090855, "percentage": 47.29, "elapsed_time": "2:11:52", "remaining_time": "2:26:59", "throughput": 2313.85, "total_tokens": 18307664} {"current_steps": 31755, "total_steps": 67140, "loss": 0.6445, "lr": 3.16429378290711e-05, "epoch": 4.729669347631814, "percentage": 47.3, "elapsed_time": "2:11:53", "remaining_time": "2:26:57", "throughput": 2313.87, "total_tokens": 18310384} {"current_steps": 31760, "total_steps": 67140, "loss": 0.5664, "lr": 3.1636672389113185e-05, "epoch": 4.730414060172773, "percentage": 47.3, "elapsed_time": "2:11:54", "remaining_time": "2:26:56", "throughput": 2313.89, "total_tokens": 18313168} {"current_steps": 31765, "total_steps": 67140, "loss": 0.6658, "lr": 3.163040650067593e-05, "epoch": 4.731158772713733, "percentage": 47.31, "elapsed_time": "2:11:55", "remaining_time": "2:26:55", "throughput": 2313.97, "total_tokens": 18316560} {"current_steps": 31770, "total_steps": 67140, "loss": 0.6184, "lr": 3.162414016418277e-05, "epoch": 4.7319034852546915, "percentage": 47.32, "elapsed_time": "2:11:56", "remaining_time": "2:26:53", "throughput": 2313.99, "total_tokens": 18319280} {"current_steps": 31775, "total_steps": 67140, "loss": 0.5923, "lr": 3.161787338005715e-05, "epoch": 4.732648197795651, "percentage": 47.33, "elapsed_time": "2:11:57", "remaining_time": "2:26:52", "throughput": 2314.01, "total_tokens": 18322064} {"current_steps": 31780, "total_steps": 67140, "loss": 0.512, "lr": 3.161160614872254e-05, "epoch": 4.73339291033661, "percentage": 47.33, "elapsed_time": "2:11:59", "remaining_time": "2:26:51", "throughput": 2314.04, "total_tokens": 18324912} {"current_steps": 31785, "total_steps": 67140, "loss": 0.4842, "lr": 3.160533847060248e-05, "epoch": 4.73413762287757, "percentage": 47.34, "elapsed_time": "2:12:00", "remaining_time": "2:26:49", "throughput": 2314.06, "total_tokens": 18327664} {"current_steps": 31790, "total_steps": 67140, "loss": 0.6212, "lr": 3.1599070346120497e-05, "epoch": 4.734882335418528, "percentage": 47.35, "elapsed_time": "2:12:01", "remaining_time": "2:26:48", "throughput": 2314.11, "total_tokens": 18330736} {"current_steps": 31795, "total_steps": 67140, "loss": 0.952, "lr": 3.1592801775700165e-05, "epoch": 4.735627047959488, "percentage": 47.36, "elapsed_time": "2:12:02", "remaining_time": "2:26:47", "throughput": 2314.15, "total_tokens": 18333680} {"current_steps": 31800, "total_steps": 67140, "loss": 0.5475, "lr": 3.1586532759765095e-05, "epoch": 4.736371760500447, "percentage": 47.36, "elapsed_time": "2:12:03", "remaining_time": "2:26:45", "throughput": 2314.16, "total_tokens": 18336336} {"current_steps": 31805, "total_steps": 67140, "loss": 0.6359, "lr": 3.158026329873893e-05, "epoch": 4.737116473041406, "percentage": 47.37, "elapsed_time": "2:12:04", "remaining_time": "2:26:44", "throughput": 2314.21, "total_tokens": 18339344} {"current_steps": 31810, "total_steps": 67140, "loss": 0.6017, "lr": 3.157399339304532e-05, "epoch": 4.737861185582365, "percentage": 47.38, "elapsed_time": "2:12:05", "remaining_time": "2:26:42", "throughput": 2314.25, "total_tokens": 18342352} {"current_steps": 31815, "total_steps": 67140, "loss": 0.5751, "lr": 3.1567723043107955e-05, "epoch": 4.738605898123325, "percentage": 47.39, "elapsed_time": "2:12:06", "remaining_time": "2:26:41", "throughput": 2314.26, "total_tokens": 18345040} {"current_steps": 31820, "total_steps": 67140, "loss": 0.5096, "lr": 3.156145224935059e-05, "epoch": 4.7393506106642835, "percentage": 47.39, "elapsed_time": "2:12:08", "remaining_time": "2:26:40", "throughput": 2314.31, "total_tokens": 18348176} {"current_steps": 31825, "total_steps": 67140, "loss": 0.7363, "lr": 3.1555181012196936e-05, "epoch": 4.740095323205242, "percentage": 47.4, "elapsed_time": "2:12:09", "remaining_time": "2:26:38", "throughput": 2314.33, "total_tokens": 18350896} {"current_steps": 31830, "total_steps": 67140, "loss": 0.5114, "lr": 3.154890933207081e-05, "epoch": 4.740840035746202, "percentage": 47.41, "elapsed_time": "2:12:10", "remaining_time": "2:26:37", "throughput": 2314.35, "total_tokens": 18353680} {"current_steps": 31835, "total_steps": 67140, "loss": 0.7524, "lr": 3.154263720939602e-05, "epoch": 4.741584748287162, "percentage": 47.42, "elapsed_time": "2:12:11", "remaining_time": "2:26:36", "throughput": 2314.41, "total_tokens": 18356912} {"current_steps": 31840, "total_steps": 67140, "loss": 0.5396, "lr": 3.15363646445964e-05, "epoch": 4.74232946082812, "percentage": 47.42, "elapsed_time": "2:12:12", "remaining_time": "2:26:34", "throughput": 2314.45, "total_tokens": 18359856} {"current_steps": 31845, "total_steps": 67140, "loss": 0.7996, "lr": 3.153009163809584e-05, "epoch": 4.743074173369079, "percentage": 47.43, "elapsed_time": "2:12:13", "remaining_time": "2:26:33", "throughput": 2314.46, "total_tokens": 18362416} {"current_steps": 31850, "total_steps": 67140, "loss": 0.6291, "lr": 3.1523818190318234e-05, "epoch": 4.743818885910039, "percentage": 47.44, "elapsed_time": "2:12:14", "remaining_time": "2:26:31", "throughput": 2314.49, "total_tokens": 18365360} {"current_steps": 31855, "total_steps": 67140, "loss": 0.7988, "lr": 3.151754430168752e-05, "epoch": 4.744563598450998, "percentage": 47.45, "elapsed_time": "2:12:16", "remaining_time": "2:26:30", "throughput": 2314.5, "total_tokens": 18367952} {"current_steps": 31860, "total_steps": 67140, "loss": 0.5252, "lr": 3.151126997262766e-05, "epoch": 4.745308310991957, "percentage": 47.45, "elapsed_time": "2:12:17", "remaining_time": "2:26:29", "throughput": 2314.53, "total_tokens": 18370736} {"current_steps": 31865, "total_steps": 67140, "loss": 0.5924, "lr": 3.150499520356264e-05, "epoch": 4.746053023532916, "percentage": 47.46, "elapsed_time": "2:12:18", "remaining_time": "2:26:27", "throughput": 2314.56, "total_tokens": 18373712} {"current_steps": 31870, "total_steps": 67140, "loss": 0.5251, "lr": 3.1498719994916507e-05, "epoch": 4.746797736073876, "percentage": 47.47, "elapsed_time": "2:12:19", "remaining_time": "2:26:26", "throughput": 2314.61, "total_tokens": 18376816} {"current_steps": 31875, "total_steps": 67140, "loss": 0.8682, "lr": 3.149244434711328e-05, "epoch": 4.747542448614834, "percentage": 47.48, "elapsed_time": "2:12:20", "remaining_time": "2:26:25", "throughput": 2314.63, "total_tokens": 18379536} {"current_steps": 31880, "total_steps": 67140, "loss": 0.7897, "lr": 3.148616826057708e-05, "epoch": 4.748287161155794, "percentage": 47.48, "elapsed_time": "2:12:21", "remaining_time": "2:26:23", "throughput": 2314.67, "total_tokens": 18382512} {"current_steps": 31885, "total_steps": 67140, "loss": 0.591, "lr": 3.147989173573199e-05, "epoch": 4.749031873696753, "percentage": 47.49, "elapsed_time": "2:12:22", "remaining_time": "2:26:22", "throughput": 2314.69, "total_tokens": 18385232} {"current_steps": 31890, "total_steps": 67140, "loss": 0.7772, "lr": 3.147361477300216e-05, "epoch": 4.749776586237712, "percentage": 47.5, "elapsed_time": "2:12:24", "remaining_time": "2:26:21", "throughput": 2314.73, "total_tokens": 18388272} {"current_steps": 31895, "total_steps": 67140, "loss": 0.6874, "lr": 3.1467337372811764e-05, "epoch": 4.750521298778671, "percentage": 47.51, "elapsed_time": "2:12:25", "remaining_time": "2:26:19", "throughput": 2314.79, "total_tokens": 18391440} {"current_steps": 31900, "total_steps": 67140, "loss": 0.5813, "lr": 3.1461059535585e-05, "epoch": 4.751266011319631, "percentage": 47.51, "elapsed_time": "2:12:26", "remaining_time": "2:26:18", "throughput": 2314.84, "total_tokens": 18394544} {"current_steps": 31905, "total_steps": 67140, "loss": 0.7225, "lr": 3.1454781261746114e-05, "epoch": 4.7520107238605895, "percentage": 47.52, "elapsed_time": "2:12:27", "remaining_time": "2:26:17", "throughput": 2314.91, "total_tokens": 18397840} {"current_steps": 31910, "total_steps": 67140, "loss": 0.5563, "lr": 3.1448502551719336e-05, "epoch": 4.752755436401549, "percentage": 47.53, "elapsed_time": "2:12:28", "remaining_time": "2:26:15", "throughput": 2314.92, "total_tokens": 18400496} {"current_steps": 31915, "total_steps": 67140, "loss": 0.6235, "lr": 3.1442223405928985e-05, "epoch": 4.753500148942508, "percentage": 47.54, "elapsed_time": "2:12:29", "remaining_time": "2:26:14", "throughput": 2314.95, "total_tokens": 18403408} {"current_steps": 31920, "total_steps": 67140, "loss": 0.6058, "lr": 3.1435943824799375e-05, "epoch": 4.754244861483468, "percentage": 47.54, "elapsed_time": "2:12:30", "remaining_time": "2:26:12", "throughput": 2314.99, "total_tokens": 18406384} {"current_steps": 31925, "total_steps": 67140, "loss": 0.7614, "lr": 3.142966380875483e-05, "epoch": 4.754989574024426, "percentage": 47.55, "elapsed_time": "2:12:32", "remaining_time": "2:26:11", "throughput": 2315.02, "total_tokens": 18409232} {"current_steps": 31930, "total_steps": 67140, "loss": 0.4514, "lr": 3.1423383358219756e-05, "epoch": 4.755734286565386, "percentage": 47.56, "elapsed_time": "2:12:33", "remaining_time": "2:26:10", "throughput": 2315.05, "total_tokens": 18412144} {"current_steps": 31935, "total_steps": 67140, "loss": 0.5662, "lr": 3.1417102473618554e-05, "epoch": 4.756478999106345, "percentage": 47.56, "elapsed_time": "2:12:34", "remaining_time": "2:26:08", "throughput": 2315.08, "total_tokens": 18414896} {"current_steps": 31940, "total_steps": 67140, "loss": 0.5523, "lr": 3.141082115537565e-05, "epoch": 4.757223711647304, "percentage": 47.57, "elapsed_time": "2:12:35", "remaining_time": "2:26:07", "throughput": 2315.12, "total_tokens": 18417840} {"current_steps": 31945, "total_steps": 67140, "loss": 0.5809, "lr": 3.1404539403915515e-05, "epoch": 4.757968424188263, "percentage": 47.58, "elapsed_time": "2:12:36", "remaining_time": "2:26:06", "throughput": 2315.15, "total_tokens": 18420688} {"current_steps": 31950, "total_steps": 67140, "loss": 0.7553, "lr": 3.139825721966265e-05, "epoch": 4.758713136729223, "percentage": 47.59, "elapsed_time": "2:12:37", "remaining_time": "2:26:04", "throughput": 2315.16, "total_tokens": 18423312} {"current_steps": 31955, "total_steps": 67140, "loss": 0.6056, "lr": 3.139197460304157e-05, "epoch": 4.759457849270182, "percentage": 47.59, "elapsed_time": "2:12:38", "remaining_time": "2:26:03", "throughput": 2315.17, "total_tokens": 18425968} {"current_steps": 31960, "total_steps": 67140, "loss": 0.64, "lr": 3.138569155447685e-05, "epoch": 4.760202561811141, "percentage": 47.6, "elapsed_time": "2:12:39", "remaining_time": "2:26:01", "throughput": 2315.18, "total_tokens": 18428656} {"current_steps": 31965, "total_steps": 67140, "loss": 0.675, "lr": 3.137940807439304e-05, "epoch": 4.7609472743521, "percentage": 47.61, "elapsed_time": "2:12:41", "remaining_time": "2:26:00", "throughput": 2315.3, "total_tokens": 18432816} {"current_steps": 31970, "total_steps": 67140, "loss": 0.6326, "lr": 3.137312416321478e-05, "epoch": 4.76169198689306, "percentage": 47.62, "elapsed_time": "2:12:42", "remaining_time": "2:25:59", "throughput": 2315.33, "total_tokens": 18435600} {"current_steps": 31975, "total_steps": 67140, "loss": 0.616, "lr": 3.1366839821366696e-05, "epoch": 4.762436699434018, "percentage": 47.62, "elapsed_time": "2:12:43", "remaining_time": "2:25:58", "throughput": 2315.34, "total_tokens": 18438352} {"current_steps": 31980, "total_steps": 67140, "loss": 0.6207, "lr": 3.136055504927347e-05, "epoch": 4.763181411974978, "percentage": 47.63, "elapsed_time": "2:12:44", "remaining_time": "2:25:56", "throughput": 2315.37, "total_tokens": 18441200} {"current_steps": 31985, "total_steps": 67140, "loss": 0.5353, "lr": 3.135426984735978e-05, "epoch": 4.763926124515937, "percentage": 47.64, "elapsed_time": "2:12:45", "remaining_time": "2:25:55", "throughput": 2315.4, "total_tokens": 18444144} {"current_steps": 31990, "total_steps": 67140, "loss": 0.7148, "lr": 3.134798421605037e-05, "epoch": 4.764670837056896, "percentage": 47.65, "elapsed_time": "2:12:46", "remaining_time": "2:25:53", "throughput": 2315.43, "total_tokens": 18446928} {"current_steps": 31995, "total_steps": 67140, "loss": 0.509, "lr": 3.134169815577e-05, "epoch": 4.765415549597855, "percentage": 47.65, "elapsed_time": "2:12:48", "remaining_time": "2:25:52", "throughput": 2315.47, "total_tokens": 18449872} {"current_steps": 32000, "total_steps": 67140, "loss": 0.7053, "lr": 3.133541166694345e-05, "epoch": 4.766160262138815, "percentage": 47.66, "elapsed_time": "2:12:49", "remaining_time": "2:25:51", "throughput": 2315.52, "total_tokens": 18453008} {"current_steps": 32005, "total_steps": 67140, "loss": 0.6457, "lr": 3.132912474999555e-05, "epoch": 4.766904974679774, "percentage": 47.67, "elapsed_time": "2:12:50", "remaining_time": "2:25:49", "throughput": 2315.58, "total_tokens": 18456368} {"current_steps": 32010, "total_steps": 67140, "loss": 0.7997, "lr": 3.132283740535111e-05, "epoch": 4.767649687220732, "percentage": 47.68, "elapsed_time": "2:12:51", "remaining_time": "2:25:48", "throughput": 2315.61, "total_tokens": 18459152} {"current_steps": 32015, "total_steps": 67140, "loss": 0.7698, "lr": 3.131654963343504e-05, "epoch": 4.768394399761692, "percentage": 47.68, "elapsed_time": "2:12:52", "remaining_time": "2:25:47", "throughput": 2315.62, "total_tokens": 18461840} {"current_steps": 32020, "total_steps": 67140, "loss": 0.6591, "lr": 3.1310261434672234e-05, "epoch": 4.769139112302652, "percentage": 47.69, "elapsed_time": "2:12:53", "remaining_time": "2:25:45", "throughput": 2315.68, "total_tokens": 18464976} {"current_steps": 32025, "total_steps": 67140, "loss": 0.6548, "lr": 3.13039728094876e-05, "epoch": 4.76988382484361, "percentage": 47.7, "elapsed_time": "2:12:55", "remaining_time": "2:25:44", "throughput": 2315.7, "total_tokens": 18467856} {"current_steps": 32030, "total_steps": 67140, "loss": 0.6368, "lr": 3.129768375830612e-05, "epoch": 4.770628537384569, "percentage": 47.71, "elapsed_time": "2:12:56", "remaining_time": "2:25:43", "throughput": 2315.78, "total_tokens": 18471248} {"current_steps": 32035, "total_steps": 67140, "loss": 0.4786, "lr": 3.1291394281552776e-05, "epoch": 4.771373249925529, "percentage": 47.71, "elapsed_time": "2:12:57", "remaining_time": "2:25:41", "throughput": 2315.78, "total_tokens": 18473776} {"current_steps": 32040, "total_steps": 67140, "loss": 0.5559, "lr": 3.128510437965259e-05, "epoch": 4.772117962466488, "percentage": 47.72, "elapsed_time": "2:12:58", "remaining_time": "2:25:40", "throughput": 2315.82, "total_tokens": 18476720} {"current_steps": 32045, "total_steps": 67140, "loss": 0.6534, "lr": 3.127881405303059e-05, "epoch": 4.772862675007447, "percentage": 47.73, "elapsed_time": "2:12:59", "remaining_time": "2:25:39", "throughput": 2315.83, "total_tokens": 18479408} {"current_steps": 32050, "total_steps": 67140, "loss": 0.6616, "lr": 3.127252330211187e-05, "epoch": 4.773607387548406, "percentage": 47.74, "elapsed_time": "2:13:00", "remaining_time": "2:25:37", "throughput": 2315.86, "total_tokens": 18482192} {"current_steps": 32055, "total_steps": 67140, "loss": 0.5623, "lr": 3.126623212732153e-05, "epoch": 4.774352100089366, "percentage": 47.74, "elapsed_time": "2:13:01", "remaining_time": "2:25:36", "throughput": 2315.91, "total_tokens": 18485360} {"current_steps": 32060, "total_steps": 67140, "loss": 0.5302, "lr": 3.12599405290847e-05, "epoch": 4.775096812630324, "percentage": 47.75, "elapsed_time": "2:13:03", "remaining_time": "2:25:35", "throughput": 2315.95, "total_tokens": 18488336} {"current_steps": 32065, "total_steps": 67140, "loss": 0.6547, "lr": 3.125364850782654e-05, "epoch": 4.775841525171284, "percentage": 47.76, "elapsed_time": "2:13:04", "remaining_time": "2:25:33", "throughput": 2315.98, "total_tokens": 18491184} {"current_steps": 32070, "total_steps": 67140, "loss": 0.5118, "lr": 3.124735606397224e-05, "epoch": 4.776586237712243, "percentage": 47.77, "elapsed_time": "2:13:05", "remaining_time": "2:25:32", "throughput": 2315.99, "total_tokens": 18493808} {"current_steps": 32075, "total_steps": 67140, "loss": 0.6552, "lr": 3.124106319794701e-05, "epoch": 4.777330950253202, "percentage": 47.77, "elapsed_time": "2:13:06", "remaining_time": "2:25:30", "throughput": 2316.04, "total_tokens": 18496816} {"current_steps": 32080, "total_steps": 67140, "loss": 0.5995, "lr": 3.123476991017611e-05, "epoch": 4.778075662794161, "percentage": 47.78, "elapsed_time": "2:13:07", "remaining_time": "2:25:29", "throughput": 2316.05, "total_tokens": 18499472} {"current_steps": 32085, "total_steps": 67140, "loss": 0.5981, "lr": 3.122847620108481e-05, "epoch": 4.778820375335121, "percentage": 47.79, "elapsed_time": "2:13:08", "remaining_time": "2:25:28", "throughput": 2316.07, "total_tokens": 18502224} {"current_steps": 32090, "total_steps": 67140, "loss": 0.5033, "lr": 3.122218207109841e-05, "epoch": 4.77956508787608, "percentage": 47.8, "elapsed_time": "2:13:09", "remaining_time": "2:25:26", "throughput": 2316.11, "total_tokens": 18505104} {"current_steps": 32095, "total_steps": 67140, "loss": 0.7495, "lr": 3.1215887520642237e-05, "epoch": 4.780309800417039, "percentage": 47.8, "elapsed_time": "2:13:10", "remaining_time": "2:25:25", "throughput": 2316.15, "total_tokens": 18508080} {"current_steps": 32100, "total_steps": 67140, "loss": 0.5567, "lr": 3.120959255014166e-05, "epoch": 4.781054512957998, "percentage": 47.81, "elapsed_time": "2:13:12", "remaining_time": "2:25:23", "throughput": 2316.16, "total_tokens": 18510768} {"current_steps": 32105, "total_steps": 67140, "loss": 0.7695, "lr": 3.120329716002208e-05, "epoch": 4.781799225498958, "percentage": 47.82, "elapsed_time": "2:13:13", "remaining_time": "2:25:22", "throughput": 2316.21, "total_tokens": 18513840} {"current_steps": 32110, "total_steps": 67140, "loss": 0.6999, "lr": 3.119700135070888e-05, "epoch": 4.782543938039916, "percentage": 47.83, "elapsed_time": "2:13:14", "remaining_time": "2:25:21", "throughput": 2316.23, "total_tokens": 18516624} {"current_steps": 32115, "total_steps": 67140, "loss": 0.502, "lr": 3.119070512262753e-05, "epoch": 4.783288650580876, "percentage": 47.83, "elapsed_time": "2:13:15", "remaining_time": "2:25:19", "throughput": 2316.27, "total_tokens": 18519568} {"current_steps": 32120, "total_steps": 67140, "loss": 0.6816, "lr": 3.1184408476203496e-05, "epoch": 4.784033363121835, "percentage": 47.84, "elapsed_time": "2:13:16", "remaining_time": "2:25:18", "throughput": 2316.29, "total_tokens": 18522288} {"current_steps": 32125, "total_steps": 67140, "loss": 0.7462, "lr": 3.1178111411862285e-05, "epoch": 4.7847780756627944, "percentage": 47.85, "elapsed_time": "2:13:17", "remaining_time": "2:25:17", "throughput": 2316.32, "total_tokens": 18525136} {"current_steps": 32130, "total_steps": 67140, "loss": 0.7116, "lr": 3.117181393002942e-05, "epoch": 4.785522788203753, "percentage": 47.86, "elapsed_time": "2:13:18", "remaining_time": "2:25:15", "throughput": 2316.38, "total_tokens": 18528368} {"current_steps": 32135, "total_steps": 67140, "loss": 0.5516, "lr": 3.116551603113046e-05, "epoch": 4.786267500744713, "percentage": 47.86, "elapsed_time": "2:13:20", "remaining_time": "2:25:14", "throughput": 2316.44, "total_tokens": 18531600} {"current_steps": 32140, "total_steps": 67140, "loss": 0.7009, "lr": 3.1159217715591e-05, "epoch": 4.787012213285672, "percentage": 47.87, "elapsed_time": "2:13:21", "remaining_time": "2:25:13", "throughput": 2316.48, "total_tokens": 18534576} {"current_steps": 32145, "total_steps": 67140, "loss": 0.6381, "lr": 3.115291898383664e-05, "epoch": 4.787756925826631, "percentage": 47.88, "elapsed_time": "2:13:22", "remaining_time": "2:25:11", "throughput": 2316.52, "total_tokens": 18537552} {"current_steps": 32150, "total_steps": 67140, "loss": 0.7491, "lr": 3.114661983629304e-05, "epoch": 4.78850163836759, "percentage": 47.89, "elapsed_time": "2:13:23", "remaining_time": "2:25:10", "throughput": 2316.56, "total_tokens": 18540560} {"current_steps": 32155, "total_steps": 67140, "loss": 0.6027, "lr": 3.114032027338585e-05, "epoch": 4.78924635090855, "percentage": 47.89, "elapsed_time": "2:13:24", "remaining_time": "2:25:09", "throughput": 2316.59, "total_tokens": 18543408} {"current_steps": 32160, "total_steps": 67140, "loss": 0.7552, "lr": 3.113402029554079e-05, "epoch": 4.789991063449508, "percentage": 47.9, "elapsed_time": "2:13:25", "remaining_time": "2:25:07", "throughput": 2316.61, "total_tokens": 18546224} {"current_steps": 32165, "total_steps": 67140, "loss": 0.506, "lr": 3.112771990318358e-05, "epoch": 4.790735775990468, "percentage": 47.91, "elapsed_time": "2:13:26", "remaining_time": "2:25:06", "throughput": 2316.64, "total_tokens": 18548976} {"current_steps": 32170, "total_steps": 67140, "loss": 0.7127, "lr": 3.112141909673997e-05, "epoch": 4.791480488531427, "percentage": 47.91, "elapsed_time": "2:13:28", "remaining_time": "2:25:05", "throughput": 2316.67, "total_tokens": 18551952} {"current_steps": 32175, "total_steps": 67140, "loss": 0.7131, "lr": 3.1115117876635735e-05, "epoch": 4.792225201072386, "percentage": 47.92, "elapsed_time": "2:13:29", "remaining_time": "2:25:03", "throughput": 2316.72, "total_tokens": 18555024} {"current_steps": 32180, "total_steps": 67140, "loss": 0.5349, "lr": 3.1108816243296716e-05, "epoch": 4.792969913613345, "percentage": 47.93, "elapsed_time": "2:13:30", "remaining_time": "2:25:02", "throughput": 2316.77, "total_tokens": 18558096} {"current_steps": 32185, "total_steps": 67140, "loss": 0.5747, "lr": 3.110251419714872e-05, "epoch": 4.793714626154305, "percentage": 47.94, "elapsed_time": "2:13:31", "remaining_time": "2:25:00", "throughput": 2316.8, "total_tokens": 18561008} {"current_steps": 32190, "total_steps": 67140, "loss": 0.5474, "lr": 3.109621173861762e-05, "epoch": 4.794459338695264, "percentage": 47.94, "elapsed_time": "2:13:32", "remaining_time": "2:24:59", "throughput": 2316.89, "total_tokens": 18564688} {"current_steps": 32195, "total_steps": 67140, "loss": 0.6863, "lr": 3.1089908868129316e-05, "epoch": 4.795204051236222, "percentage": 47.95, "elapsed_time": "2:13:33", "remaining_time": "2:24:58", "throughput": 2316.93, "total_tokens": 18567728} {"current_steps": 32200, "total_steps": 67140, "loss": 0.654, "lr": 3.108360558610974e-05, "epoch": 4.795948763777182, "percentage": 47.96, "elapsed_time": "2:13:35", "remaining_time": "2:24:57", "throughput": 2316.95, "total_tokens": 18570448} {"current_steps": 32205, "total_steps": 67140, "loss": 0.6983, "lr": 3.1077301892984834e-05, "epoch": 4.796693476318142, "percentage": 47.97, "elapsed_time": "2:13:36", "remaining_time": "2:24:55", "throughput": 2316.99, "total_tokens": 18573392} {"current_steps": 32210, "total_steps": 67140, "loss": 0.7012, "lr": 3.107099778918057e-05, "epoch": 4.7974381888591004, "percentage": 47.97, "elapsed_time": "2:13:37", "remaining_time": "2:24:54", "throughput": 2317.02, "total_tokens": 18576240} {"current_steps": 32215, "total_steps": 67140, "loss": 0.5141, "lr": 3.106469327512296e-05, "epoch": 4.798182901400059, "percentage": 47.98, "elapsed_time": "2:13:38", "remaining_time": "2:24:52", "throughput": 2317.03, "total_tokens": 18578864} {"current_steps": 32220, "total_steps": 67140, "loss": 0.58, "lr": 3.1058388351238035e-05, "epoch": 4.798927613941019, "percentage": 47.99, "elapsed_time": "2:13:39", "remaining_time": "2:24:51", "throughput": 2317.05, "total_tokens": 18581680} {"current_steps": 32225, "total_steps": 67140, "loss": 0.6509, "lr": 3.105208301795185e-05, "epoch": 4.799672326481978, "percentage": 48.0, "elapsed_time": "2:13:40", "remaining_time": "2:24:50", "throughput": 2317.08, "total_tokens": 18584496} {"current_steps": 32230, "total_steps": 67140, "loss": 0.5617, "lr": 3.1045777275690505e-05, "epoch": 4.800417039022937, "percentage": 48.0, "elapsed_time": "2:13:41", "remaining_time": "2:24:48", "throughput": 2317.09, "total_tokens": 18587184} {"current_steps": 32235, "total_steps": 67140, "loss": 0.6178, "lr": 3.1039471124880114e-05, "epoch": 4.801161751563896, "percentage": 48.01, "elapsed_time": "2:13:42", "remaining_time": "2:24:47", "throughput": 2317.14, "total_tokens": 18590352} {"current_steps": 32240, "total_steps": 67140, "loss": 0.658, "lr": 3.103316456594683e-05, "epoch": 4.801906464104856, "percentage": 48.02, "elapsed_time": "2:13:44", "remaining_time": "2:24:46", "throughput": 2317.18, "total_tokens": 18593296} {"current_steps": 32245, "total_steps": 67140, "loss": 0.5269, "lr": 3.1026857599316795e-05, "epoch": 4.802651176645814, "percentage": 48.03, "elapsed_time": "2:13:45", "remaining_time": "2:24:44", "throughput": 2317.2, "total_tokens": 18596112} {"current_steps": 32250, "total_steps": 67140, "loss": 0.597, "lr": 3.102055022541623e-05, "epoch": 4.803395889186774, "percentage": 48.03, "elapsed_time": "2:13:46", "remaining_time": "2:24:43", "throughput": 2317.32, "total_tokens": 18600240} {"current_steps": 32255, "total_steps": 67140, "loss": 0.5275, "lr": 3.1014242444671366e-05, "epoch": 4.804140601727733, "percentage": 48.04, "elapsed_time": "2:13:47", "remaining_time": "2:24:42", "throughput": 2317.35, "total_tokens": 18603088} {"current_steps": 32260, "total_steps": 67140, "loss": 0.4702, "lr": 3.100793425750845e-05, "epoch": 4.8048853142686925, "percentage": 48.05, "elapsed_time": "2:13:48", "remaining_time": "2:24:40", "throughput": 2317.36, "total_tokens": 18605808} {"current_steps": 32265, "total_steps": 67140, "loss": 0.5692, "lr": 3.100162566435375e-05, "epoch": 4.805630026809651, "percentage": 48.06, "elapsed_time": "2:13:49", "remaining_time": "2:24:39", "throughput": 2317.4, "total_tokens": 18608720} {"current_steps": 32270, "total_steps": 67140, "loss": 0.482, "lr": 3.0995316665633606e-05, "epoch": 4.806374739350611, "percentage": 48.06, "elapsed_time": "2:13:51", "remaining_time": "2:24:38", "throughput": 2317.43, "total_tokens": 18611568} {"current_steps": 32275, "total_steps": 67140, "loss": 0.4371, "lr": 3.098900726177432e-05, "epoch": 4.80711945189157, "percentage": 48.07, "elapsed_time": "2:13:52", "remaining_time": "2:24:36", "throughput": 2317.46, "total_tokens": 18614416} {"current_steps": 32280, "total_steps": 67140, "loss": 0.6233, "lr": 3.0982697453202284e-05, "epoch": 4.807864164432529, "percentage": 48.08, "elapsed_time": "2:13:53", "remaining_time": "2:24:35", "throughput": 2317.49, "total_tokens": 18617232} {"current_steps": 32285, "total_steps": 67140, "loss": 0.5973, "lr": 3.0976387240343886e-05, "epoch": 4.808608876973488, "percentage": 48.09, "elapsed_time": "2:13:54", "remaining_time": "2:24:34", "throughput": 2317.52, "total_tokens": 18620080} {"current_steps": 32290, "total_steps": 67140, "loss": 0.6568, "lr": 3.097007662362552e-05, "epoch": 4.809353589514448, "percentage": 48.09, "elapsed_time": "2:13:55", "remaining_time": "2:24:32", "throughput": 2317.54, "total_tokens": 18622960} {"current_steps": 32295, "total_steps": 67140, "loss": 0.6453, "lr": 3.096376560347365e-05, "epoch": 4.8100983020554064, "percentage": 48.1, "elapsed_time": "2:13:56", "remaining_time": "2:24:31", "throughput": 2317.58, "total_tokens": 18625936} {"current_steps": 32300, "total_steps": 67140, "loss": 0.7298, "lr": 3.095745418031476e-05, "epoch": 4.810843014596366, "percentage": 48.11, "elapsed_time": "2:13:57", "remaining_time": "2:24:30", "throughput": 2317.63, "total_tokens": 18629072} {"current_steps": 32305, "total_steps": 67140, "loss": 0.6891, "lr": 3.095114235457533e-05, "epoch": 4.811587727137325, "percentage": 48.12, "elapsed_time": "2:13:59", "remaining_time": "2:24:28", "throughput": 2317.66, "total_tokens": 18631952} {"current_steps": 32310, "total_steps": 67140, "loss": 0.794, "lr": 3.094483012668189e-05, "epoch": 4.8123324396782845, "percentage": 48.12, "elapsed_time": "2:14:00", "remaining_time": "2:24:27", "throughput": 2317.7, "total_tokens": 18634928} {"current_steps": 32315, "total_steps": 67140, "loss": 0.7127, "lr": 3.093851749706101e-05, "epoch": 4.813077152219243, "percentage": 48.13, "elapsed_time": "2:14:01", "remaining_time": "2:24:25", "throughput": 2317.72, "total_tokens": 18637648} {"current_steps": 32320, "total_steps": 67140, "loss": 0.5293, "lr": 3.093220446613926e-05, "epoch": 4.813821864760203, "percentage": 48.14, "elapsed_time": "2:14:02", "remaining_time": "2:24:24", "throughput": 2317.74, "total_tokens": 18640368} {"current_steps": 32325, "total_steps": 67140, "loss": 0.5532, "lr": 3.092589103434324e-05, "epoch": 4.814566577301162, "percentage": 48.15, "elapsed_time": "2:14:03", "remaining_time": "2:24:23", "throughput": 2317.79, "total_tokens": 18643536} {"current_steps": 32330, "total_steps": 67140, "loss": 0.6639, "lr": 3.0919577202099606e-05, "epoch": 4.815311289842121, "percentage": 48.15, "elapsed_time": "2:14:04", "remaining_time": "2:24:21", "throughput": 2317.84, "total_tokens": 18646608} {"current_steps": 32335, "total_steps": 67140, "loss": 0.6853, "lr": 3.091326296983501e-05, "epoch": 4.81605600238308, "percentage": 48.16, "elapsed_time": "2:14:05", "remaining_time": "2:24:20", "throughput": 2317.87, "total_tokens": 18649456} {"current_steps": 32340, "total_steps": 67140, "loss": 0.6866, "lr": 3.0906948337976146e-05, "epoch": 4.816800714924039, "percentage": 48.17, "elapsed_time": "2:14:07", "remaining_time": "2:24:19", "throughput": 2317.91, "total_tokens": 18652368} {"current_steps": 32345, "total_steps": 67140, "loss": 0.6785, "lr": 3.090063330694972e-05, "epoch": 4.8175454274649985, "percentage": 48.18, "elapsed_time": "2:14:08", "remaining_time": "2:24:17", "throughput": 2317.94, "total_tokens": 18655312} {"current_steps": 32350, "total_steps": 67140, "loss": 0.66, "lr": 3.08943178771825e-05, "epoch": 4.818290140005958, "percentage": 48.18, "elapsed_time": "2:14:09", "remaining_time": "2:24:16", "throughput": 2317.97, "total_tokens": 18658128} {"current_steps": 32355, "total_steps": 67140, "loss": 0.6446, "lr": 3.088800204910123e-05, "epoch": 4.819034852546917, "percentage": 48.19, "elapsed_time": "2:14:10", "remaining_time": "2:24:15", "throughput": 2318.01, "total_tokens": 18661040} {"current_steps": 32360, "total_steps": 67140, "loss": 0.4625, "lr": 3.088168582313273e-05, "epoch": 4.819779565087876, "percentage": 48.2, "elapsed_time": "2:14:11", "remaining_time": "2:24:13", "throughput": 2318.01, "total_tokens": 18663632} {"current_steps": 32365, "total_steps": 67140, "loss": 0.4292, "lr": 3.087536919970381e-05, "epoch": 4.820524277628835, "percentage": 48.21, "elapsed_time": "2:14:12", "remaining_time": "2:24:12", "throughput": 2318.03, "total_tokens": 18666352} {"current_steps": 32370, "total_steps": 67140, "loss": 0.5658, "lr": 3.0869052179241334e-05, "epoch": 4.821268990169795, "percentage": 48.21, "elapsed_time": "2:14:13", "remaining_time": "2:24:10", "throughput": 2318.06, "total_tokens": 18669136} {"current_steps": 32375, "total_steps": 67140, "loss": 0.6442, "lr": 3.0862734762172164e-05, "epoch": 4.822013702710754, "percentage": 48.22, "elapsed_time": "2:14:14", "remaining_time": "2:24:09", "throughput": 2318.1, "total_tokens": 18672016} {"current_steps": 32380, "total_steps": 67140, "loss": 0.5396, "lr": 3.085641694892322e-05, "epoch": 4.8227584152517124, "percentage": 48.23, "elapsed_time": "2:14:16", "remaining_time": "2:24:08", "throughput": 2318.14, "total_tokens": 18675088} {"current_steps": 32385, "total_steps": 67140, "loss": 0.8758, "lr": 3.085009873992143e-05, "epoch": 4.823503127792672, "percentage": 48.24, "elapsed_time": "2:14:17", "remaining_time": "2:24:06", "throughput": 2318.18, "total_tokens": 18678000} {"current_steps": 32390, "total_steps": 67140, "loss": 0.6264, "lr": 3.084378013559374e-05, "epoch": 4.824247840333631, "percentage": 48.24, "elapsed_time": "2:14:18", "remaining_time": "2:24:05", "throughput": 2318.19, "total_tokens": 18680560} {"current_steps": 32395, "total_steps": 67140, "loss": 0.4967, "lr": 3.083746113636716e-05, "epoch": 4.8249925528745905, "percentage": 48.25, "elapsed_time": "2:14:19", "remaining_time": "2:24:04", "throughput": 2318.21, "total_tokens": 18683376} {"current_steps": 32400, "total_steps": 67140, "loss": 0.5788, "lr": 3.083114174266869e-05, "epoch": 4.825737265415549, "percentage": 48.26, "elapsed_time": "2:14:20", "remaining_time": "2:24:02", "throughput": 2318.27, "total_tokens": 18686608} {"current_steps": 32405, "total_steps": 67140, "loss": 0.665, "lr": 3.082482195492536e-05, "epoch": 4.826481977956509, "percentage": 48.26, "elapsed_time": "2:14:21", "remaining_time": "2:24:01", "throughput": 2318.33, "total_tokens": 18689776} {"current_steps": 32410, "total_steps": 67140, "loss": 0.6832, "lr": 3.081850177356425e-05, "epoch": 4.827226690497468, "percentage": 48.27, "elapsed_time": "2:14:22", "remaining_time": "2:24:00", "throughput": 2318.37, "total_tokens": 18692880} {"current_steps": 32415, "total_steps": 67140, "loss": 0.9709, "lr": 3.0812181199012455e-05, "epoch": 4.827971403038427, "percentage": 48.28, "elapsed_time": "2:14:24", "remaining_time": "2:23:58", "throughput": 2318.43, "total_tokens": 18696048} {"current_steps": 32420, "total_steps": 67140, "loss": 0.6484, "lr": 3.080586023169707e-05, "epoch": 4.828716115579386, "percentage": 48.29, "elapsed_time": "2:14:25", "remaining_time": "2:23:57", "throughput": 2318.46, "total_tokens": 18698992} {"current_steps": 32425, "total_steps": 67140, "loss": 0.7523, "lr": 3.079953887204527e-05, "epoch": 4.829460828120346, "percentage": 48.29, "elapsed_time": "2:14:26", "remaining_time": "2:23:56", "throughput": 2318.49, "total_tokens": 18701776} {"current_steps": 32430, "total_steps": 67140, "loss": 0.6338, "lr": 3.07932171204842e-05, "epoch": 4.8302055406613045, "percentage": 48.3, "elapsed_time": "2:14:27", "remaining_time": "2:23:54", "throughput": 2318.52, "total_tokens": 18704752} {"current_steps": 32435, "total_steps": 67140, "loss": 0.7865, "lr": 3.0786894977441074e-05, "epoch": 4.830950253202264, "percentage": 48.31, "elapsed_time": "2:14:28", "remaining_time": "2:23:53", "throughput": 2318.55, "total_tokens": 18707664} {"current_steps": 32440, "total_steps": 67140, "loss": 0.6808, "lr": 3.078057244334311e-05, "epoch": 4.831694965743223, "percentage": 48.32, "elapsed_time": "2:14:29", "remaining_time": "2:23:51", "throughput": 2318.57, "total_tokens": 18710320} {"current_steps": 32445, "total_steps": 67140, "loss": 0.6459, "lr": 3.077424951861757e-05, "epoch": 4.8324396782841825, "percentage": 48.32, "elapsed_time": "2:14:30", "remaining_time": "2:23:50", "throughput": 2318.62, "total_tokens": 18713456} {"current_steps": 32450, "total_steps": 67140, "loss": 0.5247, "lr": 3.0767926203691724e-05, "epoch": 4.833184390825141, "percentage": 48.33, "elapsed_time": "2:14:32", "remaining_time": "2:23:49", "throughput": 2318.64, "total_tokens": 18716304} {"current_steps": 32455, "total_steps": 67140, "loss": 0.7147, "lr": 3.076160249899286e-05, "epoch": 4.833929103366101, "percentage": 48.34, "elapsed_time": "2:14:33", "remaining_time": "2:23:47", "throughput": 2318.68, "total_tokens": 18719312} {"current_steps": 32460, "total_steps": 67140, "loss": 0.4679, "lr": 3.075527840494834e-05, "epoch": 4.83467381590706, "percentage": 48.35, "elapsed_time": "2:14:34", "remaining_time": "2:23:46", "throughput": 2318.71, "total_tokens": 18722128} {"current_steps": 32465, "total_steps": 67140, "loss": 0.7452, "lr": 3.074895392198551e-05, "epoch": 4.835418528448019, "percentage": 48.35, "elapsed_time": "2:14:35", "remaining_time": "2:23:45", "throughput": 2318.75, "total_tokens": 18725136} {"current_steps": 32470, "total_steps": 67140, "loss": 0.4785, "lr": 3.074262905053173e-05, "epoch": 4.836163240988978, "percentage": 48.36, "elapsed_time": "2:14:36", "remaining_time": "2:23:43", "throughput": 2318.82, "total_tokens": 18728432} {"current_steps": 32475, "total_steps": 67140, "loss": 0.7737, "lr": 3.073630379101443e-05, "epoch": 4.836907953529938, "percentage": 48.37, "elapsed_time": "2:14:37", "remaining_time": "2:23:42", "throughput": 2318.86, "total_tokens": 18731408} {"current_steps": 32480, "total_steps": 67140, "loss": 0.6668, "lr": 3.072997814386106e-05, "epoch": 4.8376526660708965, "percentage": 48.38, "elapsed_time": "2:14:39", "remaining_time": "2:23:41", "throughput": 2318.89, "total_tokens": 18734320} {"current_steps": 32485, "total_steps": 67140, "loss": 0.6916, "lr": 3.0723652109499046e-05, "epoch": 4.838397378611856, "percentage": 48.38, "elapsed_time": "2:14:40", "remaining_time": "2:23:39", "throughput": 2318.91, "total_tokens": 18737104} {"current_steps": 32490, "total_steps": 67140, "loss": 0.5826, "lr": 3.0717325688355893e-05, "epoch": 4.839142091152815, "percentage": 48.39, "elapsed_time": "2:14:41", "remaining_time": "2:23:38", "throughput": 2318.95, "total_tokens": 18740144} {"current_steps": 32495, "total_steps": 67140, "loss": 0.523, "lr": 3.071099888085911e-05, "epoch": 4.8398868036937746, "percentage": 48.4, "elapsed_time": "2:14:42", "remaining_time": "2:23:37", "throughput": 2318.98, "total_tokens": 18742928} {"current_steps": 32500, "total_steps": 67140, "loss": 0.6258, "lr": 3.070467168743626e-05, "epoch": 4.840631516234733, "percentage": 48.41, "elapsed_time": "2:14:43", "remaining_time": "2:23:35", "throughput": 2318.99, "total_tokens": 18745680} {"current_steps": 32505, "total_steps": 67140, "loss": 0.4963, "lr": 3.0698344108514886e-05, "epoch": 4.841376228775693, "percentage": 48.41, "elapsed_time": "2:14:44", "remaining_time": "2:23:34", "throughput": 2319.02, "total_tokens": 18748560} {"current_steps": 32510, "total_steps": 67140, "loss": 0.6481, "lr": 3.069201614452258e-05, "epoch": 4.842120941316652, "percentage": 48.42, "elapsed_time": "2:14:45", "remaining_time": "2:23:33", "throughput": 2319.05, "total_tokens": 18751440} {"current_steps": 32515, "total_steps": 67140, "loss": 0.5542, "lr": 3.0685687795886964e-05, "epoch": 4.842865653857611, "percentage": 48.43, "elapsed_time": "2:14:46", "remaining_time": "2:23:31", "throughput": 2319.1, "total_tokens": 18754544} {"current_steps": 32520, "total_steps": 67140, "loss": 0.688, "lr": 3.067935906303568e-05, "epoch": 4.84361036639857, "percentage": 48.44, "elapsed_time": "2:14:48", "remaining_time": "2:23:30", "throughput": 2319.11, "total_tokens": 18757232} {"current_steps": 32525, "total_steps": 67140, "loss": 0.6011, "lr": 3.0673029946396406e-05, "epoch": 4.844355078939529, "percentage": 48.44, "elapsed_time": "2:14:49", "remaining_time": "2:23:29", "throughput": 2319.12, "total_tokens": 18759824} {"current_steps": 32530, "total_steps": 67140, "loss": 0.6704, "lr": 3.0666700446396835e-05, "epoch": 4.8450997914804885, "percentage": 48.45, "elapsed_time": "2:14:50", "remaining_time": "2:23:27", "throughput": 2319.16, "total_tokens": 18762864} {"current_steps": 32535, "total_steps": 67140, "loss": 0.5842, "lr": 3.0660370563464694e-05, "epoch": 4.845844504021448, "percentage": 48.46, "elapsed_time": "2:14:51", "remaining_time": "2:23:26", "throughput": 2319.18, "total_tokens": 18765584} {"current_steps": 32540, "total_steps": 67140, "loss": 0.6085, "lr": 3.065404029802771e-05, "epoch": 4.846589216562407, "percentage": 48.47, "elapsed_time": "2:14:52", "remaining_time": "2:23:24", "throughput": 2319.23, "total_tokens": 18768752} {"current_steps": 32545, "total_steps": 67140, "loss": 0.6375, "lr": 3.064770965051367e-05, "epoch": 4.847333929103366, "percentage": 48.47, "elapsed_time": "2:14:53", "remaining_time": "2:23:23", "throughput": 2319.27, "total_tokens": 18771856} {"current_steps": 32550, "total_steps": 67140, "loss": 0.5079, "lr": 3.0641378621350384e-05, "epoch": 4.848078641644325, "percentage": 48.48, "elapsed_time": "2:14:54", "remaining_time": "2:23:22", "throughput": 2319.3, "total_tokens": 18774640} {"current_steps": 32555, "total_steps": 67140, "loss": 0.4786, "lr": 3.063504721096566e-05, "epoch": 4.848823354185284, "percentage": 48.49, "elapsed_time": "2:14:56", "remaining_time": "2:23:20", "throughput": 2319.32, "total_tokens": 18777424} {"current_steps": 32560, "total_steps": 67140, "loss": 0.7043, "lr": 3.0628715419787355e-05, "epoch": 4.849568066726244, "percentage": 48.5, "elapsed_time": "2:14:57", "remaining_time": "2:23:19", "throughput": 2319.34, "total_tokens": 18780208} {"current_steps": 32565, "total_steps": 67140, "loss": 0.5278, "lr": 3.062238324824336e-05, "epoch": 4.8503127792672025, "percentage": 48.5, "elapsed_time": "2:14:58", "remaining_time": "2:23:18", "throughput": 2319.38, "total_tokens": 18783152} {"current_steps": 32570, "total_steps": 67140, "loss": 0.5873, "lr": 3.061605069676155e-05, "epoch": 4.851057491808162, "percentage": 48.51, "elapsed_time": "2:14:59", "remaining_time": "2:23:16", "throughput": 2319.43, "total_tokens": 18786288} {"current_steps": 32575, "total_steps": 67140, "loss": 0.5549, "lr": 3.0609717765769866e-05, "epoch": 4.851802204349121, "percentage": 48.52, "elapsed_time": "2:15:00", "remaining_time": "2:23:15", "throughput": 2319.46, "total_tokens": 18789136} {"current_steps": 32580, "total_steps": 67140, "loss": 0.6352, "lr": 3.060338445569627e-05, "epoch": 4.8525469168900806, "percentage": 48.53, "elapsed_time": "2:15:01", "remaining_time": "2:23:14", "throughput": 2319.49, "total_tokens": 18792016} {"current_steps": 32585, "total_steps": 67140, "loss": 0.5657, "lr": 3.059705076696873e-05, "epoch": 4.853291629431039, "percentage": 48.53, "elapsed_time": "2:15:02", "remaining_time": "2:23:12", "throughput": 2319.52, "total_tokens": 18794896} {"current_steps": 32590, "total_steps": 67140, "loss": 0.6695, "lr": 3.059071670001526e-05, "epoch": 4.854036341971999, "percentage": 48.54, "elapsed_time": "2:15:04", "remaining_time": "2:23:11", "throughput": 2319.53, "total_tokens": 18797552} {"current_steps": 32595, "total_steps": 67140, "loss": 0.5223, "lr": 3.058438225526388e-05, "epoch": 4.854781054512958, "percentage": 48.55, "elapsed_time": "2:15:05", "remaining_time": "2:23:09", "throughput": 2319.54, "total_tokens": 18800080} {"current_steps": 32600, "total_steps": 67140, "loss": 0.6286, "lr": 3.057804743314266e-05, "epoch": 4.855525767053917, "percentage": 48.56, "elapsed_time": "2:15:06", "remaining_time": "2:23:08", "throughput": 2319.57, "total_tokens": 18803056} {"current_steps": 32605, "total_steps": 67140, "loss": 0.6837, "lr": 3.0571712234079666e-05, "epoch": 4.856270479594876, "percentage": 48.56, "elapsed_time": "2:15:07", "remaining_time": "2:23:07", "throughput": 2319.6, "total_tokens": 18806000} {"current_steps": 32610, "total_steps": 67140, "loss": 0.6023, "lr": 3.0565376658503e-05, "epoch": 4.857015192135836, "percentage": 48.57, "elapsed_time": "2:15:08", "remaining_time": "2:23:05", "throughput": 2319.62, "total_tokens": 18808752} {"current_steps": 32615, "total_steps": 67140, "loss": 0.6648, "lr": 3.055904070684082e-05, "epoch": 4.8577599046767945, "percentage": 48.58, "elapsed_time": "2:15:09", "remaining_time": "2:23:04", "throughput": 2319.62, "total_tokens": 18811248} {"current_steps": 32620, "total_steps": 67140, "loss": 0.6813, "lr": 3.055270437952127e-05, "epoch": 4.858504617217754, "percentage": 48.59, "elapsed_time": "2:15:10", "remaining_time": "2:23:03", "throughput": 2319.68, "total_tokens": 18814544} {"current_steps": 32625, "total_steps": 67140, "loss": 0.7692, "lr": 3.054636767697254e-05, "epoch": 4.859249329758713, "percentage": 48.59, "elapsed_time": "2:15:11", "remaining_time": "2:23:01", "throughput": 2319.72, "total_tokens": 18817392} {"current_steps": 32630, "total_steps": 67140, "loss": 0.6398, "lr": 3.054003059962283e-05, "epoch": 4.859994042299673, "percentage": 48.6, "elapsed_time": "2:15:13", "remaining_time": "2:23:00", "throughput": 2319.75, "total_tokens": 18820336} {"current_steps": 32635, "total_steps": 67140, "loss": 0.6547, "lr": 3.0533693147900365e-05, "epoch": 4.860738754840631, "percentage": 48.61, "elapsed_time": "2:15:14", "remaining_time": "2:22:59", "throughput": 2319.78, "total_tokens": 18823184} {"current_steps": 32640, "total_steps": 67140, "loss": 0.7146, "lr": 3.052735532223342e-05, "epoch": 4.861483467381591, "percentage": 48.61, "elapsed_time": "2:15:15", "remaining_time": "2:22:57", "throughput": 2319.83, "total_tokens": 18826288} {"current_steps": 32645, "total_steps": 67140, "loss": 0.6813, "lr": 3.052101712305028e-05, "epoch": 4.86222817992255, "percentage": 48.62, "elapsed_time": "2:15:16", "remaining_time": "2:22:56", "throughput": 2319.84, "total_tokens": 18828944} {"current_steps": 32650, "total_steps": 67140, "loss": 0.6263, "lr": 3.051467855077925e-05, "epoch": 4.862972892463509, "percentage": 48.63, "elapsed_time": "2:15:17", "remaining_time": "2:22:55", "throughput": 2319.87, "total_tokens": 18831824} {"current_steps": 32655, "total_steps": 67140, "loss": 0.6697, "lr": 3.050833960584866e-05, "epoch": 4.863717605004468, "percentage": 48.64, "elapsed_time": "2:15:18", "remaining_time": "2:22:53", "throughput": 2319.9, "total_tokens": 18834736} {"current_steps": 32660, "total_steps": 67140, "loss": 0.4949, "lr": 3.0502000288686877e-05, "epoch": 4.864462317545428, "percentage": 48.64, "elapsed_time": "2:15:19", "remaining_time": "2:22:52", "throughput": 2319.93, "total_tokens": 18837648} {"current_steps": 32665, "total_steps": 67140, "loss": 0.6547, "lr": 3.0495660599722292e-05, "epoch": 4.8652070300863866, "percentage": 48.65, "elapsed_time": "2:15:21", "remaining_time": "2:22:51", "throughput": 2319.98, "total_tokens": 18840848} {"current_steps": 32670, "total_steps": 67140, "loss": 0.7548, "lr": 3.0489320539383294e-05, "epoch": 4.865951742627346, "percentage": 48.66, "elapsed_time": "2:15:22", "remaining_time": "2:22:49", "throughput": 2320.0, "total_tokens": 18843568} {"current_steps": 32675, "total_steps": 67140, "loss": 0.5744, "lr": 3.0482980108098336e-05, "epoch": 4.866696455168305, "percentage": 48.67, "elapsed_time": "2:15:23", "remaining_time": "2:22:48", "throughput": 2320.02, "total_tokens": 18846256} {"current_steps": 32680, "total_steps": 67140, "loss": 0.5686, "lr": 3.0476639306295874e-05, "epoch": 4.867441167709265, "percentage": 48.67, "elapsed_time": "2:15:24", "remaining_time": "2:22:46", "throughput": 2320.04, "total_tokens": 18848976} {"current_steps": 32685, "total_steps": 67140, "loss": 0.3974, "lr": 3.0470298134404403e-05, "epoch": 4.868185880250223, "percentage": 48.68, "elapsed_time": "2:15:25", "remaining_time": "2:22:45", "throughput": 2320.05, "total_tokens": 18851600} {"current_steps": 32690, "total_steps": 67140, "loss": 0.5759, "lr": 3.0463956592852412e-05, "epoch": 4.868930592791182, "percentage": 48.69, "elapsed_time": "2:15:26", "remaining_time": "2:22:44", "throughput": 2320.07, "total_tokens": 18854384} {"current_steps": 32695, "total_steps": 67140, "loss": 0.7465, "lr": 3.0457614682068452e-05, "epoch": 4.869675305332142, "percentage": 48.7, "elapsed_time": "2:15:27", "remaining_time": "2:22:42", "throughput": 2320.09, "total_tokens": 18857168} {"current_steps": 32700, "total_steps": 67140, "loss": 0.6904, "lr": 3.0451272402481086e-05, "epoch": 4.870420017873101, "percentage": 48.7, "elapsed_time": "2:15:28", "remaining_time": "2:22:41", "throughput": 2320.1, "total_tokens": 18859792} {"current_steps": 32705, "total_steps": 67140, "loss": 0.5732, "lr": 3.044492975451889e-05, "epoch": 4.87116473041406, "percentage": 48.71, "elapsed_time": "2:15:29", "remaining_time": "2:22:40", "throughput": 2320.14, "total_tokens": 18862704} {"current_steps": 32710, "total_steps": 67140, "loss": 0.5422, "lr": 3.0438586738610482e-05, "epoch": 4.871909442955019, "percentage": 48.72, "elapsed_time": "2:15:31", "remaining_time": "2:22:38", "throughput": 2320.17, "total_tokens": 18865616} {"current_steps": 32715, "total_steps": 67140, "loss": 0.4807, "lr": 3.0432243355184494e-05, "epoch": 4.872654155495979, "percentage": 48.73, "elapsed_time": "2:15:32", "remaining_time": "2:22:37", "throughput": 2320.18, "total_tokens": 18868336} {"current_steps": 32720, "total_steps": 67140, "loss": 0.6492, "lr": 3.0425899604669577e-05, "epoch": 4.873398868036938, "percentage": 48.73, "elapsed_time": "2:15:33", "remaining_time": "2:22:35", "throughput": 2320.2, "total_tokens": 18871024} {"current_steps": 32725, "total_steps": 67140, "loss": 0.525, "lr": 3.041955548749444e-05, "epoch": 4.874143580577897, "percentage": 48.74, "elapsed_time": "2:15:34", "remaining_time": "2:22:34", "throughput": 2320.24, "total_tokens": 18874000} {"current_steps": 32730, "total_steps": 67140, "loss": 0.5099, "lr": 3.0413211004087773e-05, "epoch": 4.874888293118856, "percentage": 48.75, "elapsed_time": "2:15:35", "remaining_time": "2:22:33", "throughput": 2320.26, "total_tokens": 18876848} {"current_steps": 32735, "total_steps": 67140, "loss": 0.6108, "lr": 3.0406866154878306e-05, "epoch": 4.875633005659815, "percentage": 48.76, "elapsed_time": "2:15:36", "remaining_time": "2:22:31", "throughput": 2320.3, "total_tokens": 18879888} {"current_steps": 32740, "total_steps": 67140, "loss": 0.5672, "lr": 3.0400520940294808e-05, "epoch": 4.876377718200774, "percentage": 48.76, "elapsed_time": "2:15:37", "remaining_time": "2:22:30", "throughput": 2320.35, "total_tokens": 18882992} {"current_steps": 32745, "total_steps": 67140, "loss": 0.7088, "lr": 3.039417536076607e-05, "epoch": 4.877122430741734, "percentage": 48.77, "elapsed_time": "2:15:39", "remaining_time": "2:22:29", "throughput": 2320.39, "total_tokens": 18886000} {"current_steps": 32750, "total_steps": 67140, "loss": 0.6055, "lr": 3.0387829416720888e-05, "epoch": 4.8778671432826926, "percentage": 48.78, "elapsed_time": "2:15:40", "remaining_time": "2:22:27", "throughput": 2320.42, "total_tokens": 18888912} {"current_steps": 32755, "total_steps": 67140, "loss": 0.4931, "lr": 3.0381483108588093e-05, "epoch": 4.878611855823652, "percentage": 48.79, "elapsed_time": "2:15:41", "remaining_time": "2:22:26", "throughput": 2320.44, "total_tokens": 18891632} {"current_steps": 32760, "total_steps": 67140, "loss": 0.5644, "lr": 3.037513643679656e-05, "epoch": 4.879356568364611, "percentage": 48.79, "elapsed_time": "2:15:42", "remaining_time": "2:22:25", "throughput": 2320.44, "total_tokens": 18894160} {"current_steps": 32765, "total_steps": 67140, "loss": 0.5379, "lr": 3.036878940177516e-05, "epoch": 4.880101280905571, "percentage": 48.8, "elapsed_time": "2:15:43", "remaining_time": "2:22:23", "throughput": 2320.5, "total_tokens": 18897360} {"current_steps": 32770, "total_steps": 67140, "loss": 0.8433, "lr": 3.0362442003952795e-05, "epoch": 4.880845993446529, "percentage": 48.81, "elapsed_time": "2:15:44", "remaining_time": "2:22:22", "throughput": 2320.52, "total_tokens": 18900176} {"current_steps": 32775, "total_steps": 67140, "loss": 0.6246, "lr": 3.03560942437584e-05, "epoch": 4.881590705987489, "percentage": 48.82, "elapsed_time": "2:15:45", "remaining_time": "2:22:21", "throughput": 2320.53, "total_tokens": 18902768} {"current_steps": 32780, "total_steps": 67140, "loss": 0.8031, "lr": 3.0349746121620935e-05, "epoch": 4.882335418528448, "percentage": 48.82, "elapsed_time": "2:15:46", "remaining_time": "2:22:19", "throughput": 2320.55, "total_tokens": 18905424} {"current_steps": 32785, "total_steps": 67140, "loss": 0.6459, "lr": 3.034339763796938e-05, "epoch": 4.883080131069407, "percentage": 48.83, "elapsed_time": "2:15:48", "remaining_time": "2:22:18", "throughput": 2320.56, "total_tokens": 18908144} {"current_steps": 32790, "total_steps": 67140, "loss": 0.4886, "lr": 3.033704879323273e-05, "epoch": 4.883824843610366, "percentage": 48.84, "elapsed_time": "2:15:49", "remaining_time": "2:22:16", "throughput": 2320.58, "total_tokens": 18910864} {"current_steps": 32795, "total_steps": 67140, "loss": 0.795, "lr": 3.0330699587840027e-05, "epoch": 4.884569556151326, "percentage": 48.85, "elapsed_time": "2:15:50", "remaining_time": "2:22:15", "throughput": 2320.61, "total_tokens": 18913808} {"current_steps": 32800, "total_steps": 67140, "loss": 0.6359, "lr": 3.0324350022220317e-05, "epoch": 4.885314268692285, "percentage": 48.85, "elapsed_time": "2:15:51", "remaining_time": "2:22:14", "throughput": 2320.65, "total_tokens": 18916752} {"current_steps": 32805, "total_steps": 67140, "loss": 0.626, "lr": 3.0318000096802686e-05, "epoch": 4.886058981233244, "percentage": 48.86, "elapsed_time": "2:15:52", "remaining_time": "2:22:12", "throughput": 2320.67, "total_tokens": 18919568} {"current_steps": 32810, "total_steps": 67140, "loss": 0.8141, "lr": 3.031164981201622e-05, "epoch": 4.886803693774203, "percentage": 48.87, "elapsed_time": "2:15:53", "remaining_time": "2:22:11", "throughput": 2320.7, "total_tokens": 18922448} {"current_steps": 32815, "total_steps": 67140, "loss": 0.6966, "lr": 3.0305299168290064e-05, "epoch": 4.887548406315163, "percentage": 48.88, "elapsed_time": "2:15:54", "remaining_time": "2:22:10", "throughput": 2320.73, "total_tokens": 18925360} {"current_steps": 32820, "total_steps": 67140, "loss": 0.6802, "lr": 3.0298948166053352e-05, "epoch": 4.888293118856121, "percentage": 48.88, "elapsed_time": "2:15:56", "remaining_time": "2:22:08", "throughput": 2320.78, "total_tokens": 18928496} {"current_steps": 32825, "total_steps": 67140, "loss": 0.5197, "lr": 3.0292596805735274e-05, "epoch": 4.889037831397081, "percentage": 48.89, "elapsed_time": "2:15:57", "remaining_time": "2:22:07", "throughput": 2320.79, "total_tokens": 18931120} {"current_steps": 32830, "total_steps": 67140, "loss": 0.6142, "lr": 3.028624508776502e-05, "epoch": 4.88978254393804, "percentage": 48.9, "elapsed_time": "2:15:58", "remaining_time": "2:22:06", "throughput": 2320.83, "total_tokens": 18934192} {"current_steps": 32835, "total_steps": 67140, "loss": 0.8231, "lr": 3.0279893012571807e-05, "epoch": 4.890527256478999, "percentage": 48.91, "elapsed_time": "2:15:59", "remaining_time": "2:22:04", "throughput": 2320.85, "total_tokens": 18936880} {"current_steps": 32840, "total_steps": 67140, "loss": 0.7263, "lr": 3.0273540580584897e-05, "epoch": 4.891271969019958, "percentage": 48.91, "elapsed_time": "2:16:00", "remaining_time": "2:22:03", "throughput": 2320.89, "total_tokens": 18939856} {"current_steps": 32845, "total_steps": 67140, "loss": 0.8514, "lr": 3.026718779223356e-05, "epoch": 4.892016681560918, "percentage": 48.92, "elapsed_time": "2:16:01", "remaining_time": "2:22:02", "throughput": 2320.9, "total_tokens": 18942544} {"current_steps": 32850, "total_steps": 67140, "loss": 0.6034, "lr": 3.0260834647947085e-05, "epoch": 4.892761394101877, "percentage": 48.93, "elapsed_time": "2:16:02", "remaining_time": "2:22:00", "throughput": 2320.95, "total_tokens": 18945680} {"current_steps": 32855, "total_steps": 67140, "loss": 0.5911, "lr": 3.0254481148154788e-05, "epoch": 4.893506106642836, "percentage": 48.94, "elapsed_time": "2:16:04", "remaining_time": "2:21:59", "throughput": 2320.99, "total_tokens": 18948656} {"current_steps": 32860, "total_steps": 67140, "loss": 0.6397, "lr": 3.0248127293286022e-05, "epoch": 4.894250819183795, "percentage": 48.94, "elapsed_time": "2:16:05", "remaining_time": "2:21:58", "throughput": 2321.0, "total_tokens": 18951312} {"current_steps": 32865, "total_steps": 67140, "loss": 0.7699, "lr": 3.0241773083770154e-05, "epoch": 4.894995531724755, "percentage": 48.95, "elapsed_time": "2:16:06", "remaining_time": "2:21:56", "throughput": 2321.04, "total_tokens": 18954384} {"current_steps": 32870, "total_steps": 67140, "loss": 0.5965, "lr": 3.0235418520036567e-05, "epoch": 4.895740244265713, "percentage": 48.96, "elapsed_time": "2:16:07", "remaining_time": "2:21:55", "throughput": 2321.08, "total_tokens": 18957360} {"current_steps": 32875, "total_steps": 67140, "loss": 0.606, "lr": 3.0229063602514678e-05, "epoch": 4.896484956806672, "percentage": 48.96, "elapsed_time": "2:16:08", "remaining_time": "2:21:53", "throughput": 2321.1, "total_tokens": 18960112} {"current_steps": 32880, "total_steps": 67140, "loss": 0.6879, "lr": 3.022270833163394e-05, "epoch": 4.897229669347632, "percentage": 48.97, "elapsed_time": "2:16:09", "remaining_time": "2:21:52", "throughput": 2321.12, "total_tokens": 18962864} {"current_steps": 32885, "total_steps": 67140, "loss": 0.6108, "lr": 3.0216352707823807e-05, "epoch": 4.8979743818885915, "percentage": 48.98, "elapsed_time": "2:16:10", "remaining_time": "2:21:51", "throughput": 2321.14, "total_tokens": 18965552} {"current_steps": 32890, "total_steps": 67140, "loss": 0.7792, "lr": 3.0209996731513757e-05, "epoch": 4.89871909442955, "percentage": 48.99, "elapsed_time": "2:16:11", "remaining_time": "2:21:49", "throughput": 2321.18, "total_tokens": 18968592} {"current_steps": 32895, "total_steps": 67140, "loss": 0.5806, "lr": 3.020364040313332e-05, "epoch": 4.899463806970509, "percentage": 48.99, "elapsed_time": "2:16:13", "remaining_time": "2:21:48", "throughput": 2321.22, "total_tokens": 18971568} {"current_steps": 32900, "total_steps": 67140, "loss": 0.7033, "lr": 3.0197283723112013e-05, "epoch": 4.900208519511469, "percentage": 49.0, "elapsed_time": "2:16:14", "remaining_time": "2:21:47", "throughput": 2321.24, "total_tokens": 18974288} {"current_steps": 32905, "total_steps": 67140, "loss": 0.6561, "lr": 3.0190926691879412e-05, "epoch": 4.900953232052427, "percentage": 49.01, "elapsed_time": "2:16:15", "remaining_time": "2:21:45", "throughput": 2321.26, "total_tokens": 18977008} {"current_steps": 32910, "total_steps": 67140, "loss": 0.7421, "lr": 3.018456930986508e-05, "epoch": 4.901697944593387, "percentage": 49.02, "elapsed_time": "2:16:16", "remaining_time": "2:21:44", "throughput": 2321.28, "total_tokens": 18979824} {"current_steps": 32915, "total_steps": 67140, "loss": 0.5024, "lr": 3.017821157749864e-05, "epoch": 4.902442657134346, "percentage": 49.02, "elapsed_time": "2:16:17", "remaining_time": "2:21:43", "throughput": 2321.3, "total_tokens": 18982544} {"current_steps": 32920, "total_steps": 67140, "loss": 0.6602, "lr": 3.0171853495209708e-05, "epoch": 4.903187369675305, "percentage": 49.03, "elapsed_time": "2:16:18", "remaining_time": "2:21:41", "throughput": 2321.3, "total_tokens": 18985072} {"current_steps": 32925, "total_steps": 67140, "loss": 0.5522, "lr": 3.0165495063427952e-05, "epoch": 4.903932082216264, "percentage": 49.04, "elapsed_time": "2:16:19", "remaining_time": "2:21:40", "throughput": 2321.33, "total_tokens": 18987984} {"current_steps": 32930, "total_steps": 67140, "loss": 0.4827, "lr": 3.0159136282583038e-05, "epoch": 4.904676794757224, "percentage": 49.05, "elapsed_time": "2:16:20", "remaining_time": "2:21:38", "throughput": 2321.36, "total_tokens": 18990800} {"current_steps": 32935, "total_steps": 67140, "loss": 0.443, "lr": 3.0152777153104665e-05, "epoch": 4.905421507298183, "percentage": 49.05, "elapsed_time": "2:16:22", "remaining_time": "2:21:37", "throughput": 2321.39, "total_tokens": 18993808} {"current_steps": 32940, "total_steps": 67140, "loss": 0.554, "lr": 3.014641767542256e-05, "epoch": 4.906166219839142, "percentage": 49.06, "elapsed_time": "2:16:23", "remaining_time": "2:21:36", "throughput": 2321.43, "total_tokens": 18996784} {"current_steps": 32945, "total_steps": 67140, "loss": 0.6326, "lr": 3.014005784996648e-05, "epoch": 4.906910932380101, "percentage": 49.07, "elapsed_time": "2:16:24", "remaining_time": "2:21:34", "throughput": 2321.47, "total_tokens": 18999888} {"current_steps": 32950, "total_steps": 67140, "loss": 0.5233, "lr": 3.013369767716619e-05, "epoch": 4.907655644921061, "percentage": 49.08, "elapsed_time": "2:16:25", "remaining_time": "2:21:33", "throughput": 2321.5, "total_tokens": 19002704} {"current_steps": 32955, "total_steps": 67140, "loss": 0.5987, "lr": 3.0127337157451475e-05, "epoch": 4.908400357462019, "percentage": 49.08, "elapsed_time": "2:16:26", "remaining_time": "2:21:32", "throughput": 2321.52, "total_tokens": 19005520} {"current_steps": 32960, "total_steps": 67140, "loss": 0.4594, "lr": 3.0120976291252167e-05, "epoch": 4.909145070002979, "percentage": 49.09, "elapsed_time": "2:16:27", "remaining_time": "2:21:30", "throughput": 2321.56, "total_tokens": 19008528} {"current_steps": 32965, "total_steps": 67140, "loss": 0.5718, "lr": 3.0114615078998103e-05, "epoch": 4.909889782543938, "percentage": 49.1, "elapsed_time": "2:16:28", "remaining_time": "2:21:29", "throughput": 2321.61, "total_tokens": 19011568} {"current_steps": 32970, "total_steps": 67140, "loss": 0.8662, "lr": 3.010825352111914e-05, "epoch": 4.9106344950848975, "percentage": 49.11, "elapsed_time": "2:16:30", "remaining_time": "2:21:28", "throughput": 2321.63, "total_tokens": 19014448} {"current_steps": 32975, "total_steps": 67140, "loss": 0.7691, "lr": 3.0101891618045175e-05, "epoch": 4.911379207625856, "percentage": 49.11, "elapsed_time": "2:16:31", "remaining_time": "2:21:26", "throughput": 2321.66, "total_tokens": 19017328} {"current_steps": 32980, "total_steps": 67140, "loss": 0.7776, "lr": 3.009552937020612e-05, "epoch": 4.912123920166816, "percentage": 49.12, "elapsed_time": "2:16:32", "remaining_time": "2:21:25", "throughput": 2321.68, "total_tokens": 19020016} {"current_steps": 32985, "total_steps": 67140, "loss": 0.5797, "lr": 3.008916677803191e-05, "epoch": 4.912868632707775, "percentage": 49.13, "elapsed_time": "2:16:33", "remaining_time": "2:21:24", "throughput": 2321.73, "total_tokens": 19023120} {"current_steps": 32990, "total_steps": 67140, "loss": 0.3382, "lr": 3.008280384195249e-05, "epoch": 4.913613345248734, "percentage": 49.14, "elapsed_time": "2:16:34", "remaining_time": "2:21:22", "throughput": 2321.75, "total_tokens": 19025936} {"current_steps": 32995, "total_steps": 67140, "loss": 0.5314, "lr": 3.0076440562397857e-05, "epoch": 4.914358057789693, "percentage": 49.14, "elapsed_time": "2:16:35", "remaining_time": "2:21:21", "throughput": 2321.84, "total_tokens": 19029584} {"current_steps": 33000, "total_steps": 67140, "loss": 0.7045, "lr": 3.007007693979801e-05, "epoch": 4.915102770330653, "percentage": 49.15, "elapsed_time": "2:16:37", "remaining_time": "2:21:20", "throughput": 2321.87, "total_tokens": 19032496} {"current_steps": 33005, "total_steps": 67140, "loss": 0.6924, "lr": 3.006371297458297e-05, "epoch": 4.915847482871611, "percentage": 49.16, "elapsed_time": "2:16:38", "remaining_time": "2:21:18", "throughput": 2321.91, "total_tokens": 19035408} {"current_steps": 33010, "total_steps": 67140, "loss": 0.803, "lr": 3.0057348667182806e-05, "epoch": 4.916592195412571, "percentage": 49.17, "elapsed_time": "2:16:39", "remaining_time": "2:21:17", "throughput": 2321.94, "total_tokens": 19038288} {"current_steps": 33015, "total_steps": 67140, "loss": 0.6127, "lr": 3.005098401802758e-05, "epoch": 4.91733690795353, "percentage": 49.17, "elapsed_time": "2:16:40", "remaining_time": "2:21:16", "throughput": 2321.97, "total_tokens": 19041296} {"current_steps": 33020, "total_steps": 67140, "loss": 0.6553, "lr": 3.0044619027547384e-05, "epoch": 4.9180816204944895, "percentage": 49.18, "elapsed_time": "2:16:41", "remaining_time": "2:21:14", "throughput": 2322.02, "total_tokens": 19044368} {"current_steps": 33025, "total_steps": 67140, "loss": 0.6759, "lr": 3.0038253696172342e-05, "epoch": 4.918826333035448, "percentage": 49.19, "elapsed_time": "2:16:42", "remaining_time": "2:21:13", "throughput": 2322.05, "total_tokens": 19047216} {"current_steps": 33030, "total_steps": 67140, "loss": 0.6676, "lr": 3.003188802433261e-05, "epoch": 4.919571045576408, "percentage": 49.2, "elapsed_time": "2:16:43", "remaining_time": "2:21:12", "throughput": 2322.08, "total_tokens": 19050128} {"current_steps": 33035, "total_steps": 67140, "loss": 0.7587, "lr": 3.0025522012458336e-05, "epoch": 4.920315758117367, "percentage": 49.2, "elapsed_time": "2:16:45", "remaining_time": "2:21:10", "throughput": 2322.13, "total_tokens": 19053264} {"current_steps": 33040, "total_steps": 67140, "loss": 0.7305, "lr": 3.0019155660979713e-05, "epoch": 4.921060470658325, "percentage": 49.21, "elapsed_time": "2:16:46", "remaining_time": "2:21:09", "throughput": 2322.16, "total_tokens": 19056112} {"current_steps": 33045, "total_steps": 67140, "loss": 0.8375, "lr": 3.0012788970326967e-05, "epoch": 4.921805183199285, "percentage": 49.22, "elapsed_time": "2:16:47", "remaining_time": "2:21:08", "throughput": 2322.21, "total_tokens": 19059216} {"current_steps": 33050, "total_steps": 67140, "loss": 0.6195, "lr": 3.000642194093032e-05, "epoch": 4.922549895740245, "percentage": 49.23, "elapsed_time": "2:16:48", "remaining_time": "2:21:06", "throughput": 2322.26, "total_tokens": 19062288} {"current_steps": 33055, "total_steps": 67140, "loss": 0.5986, "lr": 3.0000054573220028e-05, "epoch": 4.9232946082812035, "percentage": 49.23, "elapsed_time": "2:16:49", "remaining_time": "2:21:05", "throughput": 2322.28, "total_tokens": 19065104} {"current_steps": 33060, "total_steps": 67140, "loss": 0.692, "lr": 2.999368686762638e-05, "epoch": 4.924039320822162, "percentage": 49.24, "elapsed_time": "2:16:50", "remaining_time": "2:21:04", "throughput": 2322.31, "total_tokens": 19068048} {"current_steps": 33065, "total_steps": 67140, "loss": 0.6638, "lr": 2.998731882457967e-05, "epoch": 4.924784033363122, "percentage": 49.25, "elapsed_time": "2:16:51", "remaining_time": "2:21:02", "throughput": 2322.32, "total_tokens": 19070672} {"current_steps": 33070, "total_steps": 67140, "loss": 0.4685, "lr": 2.9980950444510236e-05, "epoch": 4.9255287459040815, "percentage": 49.26, "elapsed_time": "2:16:53", "remaining_time": "2:21:01", "throughput": 2322.37, "total_tokens": 19073808} {"current_steps": 33075, "total_steps": 67140, "loss": 0.8129, "lr": 2.9974581727848423e-05, "epoch": 4.92627345844504, "percentage": 49.26, "elapsed_time": "2:16:54", "remaining_time": "2:21:00", "throughput": 2322.4, "total_tokens": 19076720} {"current_steps": 33080, "total_steps": 67140, "loss": 0.6502, "lr": 2.9968212675024603e-05, "epoch": 4.927018170985999, "percentage": 49.27, "elapsed_time": "2:16:55", "remaining_time": "2:20:58", "throughput": 2322.42, "total_tokens": 19079536} {"current_steps": 33085, "total_steps": 67140, "loss": 0.6772, "lr": 2.9961843286469164e-05, "epoch": 4.927762883526959, "percentage": 49.28, "elapsed_time": "2:16:56", "remaining_time": "2:20:57", "throughput": 2322.46, "total_tokens": 19082416} {"current_steps": 33090, "total_steps": 67140, "loss": 0.5974, "lr": 2.9955473562612535e-05, "epoch": 4.928507596067917, "percentage": 49.29, "elapsed_time": "2:16:57", "remaining_time": "2:20:56", "throughput": 2322.49, "total_tokens": 19085360} {"current_steps": 33095, "total_steps": 67140, "loss": 0.6126, "lr": 2.994910350388515e-05, "epoch": 4.929252308608877, "percentage": 49.29, "elapsed_time": "2:16:58", "remaining_time": "2:20:54", "throughput": 2322.51, "total_tokens": 19088080} {"current_steps": 33100, "total_steps": 67140, "loss": 0.6683, "lr": 2.994273311071747e-05, "epoch": 4.929997021149836, "percentage": 49.3, "elapsed_time": "2:16:59", "remaining_time": "2:20:53", "throughput": 2322.52, "total_tokens": 19090736} {"current_steps": 33105, "total_steps": 67140, "loss": 0.6317, "lr": 2.9936362383539974e-05, "epoch": 4.9307417336907955, "percentage": 49.31, "elapsed_time": "2:17:00", "remaining_time": "2:20:51", "throughput": 2322.55, "total_tokens": 19093616} {"current_steps": 33110, "total_steps": 67140, "loss": 0.7628, "lr": 2.992999132278319e-05, "epoch": 4.931486446231754, "percentage": 49.31, "elapsed_time": "2:17:02", "remaining_time": "2:20:50", "throughput": 2322.57, "total_tokens": 19096368} {"current_steps": 33115, "total_steps": 67140, "loss": 0.5453, "lr": 2.9923619928877632e-05, "epoch": 4.932231158772714, "percentage": 49.32, "elapsed_time": "2:17:03", "remaining_time": "2:20:49", "throughput": 2322.6, "total_tokens": 19099280} {"current_steps": 33120, "total_steps": 67140, "loss": 0.6346, "lr": 2.9917248202253856e-05, "epoch": 4.932975871313673, "percentage": 49.33, "elapsed_time": "2:17:04", "remaining_time": "2:20:47", "throughput": 2322.61, "total_tokens": 19101936} {"current_steps": 33125, "total_steps": 67140, "loss": 0.6938, "lr": 2.9910876143342443e-05, "epoch": 4.933720583854632, "percentage": 49.34, "elapsed_time": "2:17:05", "remaining_time": "2:20:46", "throughput": 2322.62, "total_tokens": 19104592} {"current_steps": 33130, "total_steps": 67140, "loss": 0.7442, "lr": 2.9904503752573987e-05, "epoch": 4.934465296395591, "percentage": 49.34, "elapsed_time": "2:17:06", "remaining_time": "2:20:45", "throughput": 2322.65, "total_tokens": 19107376} {"current_steps": 33135, "total_steps": 67140, "loss": 0.6279, "lr": 2.98981310303791e-05, "epoch": 4.935210008936551, "percentage": 49.35, "elapsed_time": "2:17:07", "remaining_time": "2:20:43", "throughput": 2322.69, "total_tokens": 19110384} {"current_steps": 33140, "total_steps": 67140, "loss": 0.6018, "lr": 2.9891757977188433e-05, "epoch": 4.9359547214775095, "percentage": 49.36, "elapsed_time": "2:17:08", "remaining_time": "2:20:42", "throughput": 2322.71, "total_tokens": 19113168} {"current_steps": 33145, "total_steps": 67140, "loss": 0.782, "lr": 2.9885384593432658e-05, "epoch": 4.936699434018469, "percentage": 49.37, "elapsed_time": "2:17:09", "remaining_time": "2:20:40", "throughput": 2322.73, "total_tokens": 19115888} {"current_steps": 33150, "total_steps": 67140, "loss": 0.6025, "lr": 2.987901087954245e-05, "epoch": 4.937444146559428, "percentage": 49.37, "elapsed_time": "2:17:11", "remaining_time": "2:20:39", "throughput": 2322.75, "total_tokens": 19118800} {"current_steps": 33155, "total_steps": 67140, "loss": 0.5621, "lr": 2.987263683594852e-05, "epoch": 4.9381888591003875, "percentage": 49.38, "elapsed_time": "2:17:12", "remaining_time": "2:20:38", "throughput": 2322.79, "total_tokens": 19121712} {"current_steps": 33160, "total_steps": 67140, "loss": 0.5678, "lr": 2.986626246308161e-05, "epoch": 4.938933571641346, "percentage": 49.39, "elapsed_time": "2:17:13", "remaining_time": "2:20:36", "throughput": 2322.81, "total_tokens": 19124592} {"current_steps": 33165, "total_steps": 67140, "loss": 0.7106, "lr": 2.9859887761372464e-05, "epoch": 4.939678284182306, "percentage": 49.4, "elapsed_time": "2:17:14", "remaining_time": "2:20:35", "throughput": 2322.86, "total_tokens": 19127728} {"current_steps": 33170, "total_steps": 67140, "loss": 0.5567, "lr": 2.9853512731251866e-05, "epoch": 4.940422996723265, "percentage": 49.4, "elapsed_time": "2:17:15", "remaining_time": "2:20:34", "throughput": 2322.9, "total_tokens": 19130640} {"current_steps": 33175, "total_steps": 67140, "loss": 0.5742, "lr": 2.9847137373150602e-05, "epoch": 4.941167709264224, "percentage": 49.41, "elapsed_time": "2:17:16", "remaining_time": "2:20:32", "throughput": 2322.95, "total_tokens": 19133744} {"current_steps": 33180, "total_steps": 67140, "loss": 0.624, "lr": 2.9840761687499507e-05, "epoch": 4.941912421805183, "percentage": 49.42, "elapsed_time": "2:17:17", "remaining_time": "2:20:31", "throughput": 2322.95, "total_tokens": 19136368} {"current_steps": 33185, "total_steps": 67140, "loss": 0.5541, "lr": 2.9834385674729416e-05, "epoch": 4.942657134346143, "percentage": 49.43, "elapsed_time": "2:17:19", "remaining_time": "2:20:30", "throughput": 2322.98, "total_tokens": 19139120} {"current_steps": 33190, "total_steps": 67140, "loss": 0.7133, "lr": 2.98280093352712e-05, "epoch": 4.9434018468871015, "percentage": 49.43, "elapsed_time": "2:17:20", "remaining_time": "2:20:28", "throughput": 2323.0, "total_tokens": 19141936} {"current_steps": 33195, "total_steps": 67140, "loss": 0.5589, "lr": 2.9821632669555743e-05, "epoch": 4.944146559428061, "percentage": 49.44, "elapsed_time": "2:17:21", "remaining_time": "2:20:27", "throughput": 2323.05, "total_tokens": 19145104} {"current_steps": 33200, "total_steps": 67140, "loss": 0.748, "lr": 2.981525567801395e-05, "epoch": 4.94489127196902, "percentage": 49.45, "elapsed_time": "2:17:22", "remaining_time": "2:20:26", "throughput": 2323.08, "total_tokens": 19148048} {"current_steps": 33205, "total_steps": 67140, "loss": 0.6394, "lr": 2.9808878361076754e-05, "epoch": 4.945635984509979, "percentage": 49.46, "elapsed_time": "2:17:23", "remaining_time": "2:20:24", "throughput": 2323.12, "total_tokens": 19150928} {"current_steps": 33210, "total_steps": 67140, "loss": 0.744, "lr": 2.9802500719175107e-05, "epoch": 4.946380697050938, "percentage": 49.46, "elapsed_time": "2:17:24", "remaining_time": "2:20:23", "throughput": 2323.12, "total_tokens": 19153520} {"current_steps": 33215, "total_steps": 67140, "loss": 0.7368, "lr": 2.9796122752739997e-05, "epoch": 4.947125409591898, "percentage": 49.47, "elapsed_time": "2:17:25", "remaining_time": "2:20:22", "throughput": 2323.14, "total_tokens": 19156272} {"current_steps": 33220, "total_steps": 67140, "loss": 0.6289, "lr": 2.9789744462202407e-05, "epoch": 4.947870122132857, "percentage": 49.48, "elapsed_time": "2:17:26", "remaining_time": "2:20:20", "throughput": 2323.15, "total_tokens": 19158896} {"current_steps": 33225, "total_steps": 67140, "loss": 0.5606, "lr": 2.9783365847993362e-05, "epoch": 4.9486148346738155, "percentage": 49.49, "elapsed_time": "2:17:28", "remaining_time": "2:20:19", "throughput": 2323.18, "total_tokens": 19161744} {"current_steps": 33230, "total_steps": 67140, "loss": 0.5309, "lr": 2.9776986910543896e-05, "epoch": 4.949359547214775, "percentage": 49.49, "elapsed_time": "2:17:29", "remaining_time": "2:20:18", "throughput": 2323.21, "total_tokens": 19164624} {"current_steps": 33235, "total_steps": 67140, "loss": 0.6268, "lr": 2.9770607650285074e-05, "epoch": 4.950104259755735, "percentage": 49.5, "elapsed_time": "2:17:30", "remaining_time": "2:20:16", "throughput": 2323.26, "total_tokens": 19167792} {"current_steps": 33240, "total_steps": 67140, "loss": 0.6715, "lr": 2.9764228067647987e-05, "epoch": 4.9508489722966935, "percentage": 49.51, "elapsed_time": "2:17:31", "remaining_time": "2:20:15", "throughput": 2323.29, "total_tokens": 19170736} {"current_steps": 33245, "total_steps": 67140, "loss": 0.6507, "lr": 2.975784816306374e-05, "epoch": 4.951593684837652, "percentage": 49.52, "elapsed_time": "2:17:32", "remaining_time": "2:20:14", "throughput": 2323.31, "total_tokens": 19173456} {"current_steps": 33250, "total_steps": 67140, "loss": 0.549, "lr": 2.9751467936963456e-05, "epoch": 4.952338397378612, "percentage": 49.52, "elapsed_time": "2:17:33", "remaining_time": "2:20:12", "throughput": 2323.34, "total_tokens": 19176368} {"current_steps": 33255, "total_steps": 67140, "loss": 0.5242, "lr": 2.9745087389778286e-05, "epoch": 4.953083109919571, "percentage": 49.53, "elapsed_time": "2:17:34", "remaining_time": "2:20:11", "throughput": 2323.37, "total_tokens": 19179280} {"current_steps": 33260, "total_steps": 67140, "loss": 0.7243, "lr": 2.9738706521939402e-05, "epoch": 4.95382782246053, "percentage": 49.54, "elapsed_time": "2:17:36", "remaining_time": "2:20:10", "throughput": 2323.42, "total_tokens": 19182480} {"current_steps": 33265, "total_steps": 67140, "loss": 0.6601, "lr": 2.9732325333877997e-05, "epoch": 4.954572535001489, "percentage": 49.55, "elapsed_time": "2:17:37", "remaining_time": "2:20:08", "throughput": 2323.48, "total_tokens": 19185712} {"current_steps": 33270, "total_steps": 67140, "loss": 0.6786, "lr": 2.9725943826025287e-05, "epoch": 4.955317247542449, "percentage": 49.55, "elapsed_time": "2:17:38", "remaining_time": "2:20:07", "throughput": 2323.49, "total_tokens": 19188464} {"current_steps": 33275, "total_steps": 67140, "loss": 0.638, "lr": 2.9719561998812506e-05, "epoch": 4.9560619600834075, "percentage": 49.56, "elapsed_time": "2:17:39", "remaining_time": "2:20:06", "throughput": 2323.51, "total_tokens": 19191152} {"current_steps": 33280, "total_steps": 67140, "loss": 0.7251, "lr": 2.971317985267092e-05, "epoch": 4.956806672624367, "percentage": 49.57, "elapsed_time": "2:17:40", "remaining_time": "2:20:04", "throughput": 2323.57, "total_tokens": 19194480} {"current_steps": 33285, "total_steps": 67140, "loss": 0.5448, "lr": 2.9706797388031794e-05, "epoch": 4.957551385165326, "percentage": 49.58, "elapsed_time": "2:17:41", "remaining_time": "2:20:03", "throughput": 2323.59, "total_tokens": 19197264} {"current_steps": 33290, "total_steps": 67140, "loss": 0.478, "lr": 2.9700414605326444e-05, "epoch": 4.9582960977062855, "percentage": 49.58, "elapsed_time": "2:17:43", "remaining_time": "2:20:02", "throughput": 2323.62, "total_tokens": 19200144} {"current_steps": 33295, "total_steps": 67140, "loss": 0.6907, "lr": 2.969403150498618e-05, "epoch": 4.959040810247244, "percentage": 49.59, "elapsed_time": "2:17:44", "remaining_time": "2:20:00", "throughput": 2323.67, "total_tokens": 19203376} {"current_steps": 33300, "total_steps": 67140, "loss": 0.5933, "lr": 2.9687648087442353e-05, "epoch": 4.959785522788204, "percentage": 49.6, "elapsed_time": "2:17:45", "remaining_time": "2:19:59", "throughput": 2323.69, "total_tokens": 19206096} {"current_steps": 33305, "total_steps": 67140, "loss": 0.6454, "lr": 2.968126435312632e-05, "epoch": 4.960530235329163, "percentage": 49.61, "elapsed_time": "2:17:46", "remaining_time": "2:19:58", "throughput": 2323.7, "total_tokens": 19208784} {"current_steps": 33310, "total_steps": 67140, "loss": 0.5545, "lr": 2.9674880302469487e-05, "epoch": 4.961274947870122, "percentage": 49.61, "elapsed_time": "2:17:47", "remaining_time": "2:19:56", "throughput": 2323.71, "total_tokens": 19211472} {"current_steps": 33315, "total_steps": 67140, "loss": 0.7539, "lr": 2.9668495935903246e-05, "epoch": 4.962019660411081, "percentage": 49.62, "elapsed_time": "2:17:48", "remaining_time": "2:19:55", "throughput": 2323.73, "total_tokens": 19214160} {"current_steps": 33320, "total_steps": 67140, "loss": 0.5175, "lr": 2.9662111253859025e-05, "epoch": 4.962764372952041, "percentage": 49.63, "elapsed_time": "2:17:49", "remaining_time": "2:19:53", "throughput": 2323.76, "total_tokens": 19217008} {"current_steps": 33325, "total_steps": 67140, "loss": 0.6771, "lr": 2.9655726256768286e-05, "epoch": 4.9635090854929995, "percentage": 49.64, "elapsed_time": "2:17:50", "remaining_time": "2:19:52", "throughput": 2323.8, "total_tokens": 19220048} {"current_steps": 33330, "total_steps": 67140, "loss": 0.6835, "lr": 2.96493409450625e-05, "epoch": 4.964253798033959, "percentage": 49.64, "elapsed_time": "2:17:52", "remaining_time": "2:19:51", "throughput": 2323.81, "total_tokens": 19222736} {"current_steps": 33335, "total_steps": 67140, "loss": 0.6169, "lr": 2.9642955319173142e-05, "epoch": 4.964998510574918, "percentage": 49.65, "elapsed_time": "2:17:53", "remaining_time": "2:19:49", "throughput": 2323.81, "total_tokens": 19225264} {"current_steps": 33340, "total_steps": 67140, "loss": 0.6688, "lr": 2.963656937953175e-05, "epoch": 4.965743223115878, "percentage": 49.66, "elapsed_time": "2:17:54", "remaining_time": "2:19:48", "throughput": 2323.84, "total_tokens": 19228112} {"current_steps": 33345, "total_steps": 67140, "loss": 0.6333, "lr": 2.9630183126569843e-05, "epoch": 4.966487935656836, "percentage": 49.66, "elapsed_time": "2:17:55", "remaining_time": "2:19:47", "throughput": 2323.88, "total_tokens": 19231152} {"current_steps": 33350, "total_steps": 67140, "loss": 0.4847, "lr": 2.9623796560718997e-05, "epoch": 4.967232648197796, "percentage": 49.67, "elapsed_time": "2:17:56", "remaining_time": "2:19:45", "throughput": 2323.88, "total_tokens": 19233616} {"current_steps": 33355, "total_steps": 67140, "loss": 0.6308, "lr": 2.961740968241077e-05, "epoch": 4.967977360738755, "percentage": 49.68, "elapsed_time": "2:17:57", "remaining_time": "2:19:44", "throughput": 2323.9, "total_tokens": 19236432} {"current_steps": 33360, "total_steps": 67140, "loss": 0.6303, "lr": 2.961102249207677e-05, "epoch": 4.968722073279714, "percentage": 49.69, "elapsed_time": "2:17:58", "remaining_time": "2:19:43", "throughput": 2323.93, "total_tokens": 19239344} {"current_steps": 33365, "total_steps": 67140, "loss": 0.5539, "lr": 2.9604634990148617e-05, "epoch": 4.969466785820673, "percentage": 49.69, "elapsed_time": "2:17:59", "remaining_time": "2:19:41", "throughput": 2323.98, "total_tokens": 19242448} {"current_steps": 33370, "total_steps": 67140, "loss": 0.5732, "lr": 2.9598247177057952e-05, "epoch": 4.970211498361633, "percentage": 49.7, "elapsed_time": "2:18:01", "remaining_time": "2:19:40", "throughput": 2323.99, "total_tokens": 19245168} {"current_steps": 33375, "total_steps": 67140, "loss": 0.6295, "lr": 2.9591859053236436e-05, "epoch": 4.9709562109025915, "percentage": 49.71, "elapsed_time": "2:18:02", "remaining_time": "2:19:39", "throughput": 2324.03, "total_tokens": 19248208} {"current_steps": 33380, "total_steps": 67140, "loss": 0.833, "lr": 2.9585470619115762e-05, "epoch": 4.971700923443551, "percentage": 49.72, "elapsed_time": "2:18:03", "remaining_time": "2:19:37", "throughput": 2324.06, "total_tokens": 19251056} {"current_steps": 33385, "total_steps": 67140, "loss": 0.8082, "lr": 2.9579081875127625e-05, "epoch": 4.97244563598451, "percentage": 49.72, "elapsed_time": "2:18:04", "remaining_time": "2:19:36", "throughput": 2324.09, "total_tokens": 19253968} {"current_steps": 33390, "total_steps": 67140, "loss": 0.5393, "lr": 2.9572692821703745e-05, "epoch": 4.973190348525469, "percentage": 49.73, "elapsed_time": "2:18:05", "remaining_time": "2:19:34", "throughput": 2324.11, "total_tokens": 19256720} {"current_steps": 33395, "total_steps": 67140, "loss": 0.6314, "lr": 2.9566303459275884e-05, "epoch": 4.973935061066428, "percentage": 49.74, "elapsed_time": "2:18:06", "remaining_time": "2:19:33", "throughput": 2324.15, "total_tokens": 19259728} {"current_steps": 33400, "total_steps": 67140, "loss": 0.6599, "lr": 2.9559913788275793e-05, "epoch": 4.974679773607388, "percentage": 49.75, "elapsed_time": "2:18:07", "remaining_time": "2:19:32", "throughput": 2324.19, "total_tokens": 19262736} {"current_steps": 33405, "total_steps": 67140, "loss": 0.5941, "lr": 2.955352380913527e-05, "epoch": 4.975424486148347, "percentage": 49.75, "elapsed_time": "2:18:09", "remaining_time": "2:19:30", "throughput": 2324.21, "total_tokens": 19265488} {"current_steps": 33410, "total_steps": 67140, "loss": 0.6757, "lr": 2.954713352228613e-05, "epoch": 4.9761691986893055, "percentage": 49.76, "elapsed_time": "2:18:10", "remaining_time": "2:19:29", "throughput": 2324.22, "total_tokens": 19268080} {"current_steps": 33415, "total_steps": 67140, "loss": 0.7354, "lr": 2.9540742928160182e-05, "epoch": 4.976913911230265, "percentage": 49.77, "elapsed_time": "2:18:11", "remaining_time": "2:19:28", "throughput": 2324.29, "total_tokens": 19271536} {"current_steps": 33420, "total_steps": 67140, "loss": 0.7009, "lr": 2.953435202718929e-05, "epoch": 4.977658623771224, "percentage": 49.78, "elapsed_time": "2:18:12", "remaining_time": "2:19:26", "throughput": 2324.31, "total_tokens": 19274320} {"current_steps": 33425, "total_steps": 67140, "loss": 0.7661, "lr": 2.9527960819805327e-05, "epoch": 4.978403336312184, "percentage": 49.78, "elapsed_time": "2:18:13", "remaining_time": "2:19:25", "throughput": 2324.32, "total_tokens": 19277072} {"current_steps": 33430, "total_steps": 67140, "loss": 0.6915, "lr": 2.9521569306440183e-05, "epoch": 4.979148048853142, "percentage": 49.79, "elapsed_time": "2:18:14", "remaining_time": "2:19:24", "throughput": 2324.35, "total_tokens": 19279984} {"current_steps": 33435, "total_steps": 67140, "loss": 0.5485, "lr": 2.9515177487525763e-05, "epoch": 4.979892761394102, "percentage": 49.8, "elapsed_time": "2:18:15", "remaining_time": "2:19:22", "throughput": 2324.37, "total_tokens": 19282736} {"current_steps": 33440, "total_steps": 67140, "loss": 0.6683, "lr": 2.9508785363494e-05, "epoch": 4.980637473935061, "percentage": 49.81, "elapsed_time": "2:18:17", "remaining_time": "2:19:21", "throughput": 2324.39, "total_tokens": 19285552} {"current_steps": 33445, "total_steps": 67140, "loss": 0.9319, "lr": 2.950239293477687e-05, "epoch": 4.98138218647602, "percentage": 49.81, "elapsed_time": "2:18:18", "remaining_time": "2:19:20", "throughput": 2324.46, "total_tokens": 19288912} {"current_steps": 33450, "total_steps": 67140, "loss": 0.7617, "lr": 2.949600020180632e-05, "epoch": 4.982126899016979, "percentage": 49.82, "elapsed_time": "2:18:19", "remaining_time": "2:19:18", "throughput": 2324.47, "total_tokens": 19291632} {"current_steps": 33455, "total_steps": 67140, "loss": 0.6277, "lr": 2.9489607165014353e-05, "epoch": 4.982871611557939, "percentage": 49.83, "elapsed_time": "2:18:20", "remaining_time": "2:19:17", "throughput": 2324.5, "total_tokens": 19294576} {"current_steps": 33460, "total_steps": 67140, "loss": 0.6029, "lr": 2.9483213824833e-05, "epoch": 4.9836163240988975, "percentage": 49.84, "elapsed_time": "2:18:21", "remaining_time": "2:19:16", "throughput": 2324.56, "total_tokens": 19297840} {"current_steps": 33465, "total_steps": 67140, "loss": 0.8463, "lr": 2.9476820181694276e-05, "epoch": 4.984361036639857, "percentage": 49.84, "elapsed_time": "2:18:22", "remaining_time": "2:19:14", "throughput": 2324.6, "total_tokens": 19300880} {"current_steps": 33470, "total_steps": 67140, "loss": 0.556, "lr": 2.9470426236030247e-05, "epoch": 4.985105749180816, "percentage": 49.85, "elapsed_time": "2:18:24", "remaining_time": "2:19:13", "throughput": 2324.66, "total_tokens": 19304176} {"current_steps": 33475, "total_steps": 67140, "loss": 0.5082, "lr": 2.9464031988272983e-05, "epoch": 4.985850461721776, "percentage": 49.86, "elapsed_time": "2:18:25", "remaining_time": "2:19:12", "throughput": 2324.7, "total_tokens": 19307120} {"current_steps": 33480, "total_steps": 67140, "loss": 0.6066, "lr": 2.9457637438854592e-05, "epoch": 4.986595174262734, "percentage": 49.87, "elapsed_time": "2:18:26", "remaining_time": "2:19:11", "throughput": 2324.73, "total_tokens": 19310096} {"current_steps": 33485, "total_steps": 67140, "loss": 0.5568, "lr": 2.9451242588207185e-05, "epoch": 4.987339886803694, "percentage": 49.87, "elapsed_time": "2:18:27", "remaining_time": "2:19:09", "throughput": 2324.75, "total_tokens": 19312752} {"current_steps": 33490, "total_steps": 67140, "loss": 0.5766, "lr": 2.94448474367629e-05, "epoch": 4.988084599344653, "percentage": 49.88, "elapsed_time": "2:18:28", "remaining_time": "2:19:08", "throughput": 2324.75, "total_tokens": 19315312} {"current_steps": 33495, "total_steps": 67140, "loss": 0.6104, "lr": 2.94384519849539e-05, "epoch": 4.988829311885612, "percentage": 49.89, "elapsed_time": "2:18:29", "remaining_time": "2:19:06", "throughput": 2324.77, "total_tokens": 19318032} {"current_steps": 33500, "total_steps": 67140, "loss": 0.5589, "lr": 2.9432056233212357e-05, "epoch": 4.989574024426571, "percentage": 49.9, "elapsed_time": "2:18:30", "remaining_time": "2:19:05", "throughput": 2324.79, "total_tokens": 19320880} {"current_steps": 33505, "total_steps": 67140, "loss": 0.7038, "lr": 2.9425660181970472e-05, "epoch": 4.990318736967531, "percentage": 49.9, "elapsed_time": "2:18:31", "remaining_time": "2:19:04", "throughput": 2324.83, "total_tokens": 19323920} {"current_steps": 33510, "total_steps": 67140, "loss": 0.5375, "lr": 2.9419263831660475e-05, "epoch": 4.99106344950849, "percentage": 49.91, "elapsed_time": "2:18:33", "remaining_time": "2:19:02", "throughput": 2324.87, "total_tokens": 19326864} {"current_steps": 33515, "total_steps": 67140, "loss": 0.7938, "lr": 2.941286718271459e-05, "epoch": 4.991808162049449, "percentage": 49.92, "elapsed_time": "2:18:34", "remaining_time": "2:19:01", "throughput": 2324.91, "total_tokens": 19329872} {"current_steps": 33520, "total_steps": 67140, "loss": 0.7231, "lr": 2.9406470235565075e-05, "epoch": 4.992552874590408, "percentage": 49.93, "elapsed_time": "2:18:35", "remaining_time": "2:19:00", "throughput": 2324.93, "total_tokens": 19332688} {"current_steps": 33525, "total_steps": 67140, "loss": 0.7163, "lr": 2.940007299064423e-05, "epoch": 4.993297587131368, "percentage": 49.93, "elapsed_time": "2:18:36", "remaining_time": "2:18:58", "throughput": 2324.96, "total_tokens": 19335536} {"current_steps": 33530, "total_steps": 67140, "loss": 0.6501, "lr": 2.9393675448384332e-05, "epoch": 4.994042299672326, "percentage": 49.94, "elapsed_time": "2:18:37", "remaining_time": "2:18:57", "throughput": 2324.97, "total_tokens": 19338192} {"current_steps": 33535, "total_steps": 67140, "loss": 0.7835, "lr": 2.9387277609217713e-05, "epoch": 4.994787012213286, "percentage": 49.95, "elapsed_time": "2:18:38", "remaining_time": "2:18:56", "throughput": 2324.99, "total_tokens": 19341008} {"current_steps": 33540, "total_steps": 67140, "loss": 0.6096, "lr": 2.9380879473576705e-05, "epoch": 4.995531724754245, "percentage": 49.96, "elapsed_time": "2:18:39", "remaining_time": "2:18:54", "throughput": 2325.03, "total_tokens": 19343888} {"current_steps": 33545, "total_steps": 67140, "loss": 0.5711, "lr": 2.9374481041893687e-05, "epoch": 4.996276437295204, "percentage": 49.96, "elapsed_time": "2:18:41", "remaining_time": "2:18:53", "throughput": 2325.07, "total_tokens": 19346928} {"current_steps": 33550, "total_steps": 67140, "loss": 0.7, "lr": 2.9368082314601018e-05, "epoch": 4.997021149836163, "percentage": 49.97, "elapsed_time": "2:18:42", "remaining_time": "2:18:52", "throughput": 2325.1, "total_tokens": 19349808} {"current_steps": 33555, "total_steps": 67140, "loss": 0.6641, "lr": 2.9361683292131103e-05, "epoch": 4.997765862377122, "percentage": 49.98, "elapsed_time": "2:18:43", "remaining_time": "2:18:50", "throughput": 2325.13, "total_tokens": 19352752} {"current_steps": 33560, "total_steps": 67140, "loss": 0.5879, "lr": 2.935528397491637e-05, "epoch": 4.998510574918082, "percentage": 49.99, "elapsed_time": "2:18:44", "remaining_time": "2:18:49", "throughput": 2325.15, "total_tokens": 19355472} {"current_steps": 33565, "total_steps": 67140, "loss": 0.6321, "lr": 2.9348884363389246e-05, "epoch": 4.999255287459041, "percentage": 49.99, "elapsed_time": "2:18:45", "remaining_time": "2:18:48", "throughput": 2325.18, "total_tokens": 19358320} {"current_steps": 33570, "total_steps": 67140, "loss": 0.7214, "lr": 2.9342484457982206e-05, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "2:18:46", "remaining_time": "2:18:46", "throughput": 2325.15, "total_tokens": 19360624} {"current_steps": 33570, "total_steps": 67140, "eval_loss": 0.6489034295082092, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "2:20:00", "remaining_time": "2:20:00", "throughput": 2304.6, "total_tokens": 19360624} {"current_steps": 33575, "total_steps": 67140, "loss": 0.6048, "lr": 2.9336084259127716e-05, "epoch": 5.000744712540959, "percentage": 50.01, "elapsed_time": "2:20:03", "remaining_time": "2:20:01", "throughput": 2304.13, "total_tokens": 19363472} {"current_steps": 33580, "total_steps": 67140, "loss": 0.5263, "lr": 2.932968376725828e-05, "epoch": 5.001489425081918, "percentage": 50.01, "elapsed_time": "2:20:04", "remaining_time": "2:19:59", "throughput": 2304.16, "total_tokens": 19366288} {"current_steps": 33585, "total_steps": 67140, "loss": 0.3976, "lr": 2.932328298280642e-05, "epoch": 5.002234137622877, "percentage": 50.02, "elapsed_time": "2:20:06", "remaining_time": "2:19:58", "throughput": 2304.17, "total_tokens": 19368944} {"current_steps": 33590, "total_steps": 67140, "loss": 0.7256, "lr": 2.9316881906204675e-05, "epoch": 5.002978850163837, "percentage": 50.03, "elapsed_time": "2:20:07", "remaining_time": "2:19:57", "throughput": 2304.18, "total_tokens": 19371632} {"current_steps": 33595, "total_steps": 67140, "loss": 0.4853, "lr": 2.9310480537885605e-05, "epoch": 5.003723562704796, "percentage": 50.04, "elapsed_time": "2:20:08", "remaining_time": "2:19:55", "throughput": 2304.22, "total_tokens": 19374608} {"current_steps": 33600, "total_steps": 67140, "loss": 0.5939, "lr": 2.9304078878281778e-05, "epoch": 5.004468275245755, "percentage": 50.04, "elapsed_time": "2:20:09", "remaining_time": "2:19:54", "throughput": 2304.25, "total_tokens": 19377520} {"current_steps": 33605, "total_steps": 67140, "loss": 0.7016, "lr": 2.9297676927825803e-05, "epoch": 5.005212987786714, "percentage": 50.05, "elapsed_time": "2:20:10", "remaining_time": "2:19:53", "throughput": 2304.29, "total_tokens": 19380464} {"current_steps": 33610, "total_steps": 67140, "loss": 0.5383, "lr": 2.9291274686950294e-05, "epoch": 5.005957700327674, "percentage": 50.06, "elapsed_time": "2:20:11", "remaining_time": "2:19:51", "throughput": 2304.31, "total_tokens": 19383152} {"current_steps": 33615, "total_steps": 67140, "loss": 0.6483, "lr": 2.9284872156087896e-05, "epoch": 5.006702412868632, "percentage": 50.07, "elapsed_time": "2:20:12", "remaining_time": "2:19:50", "throughput": 2304.35, "total_tokens": 19386096} {"current_steps": 33620, "total_steps": 67140, "loss": 0.7593, "lr": 2.9278469335671245e-05, "epoch": 5.007447125409592, "percentage": 50.07, "elapsed_time": "2:20:13", "remaining_time": "2:19:48", "throughput": 2304.38, "total_tokens": 19389072} {"current_steps": 33625, "total_steps": 67140, "loss": 0.6513, "lr": 2.9272066226133037e-05, "epoch": 5.008191837950551, "percentage": 50.08, "elapsed_time": "2:20:15", "remaining_time": "2:19:47", "throughput": 2304.41, "total_tokens": 19391792} {"current_steps": 33630, "total_steps": 67140, "loss": 0.6912, "lr": 2.9265662827905967e-05, "epoch": 5.00893655049151, "percentage": 50.09, "elapsed_time": "2:20:16", "remaining_time": "2:19:46", "throughput": 2304.43, "total_tokens": 19394608} {"current_steps": 33635, "total_steps": 67140, "loss": 0.7899, "lr": 2.925925914142274e-05, "epoch": 5.009681263032469, "percentage": 50.1, "elapsed_time": "2:20:17", "remaining_time": "2:19:44", "throughput": 2304.44, "total_tokens": 19397232} {"current_steps": 33640, "total_steps": 67140, "loss": 0.7102, "lr": 2.92528551671161e-05, "epoch": 5.010425975573429, "percentage": 50.1, "elapsed_time": "2:20:18", "remaining_time": "2:19:43", "throughput": 2304.46, "total_tokens": 19399888} {"current_steps": 33645, "total_steps": 67140, "loss": 0.5457, "lr": 2.9246450905418798e-05, "epoch": 5.011170688114388, "percentage": 50.11, "elapsed_time": "2:20:19", "remaining_time": "2:19:42", "throughput": 2304.52, "total_tokens": 19403152} {"current_steps": 33650, "total_steps": 67140, "loss": 0.6046, "lr": 2.9240046356763607e-05, "epoch": 5.011915400655347, "percentage": 50.12, "elapsed_time": "2:20:20", "remaining_time": "2:19:40", "throughput": 2304.52, "total_tokens": 19405744} {"current_steps": 33655, "total_steps": 67140, "loss": 0.5775, "lr": 2.9233641521583325e-05, "epoch": 5.012660113196306, "percentage": 50.13, "elapsed_time": "2:20:21", "remaining_time": "2:19:39", "throughput": 2304.53, "total_tokens": 19408304} {"current_steps": 33660, "total_steps": 67140, "loss": 0.5087, "lr": 2.9227236400310765e-05, "epoch": 5.013404825737266, "percentage": 50.13, "elapsed_time": "2:20:23", "remaining_time": "2:19:37", "throughput": 2304.58, "total_tokens": 19411504} {"current_steps": 33665, "total_steps": 67140, "loss": 0.6558, "lr": 2.9220830993378745e-05, "epoch": 5.014149538278224, "percentage": 50.14, "elapsed_time": "2:20:24", "remaining_time": "2:19:36", "throughput": 2304.62, "total_tokens": 19414448} {"current_steps": 33670, "total_steps": 67140, "loss": 0.693, "lr": 2.9214425301220133e-05, "epoch": 5.014894250819184, "percentage": 50.15, "elapsed_time": "2:20:25", "remaining_time": "2:19:35", "throughput": 2304.65, "total_tokens": 19417360} {"current_steps": 33675, "total_steps": 67140, "loss": 0.4954, "lr": 2.9208019324267798e-05, "epoch": 5.015638963360143, "percentage": 50.16, "elapsed_time": "2:20:26", "remaining_time": "2:19:33", "throughput": 2304.67, "total_tokens": 19420080} {"current_steps": 33680, "total_steps": 67140, "loss": 0.8149, "lr": 2.920161306295462e-05, "epoch": 5.0163836759011025, "percentage": 50.16, "elapsed_time": "2:20:27", "remaining_time": "2:19:32", "throughput": 2304.72, "total_tokens": 19423184} {"current_steps": 33685, "total_steps": 67140, "loss": 0.76, "lr": 2.9195206517713515e-05, "epoch": 5.017128388442061, "percentage": 50.17, "elapsed_time": "2:20:28", "remaining_time": "2:19:31", "throughput": 2304.73, "total_tokens": 19425776} {"current_steps": 33690, "total_steps": 67140, "loss": 0.7188, "lr": 2.9188799688977407e-05, "epoch": 5.017873100983021, "percentage": 50.18, "elapsed_time": "2:20:29", "remaining_time": "2:19:29", "throughput": 2304.77, "total_tokens": 19428816} {"current_steps": 33695, "total_steps": 67140, "loss": 0.7109, "lr": 2.9182392577179257e-05, "epoch": 5.01861781352398, "percentage": 50.19, "elapsed_time": "2:20:30", "remaining_time": "2:19:28", "throughput": 2304.82, "total_tokens": 19431888} {"current_steps": 33700, "total_steps": 67140, "loss": 0.7416, "lr": 2.917598518275201e-05, "epoch": 5.019362526064939, "percentage": 50.19, "elapsed_time": "2:20:32", "remaining_time": "2:19:27", "throughput": 2304.86, "total_tokens": 19434928} {"current_steps": 33705, "total_steps": 67140, "loss": 0.6082, "lr": 2.9169577506128664e-05, "epoch": 5.020107238605898, "percentage": 50.2, "elapsed_time": "2:20:33", "remaining_time": "2:19:25", "throughput": 2304.9, "total_tokens": 19437904} {"current_steps": 33710, "total_steps": 67140, "loss": 0.6303, "lr": 2.9163169547742225e-05, "epoch": 5.020851951146858, "percentage": 50.21, "elapsed_time": "2:20:34", "remaining_time": "2:19:24", "throughput": 2304.94, "total_tokens": 19440976} {"current_steps": 33715, "total_steps": 67140, "loss": 0.6513, "lr": 2.9156761308025715e-05, "epoch": 5.021596663687816, "percentage": 50.22, "elapsed_time": "2:20:35", "remaining_time": "2:19:23", "throughput": 2304.94, "total_tokens": 19443568} {"current_steps": 33720, "total_steps": 67140, "loss": 0.5091, "lr": 2.915035278741218e-05, "epoch": 5.022341376228776, "percentage": 50.22, "elapsed_time": "2:20:36", "remaining_time": "2:19:21", "throughput": 2304.96, "total_tokens": 19446256} {"current_steps": 33725, "total_steps": 67140, "loss": 0.3898, "lr": 2.914394398633467e-05, "epoch": 5.023086088769735, "percentage": 50.23, "elapsed_time": "2:20:37", "remaining_time": "2:19:20", "throughput": 2304.98, "total_tokens": 19449040} {"current_steps": 33730, "total_steps": 67140, "loss": 0.4417, "lr": 2.9137534905226272e-05, "epoch": 5.0238308013106945, "percentage": 50.24, "elapsed_time": "2:20:39", "remaining_time": "2:19:18", "throughput": 2305.05, "total_tokens": 19452400} {"current_steps": 33735, "total_steps": 67140, "loss": 0.7445, "lr": 2.9131125544520095e-05, "epoch": 5.024575513851653, "percentage": 50.25, "elapsed_time": "2:20:40", "remaining_time": "2:19:17", "throughput": 2305.07, "total_tokens": 19455120} {"current_steps": 33740, "total_steps": 67140, "loss": 0.6642, "lr": 2.9124715904649247e-05, "epoch": 5.025320226392613, "percentage": 50.25, "elapsed_time": "2:20:41", "remaining_time": "2:19:16", "throughput": 2305.11, "total_tokens": 19458128} {"current_steps": 33745, "total_steps": 67140, "loss": 0.6018, "lr": 2.911830598604687e-05, "epoch": 5.026064938933572, "percentage": 50.26, "elapsed_time": "2:20:42", "remaining_time": "2:19:14", "throughput": 2305.13, "total_tokens": 19460944} {"current_steps": 33750, "total_steps": 67140, "loss": 0.4837, "lr": 2.911189578914611e-05, "epoch": 5.02680965147453, "percentage": 50.27, "elapsed_time": "2:20:43", "remaining_time": "2:19:13", "throughput": 2305.14, "total_tokens": 19463504} {"current_steps": 33755, "total_steps": 67140, "loss": 0.6553, "lr": 2.9105485314380154e-05, "epoch": 5.02755436401549, "percentage": 50.28, "elapsed_time": "2:20:44", "remaining_time": "2:19:12", "throughput": 2305.18, "total_tokens": 19466512} {"current_steps": 33760, "total_steps": 67140, "loss": 0.6483, "lr": 2.90990745621822e-05, "epoch": 5.028299076556449, "percentage": 50.28, "elapsed_time": "2:20:45", "remaining_time": "2:19:10", "throughput": 2305.19, "total_tokens": 19469168} {"current_steps": 33765, "total_steps": 67140, "loss": 0.5826, "lr": 2.9092663532985442e-05, "epoch": 5.0290437890974085, "percentage": 50.29, "elapsed_time": "2:20:46", "remaining_time": "2:19:09", "throughput": 2305.23, "total_tokens": 19472080} {"current_steps": 33770, "total_steps": 67140, "loss": 0.471, "lr": 2.9086252227223122e-05, "epoch": 5.029788501638367, "percentage": 50.3, "elapsed_time": "2:20:48", "remaining_time": "2:19:07", "throughput": 2305.25, "total_tokens": 19474832} {"current_steps": 33775, "total_steps": 67140, "loss": 0.4214, "lr": 2.9079840645328505e-05, "epoch": 5.030533214179327, "percentage": 50.31, "elapsed_time": "2:20:49", "remaining_time": "2:19:06", "throughput": 2305.27, "total_tokens": 19477584} {"current_steps": 33780, "total_steps": 67140, "loss": 0.5997, "lr": 2.907342878773483e-05, "epoch": 5.031277926720286, "percentage": 50.31, "elapsed_time": "2:20:50", "remaining_time": "2:19:05", "throughput": 2305.28, "total_tokens": 19480304} {"current_steps": 33785, "total_steps": 67140, "loss": 0.5484, "lr": 2.90670166548754e-05, "epoch": 5.032022639261245, "percentage": 50.32, "elapsed_time": "2:20:51", "remaining_time": "2:19:03", "throughput": 2305.32, "total_tokens": 19483248} {"current_steps": 33790, "total_steps": 67140, "loss": 0.4325, "lr": 2.9060604247183525e-05, "epoch": 5.032767351802204, "percentage": 50.33, "elapsed_time": "2:20:52", "remaining_time": "2:19:02", "throughput": 2305.36, "total_tokens": 19486192} {"current_steps": 33795, "total_steps": 67140, "loss": 0.5754, "lr": 2.9054191565092524e-05, "epoch": 5.033512064343164, "percentage": 50.34, "elapsed_time": "2:20:53", "remaining_time": "2:19:01", "throughput": 2305.39, "total_tokens": 19489072} {"current_steps": 33800, "total_steps": 67140, "loss": 0.8457, "lr": 2.9047778609035737e-05, "epoch": 5.034256776884122, "percentage": 50.34, "elapsed_time": "2:20:54", "remaining_time": "2:18:59", "throughput": 2305.44, "total_tokens": 19492112} {"current_steps": 33805, "total_steps": 67140, "loss": 0.5238, "lr": 2.9041365379446522e-05, "epoch": 5.035001489425082, "percentage": 50.35, "elapsed_time": "2:20:56", "remaining_time": "2:18:58", "throughput": 2305.49, "total_tokens": 19495280} {"current_steps": 33810, "total_steps": 67140, "loss": 0.4613, "lr": 2.9034951876758276e-05, "epoch": 5.035746201966041, "percentage": 50.36, "elapsed_time": "2:20:57", "remaining_time": "2:18:57", "throughput": 2305.5, "total_tokens": 19497872} {"current_steps": 33815, "total_steps": 67140, "loss": 0.7612, "lr": 2.902853810140439e-05, "epoch": 5.0364909145070005, "percentage": 50.36, "elapsed_time": "2:20:58", "remaining_time": "2:18:55", "throughput": 2305.54, "total_tokens": 19500848} {"current_steps": 33820, "total_steps": 67140, "loss": 0.6055, "lr": 2.9022124053818268e-05, "epoch": 5.037235627047959, "percentage": 50.37, "elapsed_time": "2:20:59", "remaining_time": "2:18:54", "throughput": 2305.57, "total_tokens": 19503728} {"current_steps": 33825, "total_steps": 67140, "loss": 0.8146, "lr": 2.901570973443336e-05, "epoch": 5.037980339588919, "percentage": 50.38, "elapsed_time": "2:21:00", "remaining_time": "2:18:52", "throughput": 2305.6, "total_tokens": 19506640} {"current_steps": 33830, "total_steps": 67140, "loss": 0.594, "lr": 2.9009295143683114e-05, "epoch": 5.038725052129878, "percentage": 50.39, "elapsed_time": "2:21:01", "remaining_time": "2:18:51", "throughput": 2305.63, "total_tokens": 19509456} {"current_steps": 33835, "total_steps": 67140, "loss": 0.5666, "lr": 2.9002880282001004e-05, "epoch": 5.039469764670837, "percentage": 50.39, "elapsed_time": "2:21:02", "remaining_time": "2:18:50", "throughput": 2305.66, "total_tokens": 19512400} {"current_steps": 33840, "total_steps": 67140, "loss": 0.4529, "lr": 2.899646514982052e-05, "epoch": 5.040214477211796, "percentage": 50.4, "elapsed_time": "2:21:03", "remaining_time": "2:18:48", "throughput": 2305.71, "total_tokens": 19515472} {"current_steps": 33845, "total_steps": 67140, "loss": 0.551, "lr": 2.8990049747575165e-05, "epoch": 5.040959189752756, "percentage": 50.41, "elapsed_time": "2:21:05", "remaining_time": "2:18:47", "throughput": 2305.73, "total_tokens": 19518256} {"current_steps": 33850, "total_steps": 67140, "loss": 0.7271, "lr": 2.8983634075698475e-05, "epoch": 5.0417039022937145, "percentage": 50.42, "elapsed_time": "2:21:06", "remaining_time": "2:18:46", "throughput": 2305.74, "total_tokens": 19520848} {"current_steps": 33855, "total_steps": 67140, "loss": 0.6802, "lr": 2.897721813462399e-05, "epoch": 5.042448614834674, "percentage": 50.42, "elapsed_time": "2:21:07", "remaining_time": "2:18:44", "throughput": 2305.77, "total_tokens": 19523728} {"current_steps": 33860, "total_steps": 67140, "loss": 0.784, "lr": 2.8970801924785273e-05, "epoch": 5.043193327375633, "percentage": 50.43, "elapsed_time": "2:21:08", "remaining_time": "2:18:43", "throughput": 2305.81, "total_tokens": 19526736} {"current_steps": 33865, "total_steps": 67140, "loss": 0.7776, "lr": 2.8964385446615905e-05, "epoch": 5.0439380399165925, "percentage": 50.44, "elapsed_time": "2:21:09", "remaining_time": "2:18:42", "throughput": 2305.85, "total_tokens": 19529744} {"current_steps": 33870, "total_steps": 67140, "loss": 0.7391, "lr": 2.895796870054948e-05, "epoch": 5.044682752457551, "percentage": 50.45, "elapsed_time": "2:21:10", "remaining_time": "2:18:40", "throughput": 2305.88, "total_tokens": 19532624} {"current_steps": 33875, "total_steps": 67140, "loss": 0.486, "lr": 2.895155168701964e-05, "epoch": 5.045427464998511, "percentage": 50.45, "elapsed_time": "2:21:11", "remaining_time": "2:18:39", "throughput": 2305.91, "total_tokens": 19535504} {"current_steps": 33880, "total_steps": 67140, "loss": 0.6197, "lr": 2.894513440645999e-05, "epoch": 5.04617217753947, "percentage": 50.46, "elapsed_time": "2:21:13", "remaining_time": "2:18:37", "throughput": 2305.94, "total_tokens": 19538320} {"current_steps": 33885, "total_steps": 67140, "loss": 0.5875, "lr": 2.8938716859304193e-05, "epoch": 5.046916890080429, "percentage": 50.47, "elapsed_time": "2:21:14", "remaining_time": "2:18:36", "throughput": 2305.95, "total_tokens": 19540912} {"current_steps": 33890, "total_steps": 67140, "loss": 0.7935, "lr": 2.8932299045985932e-05, "epoch": 5.047661602621388, "percentage": 50.48, "elapsed_time": "2:21:15", "remaining_time": "2:18:35", "throughput": 2305.97, "total_tokens": 19543664} {"current_steps": 33895, "total_steps": 67140, "loss": 0.4963, "lr": 2.892588096693889e-05, "epoch": 5.048406315162348, "percentage": 50.48, "elapsed_time": "2:21:16", "remaining_time": "2:18:33", "throughput": 2305.99, "total_tokens": 19546384} {"current_steps": 33900, "total_steps": 67140, "loss": 0.7949, "lr": 2.8919462622596764e-05, "epoch": 5.0491510277033065, "percentage": 50.49, "elapsed_time": "2:21:17", "remaining_time": "2:18:32", "throughput": 2306.02, "total_tokens": 19549264} {"current_steps": 33905, "total_steps": 67140, "loss": 0.5619, "lr": 2.8913044013393305e-05, "epoch": 5.049895740244266, "percentage": 50.5, "elapsed_time": "2:21:18", "remaining_time": "2:18:31", "throughput": 2306.05, "total_tokens": 19552176} {"current_steps": 33910, "total_steps": 67140, "loss": 0.5822, "lr": 2.890662513976223e-05, "epoch": 5.050640452785225, "percentage": 50.51, "elapsed_time": "2:21:19", "remaining_time": "2:18:29", "throughput": 2306.07, "total_tokens": 19555024} {"current_steps": 33915, "total_steps": 67140, "loss": 0.6477, "lr": 2.890020600213731e-05, "epoch": 5.0513851653261845, "percentage": 50.51, "elapsed_time": "2:21:20", "remaining_time": "2:18:28", "throughput": 2306.11, "total_tokens": 19557936} {"current_steps": 33920, "total_steps": 67140, "loss": 0.6931, "lr": 2.889378660095233e-05, "epoch": 5.052129877867143, "percentage": 50.52, "elapsed_time": "2:21:22", "remaining_time": "2:18:27", "throughput": 2306.15, "total_tokens": 19561040} {"current_steps": 33925, "total_steps": 67140, "loss": 0.5892, "lr": 2.8887366936641082e-05, "epoch": 5.052874590408102, "percentage": 50.53, "elapsed_time": "2:21:23", "remaining_time": "2:18:25", "throughput": 2306.2, "total_tokens": 19564208} {"current_steps": 33930, "total_steps": 67140, "loss": 0.6852, "lr": 2.8880947009637377e-05, "epoch": 5.053619302949062, "percentage": 50.54, "elapsed_time": "2:21:24", "remaining_time": "2:18:24", "throughput": 2306.24, "total_tokens": 19567184} {"current_steps": 33935, "total_steps": 67140, "loss": 0.6786, "lr": 2.887452682037506e-05, "epoch": 5.0543640154900205, "percentage": 50.54, "elapsed_time": "2:21:25", "remaining_time": "2:18:23", "throughput": 2306.26, "total_tokens": 19569968} {"current_steps": 33940, "total_steps": 67140, "loss": 0.5947, "lr": 2.8868106369287966e-05, "epoch": 5.05510872803098, "percentage": 50.55, "elapsed_time": "2:21:26", "remaining_time": "2:18:21", "throughput": 2306.3, "total_tokens": 19572912} {"current_steps": 33945, "total_steps": 67140, "loss": 0.4162, "lr": 2.886168565680997e-05, "epoch": 5.055853440571939, "percentage": 50.56, "elapsed_time": "2:21:27", "remaining_time": "2:18:20", "throughput": 2306.33, "total_tokens": 19575856} {"current_steps": 33950, "total_steps": 67140, "loss": 0.6821, "lr": 2.8855264683374956e-05, "epoch": 5.0565981531128985, "percentage": 50.57, "elapsed_time": "2:21:29", "remaining_time": "2:18:19", "throughput": 2306.4, "total_tokens": 19579216} {"current_steps": 33955, "total_steps": 67140, "loss": 0.5711, "lr": 2.884884344941684e-05, "epoch": 5.057342865653857, "percentage": 50.57, "elapsed_time": "2:21:30", "remaining_time": "2:18:17", "throughput": 2306.43, "total_tokens": 19582096} {"current_steps": 33960, "total_steps": 67140, "loss": 0.7585, "lr": 2.8842421955369526e-05, "epoch": 5.058087578194817, "percentage": 50.58, "elapsed_time": "2:21:31", "remaining_time": "2:18:16", "throughput": 2306.47, "total_tokens": 19585104} {"current_steps": 33965, "total_steps": 67140, "loss": 0.5248, "lr": 2.883600020166695e-05, "epoch": 5.058832290735776, "percentage": 50.59, "elapsed_time": "2:21:32", "remaining_time": "2:18:15", "throughput": 2306.51, "total_tokens": 19588144} {"current_steps": 33970, "total_steps": 67140, "loss": 0.5675, "lr": 2.8829578188743084e-05, "epoch": 5.059577003276735, "percentage": 50.6, "elapsed_time": "2:21:33", "remaining_time": "2:18:13", "throughput": 2306.53, "total_tokens": 19590928} {"current_steps": 33975, "total_steps": 67140, "loss": 0.783, "lr": 2.88231559170319e-05, "epoch": 5.060321715817694, "percentage": 50.6, "elapsed_time": "2:21:34", "remaining_time": "2:18:12", "throughput": 2306.58, "total_tokens": 19593968} {"current_steps": 33980, "total_steps": 67140, "loss": 0.6091, "lr": 2.8816733386967376e-05, "epoch": 5.061066428358654, "percentage": 50.61, "elapsed_time": "2:21:35", "remaining_time": "2:18:10", "throughput": 2306.61, "total_tokens": 19596880} {"current_steps": 33985, "total_steps": 67140, "loss": 0.6459, "lr": 2.8810310598983524e-05, "epoch": 5.0618111408996125, "percentage": 50.62, "elapsed_time": "2:21:37", "remaining_time": "2:18:09", "throughput": 2306.64, "total_tokens": 19599664} {"current_steps": 33990, "total_steps": 67140, "loss": 0.5047, "lr": 2.880388755351438e-05, "epoch": 5.062555853440572, "percentage": 50.63, "elapsed_time": "2:21:38", "remaining_time": "2:18:08", "throughput": 2306.66, "total_tokens": 19602384} {"current_steps": 33995, "total_steps": 67140, "loss": 0.5414, "lr": 2.8797464250993984e-05, "epoch": 5.063300565981531, "percentage": 50.63, "elapsed_time": "2:21:39", "remaining_time": "2:18:06", "throughput": 2306.68, "total_tokens": 19605168} {"current_steps": 34000, "total_steps": 67140, "loss": 0.5074, "lr": 2.8791040691856385e-05, "epoch": 5.0640452785224905, "percentage": 50.64, "elapsed_time": "2:21:40", "remaining_time": "2:18:05", "throughput": 2306.72, "total_tokens": 19608176} {"current_steps": 34005, "total_steps": 67140, "loss": 0.6346, "lr": 2.8784616876535673e-05, "epoch": 5.064789991063449, "percentage": 50.65, "elapsed_time": "2:21:41", "remaining_time": "2:18:04", "throughput": 2306.78, "total_tokens": 19611472} {"current_steps": 34010, "total_steps": 67140, "loss": 0.3954, "lr": 2.8778192805465937e-05, "epoch": 5.065534703604409, "percentage": 50.66, "elapsed_time": "2:21:42", "remaining_time": "2:18:02", "throughput": 2306.82, "total_tokens": 19614384} {"current_steps": 34015, "total_steps": 67140, "loss": 0.6253, "lr": 2.8771768479081297e-05, "epoch": 5.066279416145368, "percentage": 50.66, "elapsed_time": "2:21:43", "remaining_time": "2:18:01", "throughput": 2306.83, "total_tokens": 19617104} {"current_steps": 34020, "total_steps": 67140, "loss": 0.6055, "lr": 2.8765343897815867e-05, "epoch": 5.067024128686327, "percentage": 50.67, "elapsed_time": "2:21:45", "remaining_time": "2:18:00", "throughput": 2306.85, "total_tokens": 19619792} {"current_steps": 34025, "total_steps": 67140, "loss": 0.71, "lr": 2.8758919062103817e-05, "epoch": 5.067768841227286, "percentage": 50.68, "elapsed_time": "2:21:46", "remaining_time": "2:17:58", "throughput": 2306.86, "total_tokens": 19622448} {"current_steps": 34030, "total_steps": 67140, "loss": 0.5783, "lr": 2.8752493972379292e-05, "epoch": 5.068513553768246, "percentage": 50.69, "elapsed_time": "2:21:47", "remaining_time": "2:17:57", "throughput": 2306.88, "total_tokens": 19625200} {"current_steps": 34035, "total_steps": 67140, "loss": 0.6187, "lr": 2.8746068629076487e-05, "epoch": 5.0692582663092045, "percentage": 50.69, "elapsed_time": "2:21:48", "remaining_time": "2:17:55", "throughput": 2306.9, "total_tokens": 19627920} {"current_steps": 34040, "total_steps": 67140, "loss": 0.6332, "lr": 2.8739643032629592e-05, "epoch": 5.070002978850164, "percentage": 50.7, "elapsed_time": "2:21:49", "remaining_time": "2:17:54", "throughput": 2306.94, "total_tokens": 19630928} {"current_steps": 34045, "total_steps": 67140, "loss": 0.4929, "lr": 2.8733217183472823e-05, "epoch": 5.070747691391123, "percentage": 50.71, "elapsed_time": "2:21:50", "remaining_time": "2:17:53", "throughput": 2306.97, "total_tokens": 19633744} {"current_steps": 34050, "total_steps": 67140, "loss": 0.6308, "lr": 2.8726791082040416e-05, "epoch": 5.071492403932083, "percentage": 50.71, "elapsed_time": "2:21:51", "remaining_time": "2:17:51", "throughput": 2307.01, "total_tokens": 19636816} {"current_steps": 34055, "total_steps": 67140, "loss": 0.6201, "lr": 2.8720364728766618e-05, "epoch": 5.072237116473041, "percentage": 50.72, "elapsed_time": "2:21:52", "remaining_time": "2:17:50", "throughput": 2307.03, "total_tokens": 19639536} {"current_steps": 34060, "total_steps": 67140, "loss": 0.6833, "lr": 2.8713938124085706e-05, "epoch": 5.072981829014001, "percentage": 50.73, "elapsed_time": "2:21:54", "remaining_time": "2:17:49", "throughput": 2307.05, "total_tokens": 19642256} {"current_steps": 34065, "total_steps": 67140, "loss": 0.6383, "lr": 2.8707511268431947e-05, "epoch": 5.07372654155496, "percentage": 50.74, "elapsed_time": "2:21:55", "remaining_time": "2:17:47", "throughput": 2307.08, "total_tokens": 19645168} {"current_steps": 34070, "total_steps": 67140, "loss": 0.5211, "lr": 2.8701084162239656e-05, "epoch": 5.074471254095919, "percentage": 50.74, "elapsed_time": "2:21:56", "remaining_time": "2:17:46", "throughput": 2307.1, "total_tokens": 19647920} {"current_steps": 34075, "total_steps": 67140, "loss": 0.6392, "lr": 2.8694656805943143e-05, "epoch": 5.075215966636878, "percentage": 50.75, "elapsed_time": "2:21:57", "remaining_time": "2:17:44", "throughput": 2307.1, "total_tokens": 19650480} {"current_steps": 34080, "total_steps": 67140, "loss": 0.5794, "lr": 2.868822919997674e-05, "epoch": 5.075960679177838, "percentage": 50.76, "elapsed_time": "2:21:58", "remaining_time": "2:17:43", "throughput": 2307.14, "total_tokens": 19653488} {"current_steps": 34085, "total_steps": 67140, "loss": 0.6903, "lr": 2.86818013447748e-05, "epoch": 5.0767053917187965, "percentage": 50.77, "elapsed_time": "2:21:59", "remaining_time": "2:17:42", "throughput": 2307.16, "total_tokens": 19656272} {"current_steps": 34090, "total_steps": 67140, "loss": 0.7456, "lr": 2.8675373240771703e-05, "epoch": 5.077450104259755, "percentage": 50.77, "elapsed_time": "2:22:00", "remaining_time": "2:17:40", "throughput": 2307.18, "total_tokens": 19658960} {"current_steps": 34095, "total_steps": 67140, "loss": 0.4993, "lr": 2.8668944888401826e-05, "epoch": 5.078194816800715, "percentage": 50.78, "elapsed_time": "2:22:01", "remaining_time": "2:17:39", "throughput": 2307.2, "total_tokens": 19661680} {"current_steps": 34100, "total_steps": 67140, "loss": 0.7521, "lr": 2.866251628809956e-05, "epoch": 5.078939529341674, "percentage": 50.79, "elapsed_time": "2:22:03", "remaining_time": "2:17:38", "throughput": 2307.22, "total_tokens": 19664528} {"current_steps": 34105, "total_steps": 67140, "loss": 0.667, "lr": 2.8656087440299347e-05, "epoch": 5.079684241882633, "percentage": 50.8, "elapsed_time": "2:22:04", "remaining_time": "2:17:36", "throughput": 2307.25, "total_tokens": 19667344} {"current_steps": 34110, "total_steps": 67140, "loss": 0.5878, "lr": 2.8649658345435597e-05, "epoch": 5.080428954423592, "percentage": 50.8, "elapsed_time": "2:22:05", "remaining_time": "2:17:35", "throughput": 2307.28, "total_tokens": 19670224} {"current_steps": 34115, "total_steps": 67140, "loss": 0.6436, "lr": 2.8643229003942786e-05, "epoch": 5.081173666964552, "percentage": 50.81, "elapsed_time": "2:22:06", "remaining_time": "2:17:34", "throughput": 2307.32, "total_tokens": 19673168} {"current_steps": 34120, "total_steps": 67140, "loss": 0.576, "lr": 2.8636799416255362e-05, "epoch": 5.0819183795055105, "percentage": 50.82, "elapsed_time": "2:22:07", "remaining_time": "2:17:32", "throughput": 2307.33, "total_tokens": 19675856} {"current_steps": 34125, "total_steps": 67140, "loss": 0.6051, "lr": 2.8630369582807824e-05, "epoch": 5.08266309204647, "percentage": 50.83, "elapsed_time": "2:22:08", "remaining_time": "2:17:31", "throughput": 2307.35, "total_tokens": 19678512} {"current_steps": 34130, "total_steps": 67140, "loss": 0.6639, "lr": 2.8623939504034662e-05, "epoch": 5.083407804587429, "percentage": 50.83, "elapsed_time": "2:22:09", "remaining_time": "2:17:29", "throughput": 2307.37, "total_tokens": 19681360} {"current_steps": 34135, "total_steps": 67140, "loss": 0.8386, "lr": 2.8617509180370418e-05, "epoch": 5.084152517128389, "percentage": 50.84, "elapsed_time": "2:22:10", "remaining_time": "2:17:28", "throughput": 2307.4, "total_tokens": 19684272} {"current_steps": 34140, "total_steps": 67140, "loss": 0.5077, "lr": 2.8611078612249598e-05, "epoch": 5.084897229669347, "percentage": 50.85, "elapsed_time": "2:22:12", "remaining_time": "2:17:27", "throughput": 2307.42, "total_tokens": 19686928} {"current_steps": 34145, "total_steps": 67140, "loss": 0.6207, "lr": 2.8604647800106772e-05, "epoch": 5.085641942210307, "percentage": 50.86, "elapsed_time": "2:22:13", "remaining_time": "2:17:25", "throughput": 2307.44, "total_tokens": 19689776} {"current_steps": 34150, "total_steps": 67140, "loss": 0.7102, "lr": 2.85982167443765e-05, "epoch": 5.086386654751266, "percentage": 50.86, "elapsed_time": "2:22:14", "remaining_time": "2:17:24", "throughput": 2307.46, "total_tokens": 19692496} {"current_steps": 34155, "total_steps": 67140, "loss": 0.5944, "lr": 2.8591785445493376e-05, "epoch": 5.087131367292225, "percentage": 50.87, "elapsed_time": "2:22:15", "remaining_time": "2:17:23", "throughput": 2307.5, "total_tokens": 19695472} {"current_steps": 34160, "total_steps": 67140, "loss": 0.5741, "lr": 2.8585353903891986e-05, "epoch": 5.087876079833184, "percentage": 50.88, "elapsed_time": "2:22:16", "remaining_time": "2:17:21", "throughput": 2307.54, "total_tokens": 19698416} {"current_steps": 34165, "total_steps": 67140, "loss": 0.6008, "lr": 2.8578922120006962e-05, "epoch": 5.088620792374144, "percentage": 50.89, "elapsed_time": "2:22:17", "remaining_time": "2:17:20", "throughput": 2307.58, "total_tokens": 19701424} {"current_steps": 34170, "total_steps": 67140, "loss": 0.7422, "lr": 2.857249009427293e-05, "epoch": 5.0893655049151025, "percentage": 50.89, "elapsed_time": "2:22:18", "remaining_time": "2:17:18", "throughput": 2307.62, "total_tokens": 19704432} {"current_steps": 34175, "total_steps": 67140, "loss": 0.6175, "lr": 2.856605782712455e-05, "epoch": 5.090110217456062, "percentage": 50.9, "elapsed_time": "2:22:19", "remaining_time": "2:17:17", "throughput": 2307.64, "total_tokens": 19707216} {"current_steps": 34180, "total_steps": 67140, "loss": 0.4721, "lr": 2.855962531899647e-05, "epoch": 5.090854929997021, "percentage": 50.91, "elapsed_time": "2:22:21", "remaining_time": "2:17:16", "throughput": 2307.67, "total_tokens": 19710032} {"current_steps": 34185, "total_steps": 67140, "loss": 0.6654, "lr": 2.8553192570323385e-05, "epoch": 5.091599642537981, "percentage": 50.92, "elapsed_time": "2:22:22", "remaining_time": "2:17:14", "throughput": 2307.7, "total_tokens": 19712912} {"current_steps": 34190, "total_steps": 67140, "loss": 0.6438, "lr": 2.8546759581539994e-05, "epoch": 5.092344355078939, "percentage": 50.92, "elapsed_time": "2:22:23", "remaining_time": "2:17:13", "throughput": 2307.76, "total_tokens": 19716176} {"current_steps": 34195, "total_steps": 67140, "loss": 0.6327, "lr": 2.8540326353081005e-05, "epoch": 5.093089067619899, "percentage": 50.93, "elapsed_time": "2:22:24", "remaining_time": "2:17:12", "throughput": 2307.79, "total_tokens": 19719120} {"current_steps": 34200, "total_steps": 67140, "loss": 0.6224, "lr": 2.8533892885381164e-05, "epoch": 5.093833780160858, "percentage": 50.94, "elapsed_time": "2:22:25", "remaining_time": "2:17:10", "throughput": 2307.82, "total_tokens": 19721904} {"current_steps": 34205, "total_steps": 67140, "loss": 0.5399, "lr": 2.852745917887521e-05, "epoch": 5.094578492701817, "percentage": 50.95, "elapsed_time": "2:22:26", "remaining_time": "2:17:09", "throughput": 2307.85, "total_tokens": 19724720} {"current_steps": 34210, "total_steps": 67140, "loss": 0.5856, "lr": 2.85210252339979e-05, "epoch": 5.095323205242776, "percentage": 50.95, "elapsed_time": "2:22:27", "remaining_time": "2:17:08", "throughput": 2307.87, "total_tokens": 19727568} {"current_steps": 34215, "total_steps": 67140, "loss": 0.6863, "lr": 2.851459105118402e-05, "epoch": 5.096067917783736, "percentage": 50.96, "elapsed_time": "2:22:29", "remaining_time": "2:17:06", "throughput": 2307.92, "total_tokens": 19730704} {"current_steps": 34220, "total_steps": 67140, "loss": 0.7854, "lr": 2.8508156630868373e-05, "epoch": 5.096812630324695, "percentage": 50.97, "elapsed_time": "2:22:30", "remaining_time": "2:17:05", "throughput": 2307.95, "total_tokens": 19733584} {"current_steps": 34225, "total_steps": 67140, "loss": 0.5414, "lr": 2.8501721973485757e-05, "epoch": 5.097557342865654, "percentage": 50.98, "elapsed_time": "2:22:31", "remaining_time": "2:17:04", "throughput": 2307.97, "total_tokens": 19736304} {"current_steps": 34230, "total_steps": 67140, "loss": 0.5706, "lr": 2.8495287079471012e-05, "epoch": 5.098302055406613, "percentage": 50.98, "elapsed_time": "2:22:32", "remaining_time": "2:17:02", "throughput": 2308.02, "total_tokens": 19739440} {"current_steps": 34235, "total_steps": 67140, "loss": 0.4551, "lr": 2.8488851949258972e-05, "epoch": 5.099046767947573, "percentage": 50.99, "elapsed_time": "2:22:33", "remaining_time": "2:17:01", "throughput": 2308.06, "total_tokens": 19742448} {"current_steps": 34240, "total_steps": 67140, "loss": 0.5731, "lr": 2.848241658328451e-05, "epoch": 5.099791480488531, "percentage": 51.0, "elapsed_time": "2:22:34", "remaining_time": "2:17:00", "throughput": 2308.08, "total_tokens": 19745200} {"current_steps": 34245, "total_steps": 67140, "loss": 0.6828, "lr": 2.8475980981982485e-05, "epoch": 5.100536193029491, "percentage": 51.01, "elapsed_time": "2:22:36", "remaining_time": "2:16:58", "throughput": 2308.14, "total_tokens": 19748528} {"current_steps": 34250, "total_steps": 67140, "loss": 0.7395, "lr": 2.8469545145787796e-05, "epoch": 5.10128090557045, "percentage": 51.01, "elapsed_time": "2:22:37", "remaining_time": "2:16:57", "throughput": 2308.16, "total_tokens": 19751248} {"current_steps": 34255, "total_steps": 67140, "loss": 0.7301, "lr": 2.846310907513536e-05, "epoch": 5.102025618111409, "percentage": 51.02, "elapsed_time": "2:22:38", "remaining_time": "2:16:55", "throughput": 2308.18, "total_tokens": 19753936} {"current_steps": 34260, "total_steps": 67140, "loss": 0.5415, "lr": 2.845667277046009e-05, "epoch": 5.102770330652368, "percentage": 51.03, "elapsed_time": "2:22:39", "remaining_time": "2:16:54", "throughput": 2308.21, "total_tokens": 19756880} {"current_steps": 34265, "total_steps": 67140, "loss": 0.5018, "lr": 2.8450236232196924e-05, "epoch": 5.103515043193327, "percentage": 51.04, "elapsed_time": "2:22:40", "remaining_time": "2:16:53", "throughput": 2308.24, "total_tokens": 19759792} {"current_steps": 34270, "total_steps": 67140, "loss": 0.5835, "lr": 2.844379946078083e-05, "epoch": 5.104259755734287, "percentage": 51.04, "elapsed_time": "2:22:41", "remaining_time": "2:16:51", "throughput": 2308.29, "total_tokens": 19762896} {"current_steps": 34275, "total_steps": 67140, "loss": 0.7512, "lr": 2.843736245664676e-05, "epoch": 5.105004468275245, "percentage": 51.05, "elapsed_time": "2:22:42", "remaining_time": "2:16:50", "throughput": 2308.32, "total_tokens": 19765776} {"current_steps": 34280, "total_steps": 67140, "loss": 0.617, "lr": 2.843092522022972e-05, "epoch": 5.105749180816205, "percentage": 51.06, "elapsed_time": "2:22:43", "remaining_time": "2:16:49", "throughput": 2308.34, "total_tokens": 19768592} {"current_steps": 34285, "total_steps": 67140, "loss": 0.7898, "lr": 2.8424487751964696e-05, "epoch": 5.106493893357164, "percentage": 51.06, "elapsed_time": "2:22:45", "remaining_time": "2:16:47", "throughput": 2308.39, "total_tokens": 19771760} {"current_steps": 34290, "total_steps": 67140, "loss": 0.6767, "lr": 2.8418050052286715e-05, "epoch": 5.107238605898123, "percentage": 51.07, "elapsed_time": "2:22:46", "remaining_time": "2:16:46", "throughput": 2308.41, "total_tokens": 19774480} {"current_steps": 34295, "total_steps": 67140, "loss": 0.6348, "lr": 2.8411612121630804e-05, "epoch": 5.107983318439082, "percentage": 51.08, "elapsed_time": "2:22:47", "remaining_time": "2:16:45", "throughput": 2308.43, "total_tokens": 19777232} {"current_steps": 34300, "total_steps": 67140, "loss": 0.7523, "lr": 2.8405173960432024e-05, "epoch": 5.108728030980042, "percentage": 51.09, "elapsed_time": "2:22:48", "remaining_time": "2:16:43", "throughput": 2308.44, "total_tokens": 19779888} {"current_steps": 34305, "total_steps": 67140, "loss": 0.4294, "lr": 2.8398735569125427e-05, "epoch": 5.109472743521001, "percentage": 51.09, "elapsed_time": "2:22:49", "remaining_time": "2:16:42", "throughput": 2308.47, "total_tokens": 19782736} {"current_steps": 34310, "total_steps": 67140, "loss": 0.5543, "lr": 2.83922969481461e-05, "epoch": 5.11021745606196, "percentage": 51.1, "elapsed_time": "2:22:50", "remaining_time": "2:16:41", "throughput": 2308.5, "total_tokens": 19785552} {"current_steps": 34315, "total_steps": 67140, "loss": 0.4601, "lr": 2.8385858097929135e-05, "epoch": 5.110962168602919, "percentage": 51.11, "elapsed_time": "2:22:51", "remaining_time": "2:16:39", "throughput": 2308.52, "total_tokens": 19788336} {"current_steps": 34320, "total_steps": 67140, "loss": 0.4887, "lr": 2.8379419018909648e-05, "epoch": 5.111706881143879, "percentage": 51.12, "elapsed_time": "2:22:52", "remaining_time": "2:16:38", "throughput": 2308.55, "total_tokens": 19791152} {"current_steps": 34325, "total_steps": 67140, "loss": 0.6129, "lr": 2.8372979711522767e-05, "epoch": 5.112451593684837, "percentage": 51.12, "elapsed_time": "2:22:54", "remaining_time": "2:16:36", "throughput": 2308.56, "total_tokens": 19793776} {"current_steps": 34330, "total_steps": 67140, "loss": 0.5175, "lr": 2.8366540176203625e-05, "epoch": 5.113196306225797, "percentage": 51.13, "elapsed_time": "2:22:55", "remaining_time": "2:16:35", "throughput": 2308.58, "total_tokens": 19796400} {"current_steps": 34335, "total_steps": 67140, "loss": 0.4937, "lr": 2.8360100413387392e-05, "epoch": 5.113941018766756, "percentage": 51.14, "elapsed_time": "2:22:56", "remaining_time": "2:16:34", "throughput": 2308.59, "total_tokens": 19799088} {"current_steps": 34340, "total_steps": 67140, "loss": 0.7938, "lr": 2.8353660423509233e-05, "epoch": 5.114685731307715, "percentage": 51.15, "elapsed_time": "2:22:57", "remaining_time": "2:16:32", "throughput": 2308.62, "total_tokens": 19801872} {"current_steps": 34345, "total_steps": 67140, "loss": 0.7318, "lr": 2.8347220207004325e-05, "epoch": 5.115430443848674, "percentage": 51.15, "elapsed_time": "2:22:58", "remaining_time": "2:16:31", "throughput": 2308.66, "total_tokens": 19804848} {"current_steps": 34350, "total_steps": 67140, "loss": 0.5131, "lr": 2.834077976430789e-05, "epoch": 5.116175156389634, "percentage": 51.16, "elapsed_time": "2:22:59", "remaining_time": "2:16:30", "throughput": 2308.68, "total_tokens": 19807696} {"current_steps": 34355, "total_steps": 67140, "loss": 0.6027, "lr": 2.8334339095855152e-05, "epoch": 5.116919868930593, "percentage": 51.17, "elapsed_time": "2:23:00", "remaining_time": "2:16:28", "throughput": 2308.71, "total_tokens": 19810544} {"current_steps": 34360, "total_steps": 67140, "loss": 0.6598, "lr": 2.8327898202081327e-05, "epoch": 5.117664581471552, "percentage": 51.18, "elapsed_time": "2:23:01", "remaining_time": "2:16:27", "throughput": 2308.73, "total_tokens": 19813200} {"current_steps": 34365, "total_steps": 67140, "loss": 0.8214, "lr": 2.8321457083421665e-05, "epoch": 5.118409294012511, "percentage": 51.18, "elapsed_time": "2:23:02", "remaining_time": "2:16:25", "throughput": 2308.75, "total_tokens": 19815888} {"current_steps": 34370, "total_steps": 67140, "loss": 0.5852, "lr": 2.831501574031145e-05, "epoch": 5.119154006553471, "percentage": 51.19, "elapsed_time": "2:23:04", "remaining_time": "2:16:24", "throughput": 2308.78, "total_tokens": 19818768} {"current_steps": 34375, "total_steps": 67140, "loss": 0.546, "lr": 2.8308574173185943e-05, "epoch": 5.119898719094429, "percentage": 51.2, "elapsed_time": "2:23:05", "remaining_time": "2:16:23", "throughput": 2308.83, "total_tokens": 19822000} {"current_steps": 34380, "total_steps": 67140, "loss": 0.6593, "lr": 2.8302132382480447e-05, "epoch": 5.120643431635389, "percentage": 51.21, "elapsed_time": "2:23:06", "remaining_time": "2:16:21", "throughput": 2308.87, "total_tokens": 19824976} {"current_steps": 34385, "total_steps": 67140, "loss": 0.7231, "lr": 2.8295690368630263e-05, "epoch": 5.121388144176348, "percentage": 51.21, "elapsed_time": "2:23:07", "remaining_time": "2:16:20", "throughput": 2308.91, "total_tokens": 19827952} {"current_steps": 34390, "total_steps": 67140, "loss": 0.7558, "lr": 2.8289248132070727e-05, "epoch": 5.1221328567173074, "percentage": 51.22, "elapsed_time": "2:23:08", "remaining_time": "2:16:19", "throughput": 2308.93, "total_tokens": 19830704} {"current_steps": 34395, "total_steps": 67140, "loss": 0.5998, "lr": 2.828280567323718e-05, "epoch": 5.122877569258266, "percentage": 51.23, "elapsed_time": "2:23:09", "remaining_time": "2:16:17", "throughput": 2308.96, "total_tokens": 19833616} {"current_steps": 34400, "total_steps": 67140, "loss": 0.6559, "lr": 2.827636299256497e-05, "epoch": 5.123622281799226, "percentage": 51.24, "elapsed_time": "2:23:10", "remaining_time": "2:16:16", "throughput": 2308.99, "total_tokens": 19836432} {"current_steps": 34405, "total_steps": 67140, "loss": 0.5399, "lr": 2.826992009048947e-05, "epoch": 5.124366994340185, "percentage": 51.24, "elapsed_time": "2:23:12", "remaining_time": "2:16:14", "throughput": 2308.99, "total_tokens": 19838992} {"current_steps": 34410, "total_steps": 67140, "loss": 0.7266, "lr": 2.8263476967446062e-05, "epoch": 5.125111706881144, "percentage": 51.25, "elapsed_time": "2:23:13", "remaining_time": "2:16:13", "throughput": 2309.02, "total_tokens": 19841840} {"current_steps": 34415, "total_steps": 67140, "loss": 0.6747, "lr": 2.8257033623870145e-05, "epoch": 5.125856419422103, "percentage": 51.26, "elapsed_time": "2:23:14", "remaining_time": "2:16:12", "throughput": 2309.07, "total_tokens": 19844912} {"current_steps": 34420, "total_steps": 67140, "loss": 0.4309, "lr": 2.825059006019715e-05, "epoch": 5.126601131963063, "percentage": 51.27, "elapsed_time": "2:23:15", "remaining_time": "2:16:10", "throughput": 2309.1, "total_tokens": 19847824} {"current_steps": 34425, "total_steps": 67140, "loss": 0.6189, "lr": 2.824414627686249e-05, "epoch": 5.127345844504021, "percentage": 51.27, "elapsed_time": "2:23:16", "remaining_time": "2:16:09", "throughput": 2309.13, "total_tokens": 19850704} {"current_steps": 34430, "total_steps": 67140, "loss": 0.39, "lr": 2.8237702274301602e-05, "epoch": 5.128090557044981, "percentage": 51.28, "elapsed_time": "2:23:17", "remaining_time": "2:16:08", "throughput": 2309.15, "total_tokens": 19853424} {"current_steps": 34435, "total_steps": 67140, "loss": 0.5486, "lr": 2.823125805294997e-05, "epoch": 5.12883526958594, "percentage": 51.29, "elapsed_time": "2:23:18", "remaining_time": "2:16:06", "throughput": 2309.16, "total_tokens": 19856048} {"current_steps": 34440, "total_steps": 67140, "loss": 0.606, "lr": 2.8224813613243062e-05, "epoch": 5.129579982126899, "percentage": 51.3, "elapsed_time": "2:23:20", "remaining_time": "2:16:05", "throughput": 2309.21, "total_tokens": 19859248} {"current_steps": 34445, "total_steps": 67140, "loss": 0.4927, "lr": 2.8218368955616347e-05, "epoch": 5.130324694667858, "percentage": 51.3, "elapsed_time": "2:23:21", "remaining_time": "2:16:04", "throughput": 2309.24, "total_tokens": 19862128} {"current_steps": 34450, "total_steps": 67140, "loss": 0.5279, "lr": 2.8211924080505348e-05, "epoch": 5.131069407208817, "percentage": 51.31, "elapsed_time": "2:23:22", "remaining_time": "2:16:02", "throughput": 2309.25, "total_tokens": 19864720} {"current_steps": 34455, "total_steps": 67140, "loss": 0.6784, "lr": 2.8205478988345584e-05, "epoch": 5.131814119749777, "percentage": 51.32, "elapsed_time": "2:23:23", "remaining_time": "2:16:01", "throughput": 2309.26, "total_tokens": 19867376} {"current_steps": 34460, "total_steps": 67140, "loss": 0.6527, "lr": 2.8199033679572578e-05, "epoch": 5.132558832290735, "percentage": 51.33, "elapsed_time": "2:23:24", "remaining_time": "2:16:00", "throughput": 2309.29, "total_tokens": 19870192} {"current_steps": 34465, "total_steps": 67140, "loss": 0.4948, "lr": 2.819258815462188e-05, "epoch": 5.133303544831695, "percentage": 51.33, "elapsed_time": "2:23:25", "remaining_time": "2:15:58", "throughput": 2309.31, "total_tokens": 19872976} {"current_steps": 34470, "total_steps": 67140, "loss": 0.6005, "lr": 2.8186142413929063e-05, "epoch": 5.134048257372654, "percentage": 51.34, "elapsed_time": "2:23:26", "remaining_time": "2:15:57", "throughput": 2309.33, "total_tokens": 19875664} {"current_steps": 34475, "total_steps": 67140, "loss": 0.5461, "lr": 2.8179696457929684e-05, "epoch": 5.1347929699136134, "percentage": 51.35, "elapsed_time": "2:23:27", "remaining_time": "2:15:55", "throughput": 2309.35, "total_tokens": 19878448} {"current_steps": 34480, "total_steps": 67140, "loss": 0.715, "lr": 2.8173250287059354e-05, "epoch": 5.135537682454572, "percentage": 51.36, "elapsed_time": "2:23:28", "remaining_time": "2:15:54", "throughput": 2309.38, "total_tokens": 19881296} {"current_steps": 34485, "total_steps": 67140, "loss": 0.7529, "lr": 2.816680390175367e-05, "epoch": 5.136282394995532, "percentage": 51.36, "elapsed_time": "2:23:29", "remaining_time": "2:15:53", "throughput": 2309.37, "total_tokens": 19883632} {"current_steps": 34490, "total_steps": 67140, "loss": 0.5662, "lr": 2.8160357302448253e-05, "epoch": 5.137027107536491, "percentage": 51.37, "elapsed_time": "2:23:31", "remaining_time": "2:15:51", "throughput": 2309.41, "total_tokens": 19886640} {"current_steps": 34495, "total_steps": 67140, "loss": 0.6386, "lr": 2.8153910489578734e-05, "epoch": 5.13777182007745, "percentage": 51.38, "elapsed_time": "2:23:32", "remaining_time": "2:15:50", "throughput": 2309.42, "total_tokens": 19889232} {"current_steps": 34500, "total_steps": 67140, "loss": 0.5992, "lr": 2.8147463463580776e-05, "epoch": 5.138516532618409, "percentage": 51.39, "elapsed_time": "2:23:33", "remaining_time": "2:15:48", "throughput": 2309.45, "total_tokens": 19892144} {"current_steps": 34505, "total_steps": 67140, "loss": 0.6914, "lr": 2.8141016224890027e-05, "epoch": 5.139261245159369, "percentage": 51.39, "elapsed_time": "2:23:34", "remaining_time": "2:15:47", "throughput": 2309.49, "total_tokens": 19895120} {"current_steps": 34510, "total_steps": 67140, "loss": 0.6416, "lr": 2.8134568773942172e-05, "epoch": 5.140005957700327, "percentage": 51.4, "elapsed_time": "2:23:35", "remaining_time": "2:15:46", "throughput": 2309.51, "total_tokens": 19897872} {"current_steps": 34515, "total_steps": 67140, "loss": 0.6525, "lr": 2.81281211111729e-05, "epoch": 5.140750670241287, "percentage": 51.41, "elapsed_time": "2:23:36", "remaining_time": "2:15:44", "throughput": 2309.55, "total_tokens": 19900784} {"current_steps": 34520, "total_steps": 67140, "loss": 0.5961, "lr": 2.8121673237017937e-05, "epoch": 5.141495382782246, "percentage": 51.41, "elapsed_time": "2:23:37", "remaining_time": "2:15:43", "throughput": 2309.56, "total_tokens": 19903440} {"current_steps": 34525, "total_steps": 67140, "loss": 0.8104, "lr": 2.8115225151912977e-05, "epoch": 5.1422400953232055, "percentage": 51.42, "elapsed_time": "2:23:39", "remaining_time": "2:15:42", "throughput": 2309.61, "total_tokens": 19906544} {"current_steps": 34530, "total_steps": 67140, "loss": 0.7422, "lr": 2.810877685629376e-05, "epoch": 5.142984807864164, "percentage": 51.43, "elapsed_time": "2:23:40", "remaining_time": "2:15:40", "throughput": 2309.62, "total_tokens": 19909232} {"current_steps": 34535, "total_steps": 67140, "loss": 0.6262, "lr": 2.8102328350596058e-05, "epoch": 5.143729520405124, "percentage": 51.44, "elapsed_time": "2:23:41", "remaining_time": "2:15:39", "throughput": 2309.66, "total_tokens": 19912304} {"current_steps": 34540, "total_steps": 67140, "loss": 0.6883, "lr": 2.809587963525561e-05, "epoch": 5.144474232946083, "percentage": 51.44, "elapsed_time": "2:23:42", "remaining_time": "2:15:38", "throughput": 2309.71, "total_tokens": 19915344} {"current_steps": 34545, "total_steps": 67140, "loss": 0.6695, "lr": 2.8089430710708203e-05, "epoch": 5.145218945487042, "percentage": 51.45, "elapsed_time": "2:23:43", "remaining_time": "2:15:36", "throughput": 2309.74, "total_tokens": 19918256} {"current_steps": 34550, "total_steps": 67140, "loss": 0.4705, "lr": 2.8082981577389627e-05, "epoch": 5.145963658028001, "percentage": 51.46, "elapsed_time": "2:23:44", "remaining_time": "2:15:35", "throughput": 2309.76, "total_tokens": 19921008} {"current_steps": 34555, "total_steps": 67140, "loss": 0.5875, "lr": 2.80765322357357e-05, "epoch": 5.146708370568961, "percentage": 51.47, "elapsed_time": "2:23:45", "remaining_time": "2:15:34", "throughput": 2309.81, "total_tokens": 19924304} {"current_steps": 34560, "total_steps": 67140, "loss": 0.5925, "lr": 2.8070082686182232e-05, "epoch": 5.1474530831099194, "percentage": 51.47, "elapsed_time": "2:23:47", "remaining_time": "2:15:32", "throughput": 2309.85, "total_tokens": 19927216} {"current_steps": 34565, "total_steps": 67140, "loss": 0.6221, "lr": 2.8063632929165047e-05, "epoch": 5.148197795650879, "percentage": 51.48, "elapsed_time": "2:23:48", "remaining_time": "2:15:31", "throughput": 2309.86, "total_tokens": 19929872} {"current_steps": 34570, "total_steps": 67140, "loss": 0.6496, "lr": 2.805718296512001e-05, "epoch": 5.148942508191838, "percentage": 51.49, "elapsed_time": "2:23:49", "remaining_time": "2:15:30", "throughput": 2309.9, "total_tokens": 19932880} {"current_steps": 34575, "total_steps": 67140, "loss": 0.6043, "lr": 2.8050732794482976e-05, "epoch": 5.1496872207327975, "percentage": 51.5, "elapsed_time": "2:23:50", "remaining_time": "2:15:28", "throughput": 2309.94, "total_tokens": 19935920} {"current_steps": 34580, "total_steps": 67140, "loss": 0.7981, "lr": 2.804428241768983e-05, "epoch": 5.150431933273756, "percentage": 51.5, "elapsed_time": "2:23:51", "remaining_time": "2:15:27", "throughput": 2309.96, "total_tokens": 19938640} {"current_steps": 34585, "total_steps": 67140, "loss": 0.8352, "lr": 2.8037831835176454e-05, "epoch": 5.151176645814716, "percentage": 51.51, "elapsed_time": "2:23:52", "remaining_time": "2:15:26", "throughput": 2310.01, "total_tokens": 19941712} {"current_steps": 34590, "total_steps": 67140, "loss": 0.5928, "lr": 2.8031381047378746e-05, "epoch": 5.151921358355675, "percentage": 51.52, "elapsed_time": "2:23:53", "remaining_time": "2:15:24", "throughput": 2310.02, "total_tokens": 19944432} {"current_steps": 34595, "total_steps": 67140, "loss": 0.616, "lr": 2.8024930054732635e-05, "epoch": 5.152666070896634, "percentage": 51.53, "elapsed_time": "2:23:54", "remaining_time": "2:15:23", "throughput": 2310.05, "total_tokens": 19947280} {"current_steps": 34600, "total_steps": 67140, "loss": 0.7174, "lr": 2.8018478857674052e-05, "epoch": 5.153410783437593, "percentage": 51.53, "elapsed_time": "2:23:56", "remaining_time": "2:15:21", "throughput": 2310.09, "total_tokens": 19950256} {"current_steps": 34605, "total_steps": 67140, "loss": 0.6067, "lr": 2.801202745663894e-05, "epoch": 5.154155495978552, "percentage": 51.54, "elapsed_time": "2:23:57", "remaining_time": "2:15:20", "throughput": 2310.14, "total_tokens": 19953360} {"current_steps": 34610, "total_steps": 67140, "loss": 0.4171, "lr": 2.8005575852063252e-05, "epoch": 5.1549002085195115, "percentage": 51.55, "elapsed_time": "2:23:58", "remaining_time": "2:15:19", "throughput": 2310.15, "total_tokens": 19955984} {"current_steps": 34615, "total_steps": 67140, "loss": 0.4352, "lr": 2.7999124044382975e-05, "epoch": 5.15564492106047, "percentage": 51.56, "elapsed_time": "2:23:59", "remaining_time": "2:15:17", "throughput": 2310.18, "total_tokens": 19958896} {"current_steps": 34620, "total_steps": 67140, "loss": 0.6875, "lr": 2.7992672034034096e-05, "epoch": 5.15638963360143, "percentage": 51.56, "elapsed_time": "2:24:00", "remaining_time": "2:15:16", "throughput": 2310.21, "total_tokens": 19961776} {"current_steps": 34625, "total_steps": 67140, "loss": 0.7298, "lr": 2.798621982145259e-05, "epoch": 5.157134346142389, "percentage": 51.57, "elapsed_time": "2:24:01", "remaining_time": "2:15:15", "throughput": 2310.24, "total_tokens": 19964688} {"current_steps": 34630, "total_steps": 67140, "loss": 0.4192, "lr": 2.7979767407074496e-05, "epoch": 5.157879058683348, "percentage": 51.58, "elapsed_time": "2:24:02", "remaining_time": "2:15:13", "throughput": 2310.26, "total_tokens": 19967472} {"current_steps": 34635, "total_steps": 67140, "loss": 0.6267, "lr": 2.7973314791335842e-05, "epoch": 5.158623771224307, "percentage": 51.59, "elapsed_time": "2:24:04", "remaining_time": "2:15:12", "throughput": 2310.3, "total_tokens": 19970384} {"current_steps": 34640, "total_steps": 67140, "loss": 0.5601, "lr": 2.796686197467266e-05, "epoch": 5.159368483765267, "percentage": 51.59, "elapsed_time": "2:24:05", "remaining_time": "2:15:11", "throughput": 2310.35, "total_tokens": 19973648} {"current_steps": 34645, "total_steps": 67140, "loss": 0.4554, "lr": 2.7960408957521005e-05, "epoch": 5.1601131963062254, "percentage": 51.6, "elapsed_time": "2:24:06", "remaining_time": "2:15:09", "throughput": 2310.36, "total_tokens": 19976304} {"current_steps": 34650, "total_steps": 67140, "loss": 0.5575, "lr": 2.7953955740316944e-05, "epoch": 5.160857908847185, "percentage": 51.61, "elapsed_time": "2:24:07", "remaining_time": "2:15:08", "throughput": 2310.4, "total_tokens": 19979248} {"current_steps": 34655, "total_steps": 67140, "loss": 0.6026, "lr": 2.794750232349658e-05, "epoch": 5.161602621388144, "percentage": 51.62, "elapsed_time": "2:24:08", "remaining_time": "2:15:07", "throughput": 2310.43, "total_tokens": 19982160} {"current_steps": 34660, "total_steps": 67140, "loss": 0.5955, "lr": 2.7941048707495982e-05, "epoch": 5.1623473339291035, "percentage": 51.62, "elapsed_time": "2:24:09", "remaining_time": "2:15:05", "throughput": 2310.48, "total_tokens": 19985296} {"current_steps": 34665, "total_steps": 67140, "loss": 0.7616, "lr": 2.793459489275127e-05, "epoch": 5.163092046470062, "percentage": 51.63, "elapsed_time": "2:24:10", "remaining_time": "2:15:04", "throughput": 2310.5, "total_tokens": 19988112} {"current_steps": 34670, "total_steps": 67140, "loss": 0.5987, "lr": 2.7928140879698567e-05, "epoch": 5.163836759011022, "percentage": 51.64, "elapsed_time": "2:24:12", "remaining_time": "2:15:03", "throughput": 2310.54, "total_tokens": 19991152} {"current_steps": 34675, "total_steps": 67140, "loss": 0.4863, "lr": 2.7921686668774005e-05, "epoch": 5.164581471551981, "percentage": 51.65, "elapsed_time": "2:24:13", "remaining_time": "2:15:01", "throughput": 2310.58, "total_tokens": 19994192} {"current_steps": 34680, "total_steps": 67140, "loss": 0.5219, "lr": 2.791523226041374e-05, "epoch": 5.16532618409294, "percentage": 51.65, "elapsed_time": "2:24:14", "remaining_time": "2:15:00", "throughput": 2310.6, "total_tokens": 19996880} {"current_steps": 34685, "total_steps": 67140, "loss": 0.6342, "lr": 2.7908777655053936e-05, "epoch": 5.166070896633899, "percentage": 51.66, "elapsed_time": "2:24:15", "remaining_time": "2:14:59", "throughput": 2310.63, "total_tokens": 19999760} {"current_steps": 34690, "total_steps": 67140, "loss": 0.5942, "lr": 2.7902322853130757e-05, "epoch": 5.166815609174859, "percentage": 51.67, "elapsed_time": "2:24:16", "remaining_time": "2:14:57", "throughput": 2310.67, "total_tokens": 20002704} {"current_steps": 34695, "total_steps": 67140, "loss": 0.4183, "lr": 2.7895867855080405e-05, "epoch": 5.1675603217158175, "percentage": 51.68, "elapsed_time": "2:24:17", "remaining_time": "2:14:56", "throughput": 2310.7, "total_tokens": 20005616} {"current_steps": 34700, "total_steps": 67140, "loss": 0.6839, "lr": 2.7889412661339077e-05, "epoch": 5.168305034256777, "percentage": 51.68, "elapsed_time": "2:24:18", "remaining_time": "2:14:55", "throughput": 2310.75, "total_tokens": 20008720} {"current_steps": 34705, "total_steps": 67140, "loss": 0.6294, "lr": 2.7882957272342986e-05, "epoch": 5.169049746797736, "percentage": 51.69, "elapsed_time": "2:24:20", "remaining_time": "2:14:53", "throughput": 2310.79, "total_tokens": 20011696} {"current_steps": 34710, "total_steps": 67140, "loss": 0.5237, "lr": 2.7876501688528362e-05, "epoch": 5.1697944593386955, "percentage": 51.7, "elapsed_time": "2:24:21", "remaining_time": "2:14:52", "throughput": 2310.83, "total_tokens": 20014736} {"current_steps": 34715, "total_steps": 67140, "loss": 0.502, "lr": 2.7870045910331444e-05, "epoch": 5.170539171879654, "percentage": 51.71, "elapsed_time": "2:24:22", "remaining_time": "2:14:50", "throughput": 2310.86, "total_tokens": 20017616} {"current_steps": 34720, "total_steps": 67140, "loss": 0.7423, "lr": 2.786358993818851e-05, "epoch": 5.171283884420614, "percentage": 51.71, "elapsed_time": "2:24:23", "remaining_time": "2:14:49", "throughput": 2310.9, "total_tokens": 20020624} {"current_steps": 34725, "total_steps": 67140, "loss": 0.7489, "lr": 2.7857133772535798e-05, "epoch": 5.172028596961573, "percentage": 51.72, "elapsed_time": "2:24:24", "remaining_time": "2:14:48", "throughput": 2310.92, "total_tokens": 20023376} {"current_steps": 34730, "total_steps": 67140, "loss": 0.6353, "lr": 2.78506774138096e-05, "epoch": 5.172773309502532, "percentage": 51.73, "elapsed_time": "2:24:25", "remaining_time": "2:14:46", "throughput": 2310.94, "total_tokens": 20026064} {"current_steps": 34735, "total_steps": 67140, "loss": 0.6156, "lr": 2.7844220862446218e-05, "epoch": 5.173518022043491, "percentage": 51.74, "elapsed_time": "2:24:26", "remaining_time": "2:14:45", "throughput": 2310.95, "total_tokens": 20028720} {"current_steps": 34740, "total_steps": 67140, "loss": 0.5807, "lr": 2.7837764118881953e-05, "epoch": 5.174262734584451, "percentage": 51.74, "elapsed_time": "2:24:28", "remaining_time": "2:14:44", "throughput": 2310.98, "total_tokens": 20031632} {"current_steps": 34745, "total_steps": 67140, "loss": 0.5896, "lr": 2.7831307183553122e-05, "epoch": 5.1750074471254095, "percentage": 51.75, "elapsed_time": "2:24:29", "remaining_time": "2:14:42", "throughput": 2310.98, "total_tokens": 20034096} {"current_steps": 34750, "total_steps": 67140, "loss": 0.5804, "lr": 2.782485005689607e-05, "epoch": 5.175752159666369, "percentage": 51.76, "elapsed_time": "2:24:30", "remaining_time": "2:14:41", "throughput": 2310.99, "total_tokens": 20036784} {"current_steps": 34755, "total_steps": 67140, "loss": 0.6648, "lr": 2.7818392739347127e-05, "epoch": 5.176496872207328, "percentage": 51.76, "elapsed_time": "2:24:31", "remaining_time": "2:14:40", "throughput": 2311.02, "total_tokens": 20039664} {"current_steps": 34760, "total_steps": 67140, "loss": 0.7896, "lr": 2.781193523134267e-05, "epoch": 5.1772415847482876, "percentage": 51.77, "elapsed_time": "2:24:32", "remaining_time": "2:14:38", "throughput": 2311.04, "total_tokens": 20042448} {"current_steps": 34765, "total_steps": 67140, "loss": 0.7079, "lr": 2.780547753331906e-05, "epoch": 5.177986297289246, "percentage": 51.78, "elapsed_time": "2:24:33", "remaining_time": "2:14:37", "throughput": 2311.08, "total_tokens": 20045392} {"current_steps": 34770, "total_steps": 67140, "loss": 0.51, "lr": 2.7799019645712682e-05, "epoch": 5.178731009830206, "percentage": 51.79, "elapsed_time": "2:24:34", "remaining_time": "2:14:35", "throughput": 2311.1, "total_tokens": 20048208} {"current_steps": 34775, "total_steps": 67140, "loss": 0.8628, "lr": 2.7792561568959934e-05, "epoch": 5.179475722371165, "percentage": 51.79, "elapsed_time": "2:24:35", "remaining_time": "2:14:34", "throughput": 2311.15, "total_tokens": 20051344} {"current_steps": 34780, "total_steps": 67140, "loss": 0.5583, "lr": 2.778610330349723e-05, "epoch": 5.180220434912124, "percentage": 51.8, "elapsed_time": "2:24:37", "remaining_time": "2:14:33", "throughput": 2311.17, "total_tokens": 20054128} {"current_steps": 34785, "total_steps": 67140, "loss": 0.5468, "lr": 2.7779644849761004e-05, "epoch": 5.180965147453083, "percentage": 51.81, "elapsed_time": "2:24:38", "remaining_time": "2:14:31", "throughput": 2311.2, "total_tokens": 20056976} {"current_steps": 34790, "total_steps": 67140, "loss": 0.6812, "lr": 2.777318620818767e-05, "epoch": 5.181709859994042, "percentage": 51.82, "elapsed_time": "2:24:39", "remaining_time": "2:14:30", "throughput": 2311.23, "total_tokens": 20059824} {"current_steps": 34795, "total_steps": 67140, "loss": 0.5041, "lr": 2.7766727379213686e-05, "epoch": 5.1824545725350015, "percentage": 51.82, "elapsed_time": "2:24:40", "remaining_time": "2:14:29", "throughput": 2311.24, "total_tokens": 20062512} {"current_steps": 34800, "total_steps": 67140, "loss": 0.7264, "lr": 2.7760268363275523e-05, "epoch": 5.18319928507596, "percentage": 51.83, "elapsed_time": "2:24:41", "remaining_time": "2:14:27", "throughput": 2311.28, "total_tokens": 20065424} {"current_steps": 34805, "total_steps": 67140, "loss": 0.5574, "lr": 2.7753809160809642e-05, "epoch": 5.18394399761692, "percentage": 51.84, "elapsed_time": "2:24:42", "remaining_time": "2:14:26", "throughput": 2311.32, "total_tokens": 20068496} {"current_steps": 34810, "total_steps": 67140, "loss": 0.6472, "lr": 2.7747349772252523e-05, "epoch": 5.184688710157879, "percentage": 51.85, "elapsed_time": "2:24:43", "remaining_time": "2:14:25", "throughput": 2311.35, "total_tokens": 20071376} {"current_steps": 34815, "total_steps": 67140, "loss": 0.6334, "lr": 2.7740890198040687e-05, "epoch": 5.185433422698838, "percentage": 51.85, "elapsed_time": "2:24:44", "remaining_time": "2:14:23", "throughput": 2311.38, "total_tokens": 20074288} {"current_steps": 34820, "total_steps": 67140, "loss": 0.6147, "lr": 2.7734430438610637e-05, "epoch": 5.186178135239797, "percentage": 51.86, "elapsed_time": "2:24:46", "remaining_time": "2:14:22", "throughput": 2311.4, "total_tokens": 20077008} {"current_steps": 34825, "total_steps": 67140, "loss": 0.5415, "lr": 2.7727970494398892e-05, "epoch": 5.186922847780757, "percentage": 51.87, "elapsed_time": "2:24:47", "remaining_time": "2:14:21", "throughput": 2311.42, "total_tokens": 20079664} {"current_steps": 34830, "total_steps": 67140, "loss": 0.5591, "lr": 2.772151036584199e-05, "epoch": 5.1876675603217155, "percentage": 51.88, "elapsed_time": "2:24:48", "remaining_time": "2:14:19", "throughput": 2311.44, "total_tokens": 20082448} {"current_steps": 34835, "total_steps": 67140, "loss": 0.5675, "lr": 2.7715050053376484e-05, "epoch": 5.188412272862675, "percentage": 51.88, "elapsed_time": "2:24:49", "remaining_time": "2:14:18", "throughput": 2311.45, "total_tokens": 20085136} {"current_steps": 34840, "total_steps": 67140, "loss": 0.5736, "lr": 2.7708589557438936e-05, "epoch": 5.189156985403634, "percentage": 51.89, "elapsed_time": "2:24:50", "remaining_time": "2:14:16", "throughput": 2311.49, "total_tokens": 20088080} {"current_steps": 34845, "total_steps": 67140, "loss": 0.6648, "lr": 2.7702128878465917e-05, "epoch": 5.1899016979445936, "percentage": 51.9, "elapsed_time": "2:24:51", "remaining_time": "2:14:15", "throughput": 2311.5, "total_tokens": 20090704} {"current_steps": 34850, "total_steps": 67140, "loss": 0.585, "lr": 2.7695668016894017e-05, "epoch": 5.190646410485552, "percentage": 51.91, "elapsed_time": "2:24:52", "remaining_time": "2:14:14", "throughput": 2311.54, "total_tokens": 20093776} {"current_steps": 34855, "total_steps": 67140, "loss": 0.367, "lr": 2.7689206973159825e-05, "epoch": 5.191391123026512, "percentage": 51.91, "elapsed_time": "2:24:53", "remaining_time": "2:14:12", "throughput": 2311.56, "total_tokens": 20096528} {"current_steps": 34860, "total_steps": 67140, "loss": 0.6081, "lr": 2.7682745747699962e-05, "epoch": 5.192135835567471, "percentage": 51.92, "elapsed_time": "2:24:55", "remaining_time": "2:14:11", "throughput": 2311.58, "total_tokens": 20099280} {"current_steps": 34865, "total_steps": 67140, "loss": 0.6238, "lr": 2.7676284340951054e-05, "epoch": 5.19288054810843, "percentage": 51.93, "elapsed_time": "2:24:56", "remaining_time": "2:14:10", "throughput": 2311.6, "total_tokens": 20102064} {"current_steps": 34870, "total_steps": 67140, "loss": 0.5914, "lr": 2.766982275334973e-05, "epoch": 5.193625260649389, "percentage": 51.94, "elapsed_time": "2:24:57", "remaining_time": "2:14:08", "throughput": 2311.65, "total_tokens": 20105296} {"current_steps": 34875, "total_steps": 67140, "loss": 0.783, "lr": 2.7663360985332632e-05, "epoch": 5.194369973190349, "percentage": 51.94, "elapsed_time": "2:24:58", "remaining_time": "2:14:07", "throughput": 2311.68, "total_tokens": 20108144} {"current_steps": 34880, "total_steps": 67140, "loss": 0.634, "lr": 2.7656899037336426e-05, "epoch": 5.1951146857313075, "percentage": 51.95, "elapsed_time": "2:24:59", "remaining_time": "2:14:06", "throughput": 2311.71, "total_tokens": 20111088} {"current_steps": 34885, "total_steps": 67140, "loss": 0.6668, "lr": 2.76504369097978e-05, "epoch": 5.195859398272267, "percentage": 51.96, "elapsed_time": "2:25:00", "remaining_time": "2:14:04", "throughput": 2311.78, "total_tokens": 20114480} {"current_steps": 34890, "total_steps": 67140, "loss": 0.7289, "lr": 2.7643974603153412e-05, "epoch": 5.196604110813226, "percentage": 51.97, "elapsed_time": "2:25:01", "remaining_time": "2:14:03", "throughput": 2311.81, "total_tokens": 20117264} {"current_steps": 34895, "total_steps": 67140, "loss": 0.4904, "lr": 2.763751211783997e-05, "epoch": 5.197348823354186, "percentage": 51.97, "elapsed_time": "2:25:03", "remaining_time": "2:14:02", "throughput": 2311.83, "total_tokens": 20120144} {"current_steps": 34900, "total_steps": 67140, "loss": 0.4602, "lr": 2.7631049454294182e-05, "epoch": 5.198093535895144, "percentage": 51.98, "elapsed_time": "2:25:04", "remaining_time": "2:14:00", "throughput": 2311.85, "total_tokens": 20122896} {"current_steps": 34905, "total_steps": 67140, "loss": 0.676, "lr": 2.7624586612952775e-05, "epoch": 5.198838248436104, "percentage": 51.99, "elapsed_time": "2:25:05", "remaining_time": "2:13:59", "throughput": 2311.9, "total_tokens": 20125968} {"current_steps": 34910, "total_steps": 67140, "loss": 0.5773, "lr": 2.761812359425247e-05, "epoch": 5.199582960977063, "percentage": 52.0, "elapsed_time": "2:25:06", "remaining_time": "2:13:58", "throughput": 2311.9, "total_tokens": 20128528} {"current_steps": 34915, "total_steps": 67140, "loss": 0.6327, "lr": 2.7611660398630025e-05, "epoch": 5.200327673518022, "percentage": 52.0, "elapsed_time": "2:25:07", "remaining_time": "2:13:56", "throughput": 2311.95, "total_tokens": 20131632} {"current_steps": 34920, "total_steps": 67140, "loss": 0.5661, "lr": 2.7605197026522177e-05, "epoch": 5.201072386058981, "percentage": 52.01, "elapsed_time": "2:25:08", "remaining_time": "2:13:55", "throughput": 2311.98, "total_tokens": 20134576} {"current_steps": 34925, "total_steps": 67140, "loss": 0.5583, "lr": 2.7598733478365713e-05, "epoch": 5.201817098599941, "percentage": 52.02, "elapsed_time": "2:25:09", "remaining_time": "2:13:54", "throughput": 2312.03, "total_tokens": 20137584} {"current_steps": 34930, "total_steps": 67140, "loss": 0.5934, "lr": 2.75922697545974e-05, "epoch": 5.2025618111408996, "percentage": 52.03, "elapsed_time": "2:25:11", "remaining_time": "2:13:52", "throughput": 2312.05, "total_tokens": 20140368} {"current_steps": 34935, "total_steps": 67140, "loss": 0.5329, "lr": 2.7585805855654045e-05, "epoch": 5.203306523681859, "percentage": 52.03, "elapsed_time": "2:25:12", "remaining_time": "2:13:51", "throughput": 2312.07, "total_tokens": 20143152} {"current_steps": 34940, "total_steps": 67140, "loss": 0.5417, "lr": 2.7579341781972436e-05, "epoch": 5.204051236222818, "percentage": 52.04, "elapsed_time": "2:25:13", "remaining_time": "2:13:49", "throughput": 2312.07, "total_tokens": 20145616} {"current_steps": 34945, "total_steps": 67140, "loss": 0.5703, "lr": 2.75728775339894e-05, "epoch": 5.204795948763778, "percentage": 52.05, "elapsed_time": "2:25:14", "remaining_time": "2:13:48", "throughput": 2312.09, "total_tokens": 20148432} {"current_steps": 34950, "total_steps": 67140, "loss": 0.5818, "lr": 2.7566413112141765e-05, "epoch": 5.205540661304736, "percentage": 52.06, "elapsed_time": "2:25:15", "remaining_time": "2:13:47", "throughput": 2312.11, "total_tokens": 20151152} {"current_steps": 34955, "total_steps": 67140, "loss": 0.6117, "lr": 2.7559948516866357e-05, "epoch": 5.206285373845695, "percentage": 52.06, "elapsed_time": "2:25:16", "remaining_time": "2:13:45", "throughput": 2312.12, "total_tokens": 20153808} {"current_steps": 34960, "total_steps": 67140, "loss": 0.4815, "lr": 2.755348374860004e-05, "epoch": 5.207030086386655, "percentage": 52.07, "elapsed_time": "2:25:17", "remaining_time": "2:13:44", "throughput": 2312.19, "total_tokens": 20157136} {"current_steps": 34965, "total_steps": 67140, "loss": 0.6006, "lr": 2.7547018807779673e-05, "epoch": 5.2077747989276135, "percentage": 52.08, "elapsed_time": "2:25:18", "remaining_time": "2:13:43", "throughput": 2312.22, "total_tokens": 20160144} {"current_steps": 34970, "total_steps": 67140, "loss": 0.5565, "lr": 2.7540553694842136e-05, "epoch": 5.208519511468573, "percentage": 52.09, "elapsed_time": "2:25:20", "remaining_time": "2:13:41", "throughput": 2312.24, "total_tokens": 20162896} {"current_steps": 34975, "total_steps": 67140, "loss": 0.7128, "lr": 2.7534088410224302e-05, "epoch": 5.209264224009532, "percentage": 52.09, "elapsed_time": "2:25:21", "remaining_time": "2:13:40", "throughput": 2312.31, "total_tokens": 20166320} {"current_steps": 34980, "total_steps": 67140, "loss": 0.5567, "lr": 2.7527622954363074e-05, "epoch": 5.210008936550492, "percentage": 52.1, "elapsed_time": "2:25:22", "remaining_time": "2:13:39", "throughput": 2312.34, "total_tokens": 20169168} {"current_steps": 34985, "total_steps": 67140, "loss": 0.5998, "lr": 2.752115732769538e-05, "epoch": 5.21075364909145, "percentage": 52.11, "elapsed_time": "2:25:23", "remaining_time": "2:13:37", "throughput": 2312.36, "total_tokens": 20171984} {"current_steps": 34990, "total_steps": 67140, "loss": 0.595, "lr": 2.7514691530658103e-05, "epoch": 5.21149836163241, "percentage": 52.11, "elapsed_time": "2:25:24", "remaining_time": "2:13:36", "throughput": 2312.38, "total_tokens": 20174800} {"current_steps": 34995, "total_steps": 67140, "loss": 0.6897, "lr": 2.7508225563688206e-05, "epoch": 5.212243074173369, "percentage": 52.12, "elapsed_time": "2:25:25", "remaining_time": "2:13:35", "throughput": 2312.43, "total_tokens": 20177808} {"current_steps": 35000, "total_steps": 67140, "loss": 0.5833, "lr": 2.750175942722262e-05, "epoch": 5.212987786714328, "percentage": 52.13, "elapsed_time": "2:25:26", "remaining_time": "2:13:33", "throughput": 2312.47, "total_tokens": 20180848} {"current_steps": 35005, "total_steps": 67140, "loss": 0.6971, "lr": 2.749529312169831e-05, "epoch": 5.213732499255287, "percentage": 52.14, "elapsed_time": "2:25:28", "remaining_time": "2:13:32", "throughput": 2312.5, "total_tokens": 20183792} {"current_steps": 35010, "total_steps": 67140, "loss": 0.7659, "lr": 2.748882664755223e-05, "epoch": 5.214477211796247, "percentage": 52.14, "elapsed_time": "2:25:29", "remaining_time": "2:13:31", "throughput": 2312.51, "total_tokens": 20186448} {"current_steps": 35015, "total_steps": 67140, "loss": 0.6266, "lr": 2.748236000522137e-05, "epoch": 5.2152219243372056, "percentage": 52.15, "elapsed_time": "2:25:30", "remaining_time": "2:13:29", "throughput": 2312.53, "total_tokens": 20189200} {"current_steps": 35020, "total_steps": 67140, "loss": 0.6467, "lr": 2.7475893195142706e-05, "epoch": 5.215966636878165, "percentage": 52.16, "elapsed_time": "2:25:31", "remaining_time": "2:13:28", "throughput": 2312.57, "total_tokens": 20192080} {"current_steps": 35025, "total_steps": 67140, "loss": 0.5414, "lr": 2.746942621775325e-05, "epoch": 5.216711349419124, "percentage": 52.17, "elapsed_time": "2:25:32", "remaining_time": "2:13:27", "throughput": 2312.6, "total_tokens": 20195024} {"current_steps": 35030, "total_steps": 67140, "loss": 0.6628, "lr": 2.7462959073490007e-05, "epoch": 5.217456061960084, "percentage": 52.17, "elapsed_time": "2:25:33", "remaining_time": "2:13:25", "throughput": 2312.64, "total_tokens": 20198160} {"current_steps": 35035, "total_steps": 67140, "loss": 0.8527, "lr": 2.745649176279001e-05, "epoch": 5.218200774501042, "percentage": 52.18, "elapsed_time": "2:25:34", "remaining_time": "2:13:24", "throughput": 2312.69, "total_tokens": 20201296} {"current_steps": 35040, "total_steps": 67140, "loss": 0.6904, "lr": 2.7450024286090283e-05, "epoch": 5.218945487042002, "percentage": 52.19, "elapsed_time": "2:25:36", "remaining_time": "2:13:23", "throughput": 2312.72, "total_tokens": 20204176} {"current_steps": 35045, "total_steps": 67140, "loss": 0.5637, "lr": 2.7443556643827872e-05, "epoch": 5.219690199582961, "percentage": 52.2, "elapsed_time": "2:25:37", "remaining_time": "2:13:21", "throughput": 2312.75, "total_tokens": 20207024} {"current_steps": 35050, "total_steps": 67140, "loss": 0.6997, "lr": 2.7437088836439844e-05, "epoch": 5.22043491212392, "percentage": 52.2, "elapsed_time": "2:25:38", "remaining_time": "2:13:20", "throughput": 2312.78, "total_tokens": 20209968} {"current_steps": 35055, "total_steps": 67140, "loss": 0.6449, "lr": 2.7430620864363254e-05, "epoch": 5.221179624664879, "percentage": 52.21, "elapsed_time": "2:25:39", "remaining_time": "2:13:19", "throughput": 2312.82, "total_tokens": 20212944} {"current_steps": 35060, "total_steps": 67140, "loss": 0.6079, "lr": 2.7424152728035192e-05, "epoch": 5.221924337205839, "percentage": 52.22, "elapsed_time": "2:25:40", "remaining_time": "2:13:17", "throughput": 2312.84, "total_tokens": 20215760} {"current_steps": 35065, "total_steps": 67140, "loss": 0.5246, "lr": 2.7417684427892747e-05, "epoch": 5.222669049746798, "percentage": 52.23, "elapsed_time": "2:25:41", "remaining_time": "2:13:16", "throughput": 2312.86, "total_tokens": 20218512} {"current_steps": 35070, "total_steps": 67140, "loss": 0.5178, "lr": 2.741121596437302e-05, "epoch": 5.223413762287757, "percentage": 52.23, "elapsed_time": "2:25:42", "remaining_time": "2:13:15", "throughput": 2312.89, "total_tokens": 20221360} {"current_steps": 35075, "total_steps": 67140, "loss": 0.6225, "lr": 2.7404747337913116e-05, "epoch": 5.224158474828716, "percentage": 52.24, "elapsed_time": "2:25:44", "remaining_time": "2:13:13", "throughput": 2312.94, "total_tokens": 20224528} {"current_steps": 35080, "total_steps": 67140, "loss": 0.7111, "lr": 2.739827854895017e-05, "epoch": 5.224903187369676, "percentage": 52.25, "elapsed_time": "2:25:45", "remaining_time": "2:13:12", "throughput": 2312.98, "total_tokens": 20227472} {"current_steps": 35085, "total_steps": 67140, "loss": 0.8454, "lr": 2.73918095979213e-05, "epoch": 5.225647899910634, "percentage": 52.26, "elapsed_time": "2:25:46", "remaining_time": "2:13:10", "throughput": 2313.0, "total_tokens": 20230320} {"current_steps": 35090, "total_steps": 67140, "loss": 0.6644, "lr": 2.7385340485263667e-05, "epoch": 5.226392612451594, "percentage": 52.26, "elapsed_time": "2:25:47", "remaining_time": "2:13:09", "throughput": 2313.06, "total_tokens": 20233616} {"current_steps": 35095, "total_steps": 67140, "loss": 0.5522, "lr": 2.737887121141442e-05, "epoch": 5.227137324992553, "percentage": 52.27, "elapsed_time": "2:25:48", "remaining_time": "2:13:08", "throughput": 2313.09, "total_tokens": 20236432} {"current_steps": 35100, "total_steps": 67140, "loss": 0.6882, "lr": 2.7372401776810736e-05, "epoch": 5.227882037533512, "percentage": 52.28, "elapsed_time": "2:25:49", "remaining_time": "2:13:07", "throughput": 2313.13, "total_tokens": 20239440} {"current_steps": 35105, "total_steps": 67140, "loss": 0.575, "lr": 2.736593218188978e-05, "epoch": 5.228626750074471, "percentage": 52.29, "elapsed_time": "2:25:50", "remaining_time": "2:13:05", "throughput": 2313.17, "total_tokens": 20242512} {"current_steps": 35110, "total_steps": 67140, "loss": 0.6907, "lr": 2.7359462427088744e-05, "epoch": 5.229371462615431, "percentage": 52.29, "elapsed_time": "2:25:52", "remaining_time": "2:13:04", "throughput": 2313.23, "total_tokens": 20245680} {"current_steps": 35115, "total_steps": 67140, "loss": 0.545, "lr": 2.7352992512844838e-05, "epoch": 5.23011617515639, "percentage": 52.3, "elapsed_time": "2:25:53", "remaining_time": "2:13:03", "throughput": 2313.25, "total_tokens": 20248560} {"current_steps": 35120, "total_steps": 67140, "loss": 0.5894, "lr": 2.7346522439595256e-05, "epoch": 5.230860887697349, "percentage": 52.31, "elapsed_time": "2:25:54", "remaining_time": "2:13:01", "throughput": 2313.29, "total_tokens": 20251504} {"current_steps": 35125, "total_steps": 67140, "loss": 0.5438, "lr": 2.7340052207777234e-05, "epoch": 5.231605600238308, "percentage": 52.32, "elapsed_time": "2:25:55", "remaining_time": "2:13:00", "throughput": 2313.3, "total_tokens": 20254128} {"current_steps": 35130, "total_steps": 67140, "loss": 0.6742, "lr": 2.733358181782799e-05, "epoch": 5.232350312779268, "percentage": 52.32, "elapsed_time": "2:25:56", "remaining_time": "2:12:58", "throughput": 2313.33, "total_tokens": 20256976} {"current_steps": 35135, "total_steps": 67140, "loss": 0.5807, "lr": 2.732711127018478e-05, "epoch": 5.233095025320226, "percentage": 52.33, "elapsed_time": "2:25:57", "remaining_time": "2:12:57", "throughput": 2313.35, "total_tokens": 20259760} {"current_steps": 35140, "total_steps": 67140, "loss": 0.6981, "lr": 2.732064056528485e-05, "epoch": 5.233839737861185, "percentage": 52.34, "elapsed_time": "2:25:58", "remaining_time": "2:12:56", "throughput": 2313.39, "total_tokens": 20262864} {"current_steps": 35145, "total_steps": 67140, "loss": 0.5461, "lr": 2.7314169703565467e-05, "epoch": 5.234584450402145, "percentage": 52.35, "elapsed_time": "2:26:00", "remaining_time": "2:12:54", "throughput": 2313.43, "total_tokens": 20265904} {"current_steps": 35150, "total_steps": 67140, "loss": 0.5057, "lr": 2.7307698685463907e-05, "epoch": 5.235329162943104, "percentage": 52.35, "elapsed_time": "2:26:01", "remaining_time": "2:12:53", "throughput": 2313.48, "total_tokens": 20268976} {"current_steps": 35155, "total_steps": 67140, "loss": 0.6636, "lr": 2.730122751141745e-05, "epoch": 5.236073875484063, "percentage": 52.36, "elapsed_time": "2:26:02", "remaining_time": "2:12:52", "throughput": 2313.51, "total_tokens": 20271856} {"current_steps": 35160, "total_steps": 67140, "loss": 0.6682, "lr": 2.729475618186339e-05, "epoch": 5.236818588025022, "percentage": 52.37, "elapsed_time": "2:26:03", "remaining_time": "2:12:50", "throughput": 2313.55, "total_tokens": 20274832} {"current_steps": 35165, "total_steps": 67140, "loss": 0.5803, "lr": 2.728828469723904e-05, "epoch": 5.237563300565982, "percentage": 52.38, "elapsed_time": "2:26:04", "remaining_time": "2:12:49", "throughput": 2313.55, "total_tokens": 20277424} {"current_steps": 35170, "total_steps": 67140, "loss": 0.6032, "lr": 2.7281813057981715e-05, "epoch": 5.23830801310694, "percentage": 52.38, "elapsed_time": "2:26:05", "remaining_time": "2:12:48", "throughput": 2313.6, "total_tokens": 20280528} {"current_steps": 35175, "total_steps": 67140, "loss": 0.672, "lr": 2.7275341264528737e-05, "epoch": 5.2390527256479, "percentage": 52.39, "elapsed_time": "2:26:06", "remaining_time": "2:12:46", "throughput": 2313.62, "total_tokens": 20283344} {"current_steps": 35180, "total_steps": 67140, "loss": 0.5674, "lr": 2.7268869317317452e-05, "epoch": 5.239797438188859, "percentage": 52.4, "elapsed_time": "2:26:08", "remaining_time": "2:12:45", "throughput": 2313.63, "total_tokens": 20286032} {"current_steps": 35185, "total_steps": 67140, "loss": 0.5081, "lr": 2.72623972167852e-05, "epoch": 5.240542150729818, "percentage": 52.41, "elapsed_time": "2:26:09", "remaining_time": "2:12:44", "throughput": 2313.67, "total_tokens": 20289040} {"current_steps": 35190, "total_steps": 67140, "loss": 0.5196, "lr": 2.7255924963369345e-05, "epoch": 5.241286863270777, "percentage": 52.41, "elapsed_time": "2:26:10", "remaining_time": "2:12:42", "throughput": 2313.71, "total_tokens": 20292016} {"current_steps": 35195, "total_steps": 67140, "loss": 0.5551, "lr": 2.7249452557507243e-05, "epoch": 5.242031575811737, "percentage": 52.42, "elapsed_time": "2:26:11", "remaining_time": "2:12:41", "throughput": 2313.74, "total_tokens": 20294864} {"current_steps": 35200, "total_steps": 67140, "loss": 0.6629, "lr": 2.7242979999636296e-05, "epoch": 5.242776288352696, "percentage": 52.43, "elapsed_time": "2:26:12", "remaining_time": "2:12:40", "throughput": 2313.77, "total_tokens": 20297808} {"current_steps": 35205, "total_steps": 67140, "loss": 0.5236, "lr": 2.7236507290193876e-05, "epoch": 5.243521000893655, "percentage": 52.44, "elapsed_time": "2:26:13", "remaining_time": "2:12:38", "throughput": 2313.81, "total_tokens": 20300752} {"current_steps": 35210, "total_steps": 67140, "loss": 0.5217, "lr": 2.7230034429617386e-05, "epoch": 5.244265713434614, "percentage": 52.44, "elapsed_time": "2:26:14", "remaining_time": "2:12:37", "throughput": 2313.84, "total_tokens": 20303696} {"current_steps": 35215, "total_steps": 67140, "loss": 0.4805, "lr": 2.7223561418344234e-05, "epoch": 5.245010425975574, "percentage": 52.45, "elapsed_time": "2:26:15", "remaining_time": "2:12:36", "throughput": 2313.85, "total_tokens": 20306320} {"current_steps": 35220, "total_steps": 67140, "loss": 0.6993, "lr": 2.721708825681184e-05, "epoch": 5.245755138516532, "percentage": 52.46, "elapsed_time": "2:26:17", "remaining_time": "2:12:34", "throughput": 2313.89, "total_tokens": 20309360} {"current_steps": 35225, "total_steps": 67140, "loss": 0.6311, "lr": 2.7210614945457642e-05, "epoch": 5.246499851057492, "percentage": 52.46, "elapsed_time": "2:26:18", "remaining_time": "2:12:33", "throughput": 2313.92, "total_tokens": 20312176} {"current_steps": 35230, "total_steps": 67140, "loss": 0.6815, "lr": 2.7204141484719064e-05, "epoch": 5.247244563598451, "percentage": 52.47, "elapsed_time": "2:26:19", "remaining_time": "2:12:32", "throughput": 2313.94, "total_tokens": 20314960} {"current_steps": 35235, "total_steps": 67140, "loss": 0.6634, "lr": 2.719766787503357e-05, "epoch": 5.2479892761394105, "percentage": 52.48, "elapsed_time": "2:26:20", "remaining_time": "2:12:30", "throughput": 2313.96, "total_tokens": 20317808} {"current_steps": 35240, "total_steps": 67140, "loss": 0.5173, "lr": 2.719119411683862e-05, "epoch": 5.248733988680369, "percentage": 52.49, "elapsed_time": "2:26:21", "remaining_time": "2:12:29", "throughput": 2313.99, "total_tokens": 20320624} {"current_steps": 35245, "total_steps": 67140, "loss": 0.5116, "lr": 2.7184720210571678e-05, "epoch": 5.249478701221329, "percentage": 52.49, "elapsed_time": "2:26:22", "remaining_time": "2:12:28", "throughput": 2314.03, "total_tokens": 20323728} {"current_steps": 35250, "total_steps": 67140, "loss": 0.6882, "lr": 2.717824615667023e-05, "epoch": 5.250223413762288, "percentage": 52.5, "elapsed_time": "2:26:23", "remaining_time": "2:12:26", "throughput": 2314.07, "total_tokens": 20326768} {"current_steps": 35255, "total_steps": 67140, "loss": 0.6211, "lr": 2.7171771955571756e-05, "epoch": 5.250968126303247, "percentage": 52.51, "elapsed_time": "2:26:25", "remaining_time": "2:12:25", "throughput": 2314.12, "total_tokens": 20329872} {"current_steps": 35260, "total_steps": 67140, "loss": 0.5221, "lr": 2.7165297607713763e-05, "epoch": 5.251712838844206, "percentage": 52.52, "elapsed_time": "2:26:26", "remaining_time": "2:12:24", "throughput": 2314.14, "total_tokens": 20332720} {"current_steps": 35265, "total_steps": 67140, "loss": 0.8271, "lr": 2.715882311353377e-05, "epoch": 5.252457551385166, "percentage": 52.52, "elapsed_time": "2:26:27", "remaining_time": "2:12:22", "throughput": 2314.17, "total_tokens": 20335632} {"current_steps": 35270, "total_steps": 67140, "loss": 0.6257, "lr": 2.7152348473469285e-05, "epoch": 5.253202263926124, "percentage": 52.53, "elapsed_time": "2:26:28", "remaining_time": "2:12:21", "throughput": 2314.21, "total_tokens": 20338576} {"current_steps": 35275, "total_steps": 67140, "loss": 0.7563, "lr": 2.7145873687957835e-05, "epoch": 5.253946976467084, "percentage": 52.54, "elapsed_time": "2:26:29", "remaining_time": "2:12:20", "throughput": 2314.28, "total_tokens": 20342256} {"current_steps": 35280, "total_steps": 67140, "loss": 0.7904, "lr": 2.7139398757436968e-05, "epoch": 5.254691689008043, "percentage": 52.55, "elapsed_time": "2:26:31", "remaining_time": "2:12:18", "throughput": 2314.32, "total_tokens": 20345264} {"current_steps": 35285, "total_steps": 67140, "loss": 0.6645, "lr": 2.7132923682344235e-05, "epoch": 5.2554364015490025, "percentage": 52.55, "elapsed_time": "2:26:32", "remaining_time": "2:12:17", "throughput": 2314.36, "total_tokens": 20348336} {"current_steps": 35290, "total_steps": 67140, "loss": 0.6238, "lr": 2.7126448463117188e-05, "epoch": 5.256181114089961, "percentage": 52.56, "elapsed_time": "2:26:33", "remaining_time": "2:12:16", "throughput": 2314.39, "total_tokens": 20351216} {"current_steps": 35295, "total_steps": 67140, "loss": 0.5619, "lr": 2.7119973100193397e-05, "epoch": 5.256925826630921, "percentage": 52.57, "elapsed_time": "2:26:34", "remaining_time": "2:12:14", "throughput": 2314.41, "total_tokens": 20354032} {"current_steps": 35300, "total_steps": 67140, "loss": 0.6643, "lr": 2.7113497594010452e-05, "epoch": 5.25767053917188, "percentage": 52.58, "elapsed_time": "2:26:35", "remaining_time": "2:12:13", "throughput": 2314.43, "total_tokens": 20356752} {"current_steps": 35305, "total_steps": 67140, "loss": 0.5045, "lr": 2.710702194500593e-05, "epoch": 5.258415251712838, "percentage": 52.58, "elapsed_time": "2:26:36", "remaining_time": "2:12:12", "throughput": 2314.46, "total_tokens": 20359696} {"current_steps": 35310, "total_steps": 67140, "loss": 0.6442, "lr": 2.7100546153617423e-05, "epoch": 5.259159964253798, "percentage": 52.59, "elapsed_time": "2:26:37", "remaining_time": "2:12:10", "throughput": 2314.49, "total_tokens": 20362512} {"current_steps": 35315, "total_steps": 67140, "loss": 0.5178, "lr": 2.7094070220282553e-05, "epoch": 5.259904676794757, "percentage": 52.6, "elapsed_time": "2:26:38", "remaining_time": "2:12:09", "throughput": 2314.5, "total_tokens": 20365200} {"current_steps": 35320, "total_steps": 67140, "loss": 0.6175, "lr": 2.7087594145438926e-05, "epoch": 5.2606493893357165, "percentage": 52.61, "elapsed_time": "2:26:40", "remaining_time": "2:12:08", "throughput": 2314.53, "total_tokens": 20368016} {"current_steps": 35325, "total_steps": 67140, "loss": 0.5616, "lr": 2.7081117929524185e-05, "epoch": 5.261394101876675, "percentage": 52.61, "elapsed_time": "2:26:41", "remaining_time": "2:12:06", "throughput": 2314.56, "total_tokens": 20370928} {"current_steps": 35330, "total_steps": 67140, "loss": 0.7322, "lr": 2.7074641572975944e-05, "epoch": 5.262138814417635, "percentage": 52.62, "elapsed_time": "2:26:42", "remaining_time": "2:12:05", "throughput": 2314.61, "total_tokens": 20374160} {"current_steps": 35335, "total_steps": 67140, "loss": 0.5775, "lr": 2.7068165076231865e-05, "epoch": 5.262883526958594, "percentage": 52.63, "elapsed_time": "2:26:43", "remaining_time": "2:12:04", "throughput": 2314.65, "total_tokens": 20377200} {"current_steps": 35340, "total_steps": 67140, "loss": 0.5677, "lr": 2.7061688439729598e-05, "epoch": 5.263628239499553, "percentage": 52.64, "elapsed_time": "2:26:44", "remaining_time": "2:12:02", "throughput": 2314.68, "total_tokens": 20380112} {"current_steps": 35345, "total_steps": 67140, "loss": 0.665, "lr": 2.7055211663906814e-05, "epoch": 5.264372952040512, "percentage": 52.64, "elapsed_time": "2:26:45", "remaining_time": "2:12:01", "throughput": 2314.72, "total_tokens": 20383056} {"current_steps": 35350, "total_steps": 67140, "loss": 0.5102, "lr": 2.704873474920118e-05, "epoch": 5.265117664581472, "percentage": 52.65, "elapsed_time": "2:26:47", "remaining_time": "2:12:00", "throughput": 2314.75, "total_tokens": 20386032} {"current_steps": 35355, "total_steps": 67140, "loss": 0.6485, "lr": 2.7042257696050377e-05, "epoch": 5.26586237712243, "percentage": 52.66, "elapsed_time": "2:26:48", "remaining_time": "2:11:58", "throughput": 2314.79, "total_tokens": 20389040} {"current_steps": 35360, "total_steps": 67140, "loss": 0.5262, "lr": 2.70357805048921e-05, "epoch": 5.26660708966339, "percentage": 52.67, "elapsed_time": "2:26:49", "remaining_time": "2:11:57", "throughput": 2314.82, "total_tokens": 20392016} {"current_steps": 35365, "total_steps": 67140, "loss": 0.5405, "lr": 2.7029303176164066e-05, "epoch": 5.267351802204349, "percentage": 52.67, "elapsed_time": "2:26:50", "remaining_time": "2:11:56", "throughput": 2314.85, "total_tokens": 20394960} {"current_steps": 35370, "total_steps": 67140, "loss": 0.5284, "lr": 2.702282571030396e-05, "epoch": 5.2680965147453085, "percentage": 52.68, "elapsed_time": "2:26:51", "remaining_time": "2:11:54", "throughput": 2314.88, "total_tokens": 20397712} {"current_steps": 35375, "total_steps": 67140, "loss": 0.4904, "lr": 2.7016348107749522e-05, "epoch": 5.268841227286267, "percentage": 52.69, "elapsed_time": "2:26:52", "remaining_time": "2:11:53", "throughput": 2314.9, "total_tokens": 20400528} {"current_steps": 35380, "total_steps": 67140, "loss": 0.601, "lr": 2.7009870368938477e-05, "epoch": 5.269585939827227, "percentage": 52.7, "elapsed_time": "2:26:53", "remaining_time": "2:11:51", "throughput": 2314.91, "total_tokens": 20403120} {"current_steps": 35385, "total_steps": 67140, "loss": 0.6199, "lr": 2.700339249430856e-05, "epoch": 5.270330652368186, "percentage": 52.7, "elapsed_time": "2:26:54", "remaining_time": "2:11:50", "throughput": 2314.95, "total_tokens": 20406224} {"current_steps": 35390, "total_steps": 67140, "loss": 0.6098, "lr": 2.6996914484297532e-05, "epoch": 5.271075364909145, "percentage": 52.71, "elapsed_time": "2:26:56", "remaining_time": "2:11:49", "throughput": 2314.97, "total_tokens": 20408944} {"current_steps": 35395, "total_steps": 67140, "loss": 0.5424, "lr": 2.6990436339343134e-05, "epoch": 5.271820077450104, "percentage": 52.72, "elapsed_time": "2:26:57", "remaining_time": "2:11:47", "throughput": 2315.0, "total_tokens": 20411888} {"current_steps": 35400, "total_steps": 67140, "loss": 0.6345, "lr": 2.6983958059883145e-05, "epoch": 5.272564789991064, "percentage": 52.73, "elapsed_time": "2:26:58", "remaining_time": "2:11:46", "throughput": 2315.02, "total_tokens": 20414672} {"current_steps": 35405, "total_steps": 67140, "loss": 0.7741, "lr": 2.697747964635533e-05, "epoch": 5.2733095025320225, "percentage": 52.73, "elapsed_time": "2:26:59", "remaining_time": "2:11:45", "throughput": 2315.06, "total_tokens": 20417616} {"current_steps": 35410, "total_steps": 67140, "loss": 0.7197, "lr": 2.697100109919749e-05, "epoch": 5.274054215072982, "percentage": 52.74, "elapsed_time": "2:27:00", "remaining_time": "2:11:43", "throughput": 2315.08, "total_tokens": 20420368} {"current_steps": 35415, "total_steps": 67140, "loss": 0.5326, "lr": 2.696452241884741e-05, "epoch": 5.274798927613941, "percentage": 52.75, "elapsed_time": "2:27:01", "remaining_time": "2:11:42", "throughput": 2315.12, "total_tokens": 20423440} {"current_steps": 35420, "total_steps": 67140, "loss": 0.4858, "lr": 2.6958043605742882e-05, "epoch": 5.2755436401549005, "percentage": 52.76, "elapsed_time": "2:27:02", "remaining_time": "2:11:41", "throughput": 2315.13, "total_tokens": 20425968} {"current_steps": 35425, "total_steps": 67140, "loss": 0.5214, "lr": 2.695156466032173e-05, "epoch": 5.276288352695859, "percentage": 52.76, "elapsed_time": "2:27:03", "remaining_time": "2:11:39", "throughput": 2315.15, "total_tokens": 20428816} {"current_steps": 35430, "total_steps": 67140, "loss": 0.5209, "lr": 2.6945085583021783e-05, "epoch": 5.277033065236819, "percentage": 52.77, "elapsed_time": "2:27:05", "remaining_time": "2:11:38", "throughput": 2315.17, "total_tokens": 20431536} {"current_steps": 35435, "total_steps": 67140, "loss": 0.6195, "lr": 2.693860637428085e-05, "epoch": 5.277777777777778, "percentage": 52.78, "elapsed_time": "2:27:06", "remaining_time": "2:11:37", "throughput": 2315.21, "total_tokens": 20434704} {"current_steps": 35440, "total_steps": 67140, "loss": 0.6296, "lr": 2.693212703453678e-05, "epoch": 5.278522490318737, "percentage": 52.79, "elapsed_time": "2:27:07", "remaining_time": "2:11:35", "throughput": 2315.24, "total_tokens": 20437488} {"current_steps": 35445, "total_steps": 67140, "loss": 0.7884, "lr": 2.692564756422743e-05, "epoch": 5.279267202859696, "percentage": 52.79, "elapsed_time": "2:27:08", "remaining_time": "2:11:34", "throughput": 2315.26, "total_tokens": 20440240} {"current_steps": 35450, "total_steps": 67140, "loss": 0.4742, "lr": 2.6919167963790636e-05, "epoch": 5.280011915400656, "percentage": 52.8, "elapsed_time": "2:27:09", "remaining_time": "2:11:33", "throughput": 2315.28, "total_tokens": 20443088} {"current_steps": 35455, "total_steps": 67140, "loss": 0.5671, "lr": 2.691268823366428e-05, "epoch": 5.2807566279416145, "percentage": 52.81, "elapsed_time": "2:27:10", "remaining_time": "2:11:31", "throughput": 2315.3, "total_tokens": 20445872} {"current_steps": 35460, "total_steps": 67140, "loss": 0.5492, "lr": 2.6906208374286223e-05, "epoch": 5.281501340482574, "percentage": 52.82, "elapsed_time": "2:27:11", "remaining_time": "2:11:30", "throughput": 2315.35, "total_tokens": 20449008} {"current_steps": 35465, "total_steps": 67140, "loss": 0.4917, "lr": 2.6899728386094364e-05, "epoch": 5.282246053023533, "percentage": 52.82, "elapsed_time": "2:27:13", "remaining_time": "2:11:29", "throughput": 2315.4, "total_tokens": 20452176} {"current_steps": 35470, "total_steps": 67140, "loss": 0.5435, "lr": 2.6893248269526578e-05, "epoch": 5.282990765564492, "percentage": 52.83, "elapsed_time": "2:27:14", "remaining_time": "2:11:27", "throughput": 2315.43, "total_tokens": 20455056} {"current_steps": 35475, "total_steps": 67140, "loss": 0.6449, "lr": 2.688676802502077e-05, "epoch": 5.283735478105451, "percentage": 52.84, "elapsed_time": "2:27:15", "remaining_time": "2:11:26", "throughput": 2315.46, "total_tokens": 20458000} {"current_steps": 35480, "total_steps": 67140, "loss": 0.5547, "lr": 2.688028765301486e-05, "epoch": 5.284480190646411, "percentage": 52.84, "elapsed_time": "2:27:16", "remaining_time": "2:11:25", "throughput": 2315.49, "total_tokens": 20460912} {"current_steps": 35485, "total_steps": 67140, "loss": 0.5298, "lr": 2.687380715394674e-05, "epoch": 5.28522490318737, "percentage": 52.85, "elapsed_time": "2:27:17", "remaining_time": "2:11:23", "throughput": 2315.5, "total_tokens": 20463536} {"current_steps": 35490, "total_steps": 67140, "loss": 0.7668, "lr": 2.686732652825436e-05, "epoch": 5.2859696157283285, "percentage": 52.86, "elapsed_time": "2:27:18", "remaining_time": "2:11:22", "throughput": 2315.54, "total_tokens": 20466512} {"current_steps": 35495, "total_steps": 67140, "loss": 0.6666, "lr": 2.6860845776375643e-05, "epoch": 5.286714328269288, "percentage": 52.87, "elapsed_time": "2:27:19", "remaining_time": "2:11:21", "throughput": 2315.58, "total_tokens": 20469488} {"current_steps": 35500, "total_steps": 67140, "loss": 0.564, "lr": 2.6854364898748537e-05, "epoch": 5.287459040810247, "percentage": 52.87, "elapsed_time": "2:27:21", "remaining_time": "2:11:19", "throughput": 2315.59, "total_tokens": 20472176} {"current_steps": 35505, "total_steps": 67140, "loss": 0.4588, "lr": 2.6847883895810984e-05, "epoch": 5.2882037533512065, "percentage": 52.88, "elapsed_time": "2:27:22", "remaining_time": "2:11:18", "throughput": 2315.63, "total_tokens": 20475184} {"current_steps": 35510, "total_steps": 67140, "loss": 0.6007, "lr": 2.6841402768000957e-05, "epoch": 5.288948465892165, "percentage": 52.89, "elapsed_time": "2:27:23", "remaining_time": "2:11:17", "throughput": 2315.68, "total_tokens": 20478320} {"current_steps": 35515, "total_steps": 67140, "loss": 0.5253, "lr": 2.6834921515756417e-05, "epoch": 5.289693178433125, "percentage": 52.9, "elapsed_time": "2:27:24", "remaining_time": "2:11:15", "throughput": 2315.69, "total_tokens": 20480976} {"current_steps": 35520, "total_steps": 67140, "loss": 0.7083, "lr": 2.6828440139515337e-05, "epoch": 5.290437890974084, "percentage": 52.9, "elapsed_time": "2:27:25", "remaining_time": "2:11:14", "throughput": 2315.71, "total_tokens": 20483856} {"current_steps": 35525, "total_steps": 67140, "loss": 0.4923, "lr": 2.6821958639715704e-05, "epoch": 5.291182603515043, "percentage": 52.91, "elapsed_time": "2:27:26", "remaining_time": "2:11:13", "throughput": 2315.76, "total_tokens": 20486992} {"current_steps": 35530, "total_steps": 67140, "loss": 0.4402, "lr": 2.6815477016795526e-05, "epoch": 5.291927316056002, "percentage": 52.92, "elapsed_time": "2:27:27", "remaining_time": "2:11:11", "throughput": 2315.78, "total_tokens": 20489712} {"current_steps": 35535, "total_steps": 67140, "loss": 0.6922, "lr": 2.6808995271192784e-05, "epoch": 5.292672028596962, "percentage": 52.93, "elapsed_time": "2:27:28", "remaining_time": "2:11:10", "throughput": 2315.79, "total_tokens": 20492432} {"current_steps": 35540, "total_steps": 67140, "loss": 0.8522, "lr": 2.680251340334549e-05, "epoch": 5.2934167411379205, "percentage": 52.93, "elapsed_time": "2:27:30", "remaining_time": "2:11:09", "throughput": 2315.84, "total_tokens": 20495504} {"current_steps": 35545, "total_steps": 67140, "loss": 0.425, "lr": 2.679603141369168e-05, "epoch": 5.29416145367888, "percentage": 52.94, "elapsed_time": "2:27:31", "remaining_time": "2:11:07", "throughput": 2315.87, "total_tokens": 20498512} {"current_steps": 35550, "total_steps": 67140, "loss": 0.5296, "lr": 2.678954930266937e-05, "epoch": 5.294906166219839, "percentage": 52.95, "elapsed_time": "2:27:32", "remaining_time": "2:11:06", "throughput": 2315.91, "total_tokens": 20501456} {"current_steps": 35555, "total_steps": 67140, "loss": 0.6665, "lr": 2.6783067070716583e-05, "epoch": 5.2956508787607985, "percentage": 52.96, "elapsed_time": "2:27:33", "remaining_time": "2:11:04", "throughput": 2315.93, "total_tokens": 20504240} {"current_steps": 35560, "total_steps": 67140, "loss": 0.6996, "lr": 2.6776584718271376e-05, "epoch": 5.296395591301757, "percentage": 52.96, "elapsed_time": "2:27:34", "remaining_time": "2:11:03", "throughput": 2315.95, "total_tokens": 20507024} {"current_steps": 35565, "total_steps": 67140, "loss": 0.5783, "lr": 2.67701022457718e-05, "epoch": 5.297140303842717, "percentage": 52.97, "elapsed_time": "2:27:35", "remaining_time": "2:11:02", "throughput": 2315.97, "total_tokens": 20509808} {"current_steps": 35570, "total_steps": 67140, "loss": 0.4745, "lr": 2.6763619653655913e-05, "epoch": 5.297885016383676, "percentage": 52.98, "elapsed_time": "2:27:36", "remaining_time": "2:11:00", "throughput": 2315.99, "total_tokens": 20512560} {"current_steps": 35575, "total_steps": 67140, "loss": 0.6117, "lr": 2.6757136942361776e-05, "epoch": 5.298629728924635, "percentage": 52.99, "elapsed_time": "2:27:38", "remaining_time": "2:10:59", "throughput": 2316.04, "total_tokens": 20515632} {"current_steps": 35580, "total_steps": 67140, "loss": 0.7245, "lr": 2.6750654112327474e-05, "epoch": 5.299374441465594, "percentage": 52.99, "elapsed_time": "2:27:39", "remaining_time": "2:10:58", "throughput": 2316.07, "total_tokens": 20518608} {"current_steps": 35585, "total_steps": 67140, "loss": 0.6296, "lr": 2.674417116399108e-05, "epoch": 5.300119154006554, "percentage": 53.0, "elapsed_time": "2:27:40", "remaining_time": "2:10:56", "throughput": 2316.1, "total_tokens": 20521488} {"current_steps": 35590, "total_steps": 67140, "loss": 0.7646, "lr": 2.6737688097790693e-05, "epoch": 5.3008638665475125, "percentage": 53.01, "elapsed_time": "2:27:41", "remaining_time": "2:10:55", "throughput": 2316.12, "total_tokens": 20524272} {"current_steps": 35595, "total_steps": 67140, "loss": 0.6659, "lr": 2.6731204914164405e-05, "epoch": 5.301608579088472, "percentage": 53.02, "elapsed_time": "2:27:42", "remaining_time": "2:10:54", "throughput": 2316.14, "total_tokens": 20527024} {"current_steps": 35600, "total_steps": 67140, "loss": 0.4847, "lr": 2.672472161355033e-05, "epoch": 5.302353291629431, "percentage": 53.02, "elapsed_time": "2:27:43", "remaining_time": "2:10:52", "throughput": 2316.16, "total_tokens": 20529808} {"current_steps": 35605, "total_steps": 67140, "loss": 0.6277, "lr": 2.6718238196386576e-05, "epoch": 5.303098004170391, "percentage": 53.03, "elapsed_time": "2:27:44", "remaining_time": "2:10:51", "throughput": 2316.2, "total_tokens": 20532848} {"current_steps": 35610, "total_steps": 67140, "loss": 0.6781, "lr": 2.6711754663111277e-05, "epoch": 5.303842716711349, "percentage": 53.04, "elapsed_time": "2:27:46", "remaining_time": "2:10:50", "throughput": 2316.22, "total_tokens": 20535696} {"current_steps": 35615, "total_steps": 67140, "loss": 1.0298, "lr": 2.6705271014162554e-05, "epoch": 5.304587429252309, "percentage": 53.05, "elapsed_time": "2:27:47", "remaining_time": "2:10:48", "throughput": 2316.23, "total_tokens": 20538288} {"current_steps": 35620, "total_steps": 67140, "loss": 0.7902, "lr": 2.6698787249978546e-05, "epoch": 5.305332141793268, "percentage": 53.05, "elapsed_time": "2:27:48", "remaining_time": "2:10:47", "throughput": 2316.28, "total_tokens": 20541456} {"current_steps": 35625, "total_steps": 67140, "loss": 0.4689, "lr": 2.6692303370997405e-05, "epoch": 5.306076854334227, "percentage": 53.06, "elapsed_time": "2:27:49", "remaining_time": "2:10:46", "throughput": 2316.32, "total_tokens": 20544432} {"current_steps": 35630, "total_steps": 67140, "loss": 0.7539, "lr": 2.668581937765729e-05, "epoch": 5.306821566875186, "percentage": 53.07, "elapsed_time": "2:27:50", "remaining_time": "2:10:44", "throughput": 2316.33, "total_tokens": 20547120} {"current_steps": 35635, "total_steps": 67140, "loss": 0.4879, "lr": 2.667933527039635e-05, "epoch": 5.307566279416146, "percentage": 53.08, "elapsed_time": "2:27:51", "remaining_time": "2:10:43", "throughput": 2316.37, "total_tokens": 20550160} {"current_steps": 35640, "total_steps": 67140, "loss": 0.685, "lr": 2.6672851049652752e-05, "epoch": 5.3083109919571045, "percentage": 53.08, "elapsed_time": "2:27:52", "remaining_time": "2:10:42", "throughput": 2316.38, "total_tokens": 20552848} {"current_steps": 35645, "total_steps": 67140, "loss": 0.6141, "lr": 2.6666366715864694e-05, "epoch": 5.309055704498064, "percentage": 53.09, "elapsed_time": "2:27:53", "remaining_time": "2:10:40", "throughput": 2316.41, "total_tokens": 20555728} {"current_steps": 35650, "total_steps": 67140, "loss": 0.7343, "lr": 2.665988226947034e-05, "epoch": 5.309800417039023, "percentage": 53.1, "elapsed_time": "2:27:55", "remaining_time": "2:10:39", "throughput": 2316.43, "total_tokens": 20558544} {"current_steps": 35655, "total_steps": 67140, "loss": 0.6504, "lr": 2.6653397710907895e-05, "epoch": 5.310545129579982, "percentage": 53.11, "elapsed_time": "2:27:56", "remaining_time": "2:10:38", "throughput": 2316.44, "total_tokens": 20561264} {"current_steps": 35660, "total_steps": 67140, "loss": 0.6117, "lr": 2.664691304061555e-05, "epoch": 5.311289842120941, "percentage": 53.11, "elapsed_time": "2:27:57", "remaining_time": "2:10:36", "throughput": 2316.46, "total_tokens": 20564080} {"current_steps": 35665, "total_steps": 67140, "loss": 0.7064, "lr": 2.6640428259031525e-05, "epoch": 5.3120345546619, "percentage": 53.12, "elapsed_time": "2:27:58", "remaining_time": "2:10:35", "throughput": 2316.5, "total_tokens": 20567056} {"current_steps": 35670, "total_steps": 67140, "loss": 0.4897, "lr": 2.6633943366594027e-05, "epoch": 5.31277926720286, "percentage": 53.13, "elapsed_time": "2:27:59", "remaining_time": "2:10:34", "throughput": 2316.54, "total_tokens": 20570064} {"current_steps": 35675, "total_steps": 67140, "loss": 0.5145, "lr": 2.6627458363741274e-05, "epoch": 5.3135239797438185, "percentage": 53.14, "elapsed_time": "2:28:00", "remaining_time": "2:10:32", "throughput": 2316.55, "total_tokens": 20572688} {"current_steps": 35680, "total_steps": 67140, "loss": 0.5611, "lr": 2.6620973250911506e-05, "epoch": 5.314268692284778, "percentage": 53.14, "elapsed_time": "2:28:01", "remaining_time": "2:10:31", "throughput": 2316.57, "total_tokens": 20575408} {"current_steps": 35685, "total_steps": 67140, "loss": 0.6228, "lr": 2.6614488028542948e-05, "epoch": 5.315013404825737, "percentage": 53.15, "elapsed_time": "2:28:02", "remaining_time": "2:10:30", "throughput": 2316.59, "total_tokens": 20578224} {"current_steps": 35690, "total_steps": 67140, "loss": 0.553, "lr": 2.6608002697073864e-05, "epoch": 5.315758117366697, "percentage": 53.16, "elapsed_time": "2:28:04", "remaining_time": "2:10:28", "throughput": 2316.61, "total_tokens": 20581008} {"current_steps": 35695, "total_steps": 67140, "loss": 0.7848, "lr": 2.6601517256942494e-05, "epoch": 5.316502829907655, "percentage": 53.17, "elapsed_time": "2:28:05", "remaining_time": "2:10:27", "throughput": 2316.64, "total_tokens": 20583952} {"current_steps": 35700, "total_steps": 67140, "loss": 0.6681, "lr": 2.6595031708587093e-05, "epoch": 5.317247542448615, "percentage": 53.17, "elapsed_time": "2:28:06", "remaining_time": "2:10:25", "throughput": 2316.65, "total_tokens": 20586608} {"current_steps": 35705, "total_steps": 67140, "loss": 0.5476, "lr": 2.6588546052445933e-05, "epoch": 5.317992254989574, "percentage": 53.18, "elapsed_time": "2:28:07", "remaining_time": "2:10:24", "throughput": 2316.67, "total_tokens": 20589232} {"current_steps": 35710, "total_steps": 67140, "loss": 0.536, "lr": 2.6582060288957295e-05, "epoch": 5.318736967530533, "percentage": 53.19, "elapsed_time": "2:28:08", "remaining_time": "2:10:23", "throughput": 2316.68, "total_tokens": 20591920} {"current_steps": 35715, "total_steps": 67140, "loss": 0.6292, "lr": 2.6575574418559456e-05, "epoch": 5.319481680071492, "percentage": 53.19, "elapsed_time": "2:28:09", "remaining_time": "2:10:21", "throughput": 2316.73, "total_tokens": 20595056} {"current_steps": 35720, "total_steps": 67140, "loss": 0.6471, "lr": 2.6569088441690697e-05, "epoch": 5.320226392612452, "percentage": 53.2, "elapsed_time": "2:28:10", "remaining_time": "2:10:20", "throughput": 2316.74, "total_tokens": 20597680} {"current_steps": 35725, "total_steps": 67140, "loss": 0.73, "lr": 2.6562602358789324e-05, "epoch": 5.3209711051534105, "percentage": 53.21, "elapsed_time": "2:28:12", "remaining_time": "2:10:19", "throughput": 2316.79, "total_tokens": 20600880} {"current_steps": 35730, "total_steps": 67140, "loss": 0.632, "lr": 2.6556116170293645e-05, "epoch": 5.32171581769437, "percentage": 53.22, "elapsed_time": "2:28:13", "remaining_time": "2:10:17", "throughput": 2316.79, "total_tokens": 20603440} {"current_steps": 35735, "total_steps": 67140, "loss": 0.6015, "lr": 2.6549629876641953e-05, "epoch": 5.322460530235329, "percentage": 53.22, "elapsed_time": "2:28:14", "remaining_time": "2:10:16", "throughput": 2316.84, "total_tokens": 20606544} {"current_steps": 35740, "total_steps": 67140, "loss": 0.7062, "lr": 2.654314347827257e-05, "epoch": 5.323205242776289, "percentage": 53.23, "elapsed_time": "2:28:15", "remaining_time": "2:10:15", "throughput": 2316.88, "total_tokens": 20609616} {"current_steps": 35745, "total_steps": 67140, "loss": 0.5284, "lr": 2.653665697562383e-05, "epoch": 5.323949955317247, "percentage": 53.24, "elapsed_time": "2:28:16", "remaining_time": "2:10:13", "throughput": 2316.92, "total_tokens": 20612688} {"current_steps": 35750, "total_steps": 67140, "loss": 0.7218, "lr": 2.6530170369134062e-05, "epoch": 5.324694667858207, "percentage": 53.25, "elapsed_time": "2:28:17", "remaining_time": "2:10:12", "throughput": 2316.96, "total_tokens": 20615824} {"current_steps": 35755, "total_steps": 67140, "loss": 0.5657, "lr": 2.6523683659241594e-05, "epoch": 5.325439380399166, "percentage": 53.25, "elapsed_time": "2:28:18", "remaining_time": "2:10:11", "throughput": 2316.99, "total_tokens": 20618704} {"current_steps": 35760, "total_steps": 67140, "loss": 0.5953, "lr": 2.651719684638479e-05, "epoch": 5.326184092940125, "percentage": 53.26, "elapsed_time": "2:28:20", "remaining_time": "2:10:09", "throughput": 2317.03, "total_tokens": 20621680} {"current_steps": 35765, "total_steps": 67140, "loss": 0.8215, "lr": 2.651070993100198e-05, "epoch": 5.326928805481084, "percentage": 53.27, "elapsed_time": "2:28:21", "remaining_time": "2:10:08", "throughput": 2317.08, "total_tokens": 20624880} {"current_steps": 35770, "total_steps": 67140, "loss": 0.763, "lr": 2.6504222913531545e-05, "epoch": 5.327673518022044, "percentage": 53.28, "elapsed_time": "2:28:22", "remaining_time": "2:10:07", "throughput": 2317.11, "total_tokens": 20627856} {"current_steps": 35775, "total_steps": 67140, "loss": 0.6122, "lr": 2.6497735794411833e-05, "epoch": 5.328418230563003, "percentage": 53.28, "elapsed_time": "2:28:23", "remaining_time": "2:10:06", "throughput": 2317.15, "total_tokens": 20630832} {"current_steps": 35780, "total_steps": 67140, "loss": 0.5277, "lr": 2.6491248574081228e-05, "epoch": 5.329162943103962, "percentage": 53.29, "elapsed_time": "2:28:24", "remaining_time": "2:10:04", "throughput": 2317.19, "total_tokens": 20633872} {"current_steps": 35785, "total_steps": 67140, "loss": 0.7245, "lr": 2.6484761252978107e-05, "epoch": 5.329907655644921, "percentage": 53.3, "elapsed_time": "2:28:25", "remaining_time": "2:10:03", "throughput": 2317.21, "total_tokens": 20636624} {"current_steps": 35790, "total_steps": 67140, "loss": 0.6465, "lr": 2.6478273831540863e-05, "epoch": 5.330652368185881, "percentage": 53.31, "elapsed_time": "2:28:26", "remaining_time": "2:10:01", "throughput": 2317.24, "total_tokens": 20639536} {"current_steps": 35795, "total_steps": 67140, "loss": 0.6303, "lr": 2.647178631020788e-05, "epoch": 5.331397080726839, "percentage": 53.31, "elapsed_time": "2:28:28", "remaining_time": "2:10:00", "throughput": 2317.26, "total_tokens": 20642352} {"current_steps": 35800, "total_steps": 67140, "loss": 0.6147, "lr": 2.6465298689417555e-05, "epoch": 5.332141793267799, "percentage": 53.32, "elapsed_time": "2:28:29", "remaining_time": "2:09:59", "throughput": 2317.28, "total_tokens": 20645072} {"current_steps": 35805, "total_steps": 67140, "loss": 0.586, "lr": 2.6458810969608304e-05, "epoch": 5.332886505808758, "percentage": 53.33, "elapsed_time": "2:28:30", "remaining_time": "2:09:57", "throughput": 2317.31, "total_tokens": 20647888} {"current_steps": 35810, "total_steps": 67140, "loss": 0.5172, "lr": 2.645232315121855e-05, "epoch": 5.333631218349717, "percentage": 53.34, "elapsed_time": "2:28:31", "remaining_time": "2:09:56", "throughput": 2317.31, "total_tokens": 20650448} {"current_steps": 35815, "total_steps": 67140, "loss": 0.5151, "lr": 2.6445835234686693e-05, "epoch": 5.334375930890676, "percentage": 53.34, "elapsed_time": "2:28:32", "remaining_time": "2:09:55", "throughput": 2317.34, "total_tokens": 20653296} {"current_steps": 35820, "total_steps": 67140, "loss": 0.6478, "lr": 2.643934722045117e-05, "epoch": 5.335120643431635, "percentage": 53.35, "elapsed_time": "2:28:33", "remaining_time": "2:09:53", "throughput": 2317.37, "total_tokens": 20656208} {"current_steps": 35825, "total_steps": 67140, "loss": 0.5088, "lr": 2.6432859108950413e-05, "epoch": 5.335865355972595, "percentage": 53.36, "elapsed_time": "2:28:34", "remaining_time": "2:09:52", "throughput": 2317.42, "total_tokens": 20659376} {"current_steps": 35830, "total_steps": 67140, "loss": 0.6117, "lr": 2.642637090062287e-05, "epoch": 5.336610068513554, "percentage": 53.37, "elapsed_time": "2:28:35", "remaining_time": "2:09:51", "throughput": 2317.46, "total_tokens": 20662384} {"current_steps": 35835, "total_steps": 67140, "loss": 0.5127, "lr": 2.6419882595906976e-05, "epoch": 5.337354781054513, "percentage": 53.37, "elapsed_time": "2:28:37", "remaining_time": "2:09:49", "throughput": 2317.49, "total_tokens": 20665168} {"current_steps": 35840, "total_steps": 67140, "loss": 0.5346, "lr": 2.6413394195241186e-05, "epoch": 5.338099493595472, "percentage": 53.38, "elapsed_time": "2:28:38", "remaining_time": "2:09:48", "throughput": 2317.5, "total_tokens": 20667888} {"current_steps": 35845, "total_steps": 67140, "loss": 0.663, "lr": 2.6406905699063965e-05, "epoch": 5.338844206136431, "percentage": 53.39, "elapsed_time": "2:28:39", "remaining_time": "2:09:47", "throughput": 2317.54, "total_tokens": 20670928} {"current_steps": 35850, "total_steps": 67140, "loss": 0.5808, "lr": 2.640041710781378e-05, "epoch": 5.33958891867739, "percentage": 53.4, "elapsed_time": "2:28:40", "remaining_time": "2:09:45", "throughput": 2317.58, "total_tokens": 20673840} {"current_steps": 35855, "total_steps": 67140, "loss": 0.4056, "lr": 2.6393928421929098e-05, "epoch": 5.34033363121835, "percentage": 53.4, "elapsed_time": "2:28:41", "remaining_time": "2:09:44", "throughput": 2317.61, "total_tokens": 20676816} {"current_steps": 35860, "total_steps": 67140, "loss": 0.7706, "lr": 2.6387439641848405e-05, "epoch": 5.341078343759309, "percentage": 53.41, "elapsed_time": "2:28:42", "remaining_time": "2:09:43", "throughput": 2317.65, "total_tokens": 20679792} {"current_steps": 35865, "total_steps": 67140, "loss": 0.6915, "lr": 2.638095076801017e-05, "epoch": 5.341823056300268, "percentage": 53.42, "elapsed_time": "2:28:43", "remaining_time": "2:09:41", "throughput": 2317.69, "total_tokens": 20682800} {"current_steps": 35870, "total_steps": 67140, "loss": 0.6131, "lr": 2.6374461800852907e-05, "epoch": 5.342567768841227, "percentage": 53.43, "elapsed_time": "2:28:45", "remaining_time": "2:09:40", "throughput": 2317.7, "total_tokens": 20685520} {"current_steps": 35875, "total_steps": 67140, "loss": 0.4765, "lr": 2.63679727408151e-05, "epoch": 5.343312481382187, "percentage": 53.43, "elapsed_time": "2:28:46", "remaining_time": "2:09:39", "throughput": 2317.74, "total_tokens": 20688432} {"current_steps": 35880, "total_steps": 67140, "loss": 0.3051, "lr": 2.6361483588335257e-05, "epoch": 5.344057193923145, "percentage": 53.44, "elapsed_time": "2:28:47", "remaining_time": "2:09:37", "throughput": 2317.77, "total_tokens": 20691408} {"current_steps": 35885, "total_steps": 67140, "loss": 0.5888, "lr": 2.6354994343851884e-05, "epoch": 5.344801906464105, "percentage": 53.45, "elapsed_time": "2:28:48", "remaining_time": "2:09:36", "throughput": 2317.81, "total_tokens": 20694448} {"current_steps": 35890, "total_steps": 67140, "loss": 0.4285, "lr": 2.6348505007803515e-05, "epoch": 5.345546619005064, "percentage": 53.46, "elapsed_time": "2:28:49", "remaining_time": "2:09:35", "throughput": 2317.82, "total_tokens": 20697104} {"current_steps": 35895, "total_steps": 67140, "loss": 0.7209, "lr": 2.6342015580628655e-05, "epoch": 5.346291331546023, "percentage": 53.46, "elapsed_time": "2:28:50", "remaining_time": "2:09:33", "throughput": 2317.84, "total_tokens": 20699856} {"current_steps": 35900, "total_steps": 67140, "loss": 0.5637, "lr": 2.633552606276583e-05, "epoch": 5.347036044086982, "percentage": 53.47, "elapsed_time": "2:28:51", "remaining_time": "2:09:32", "throughput": 2317.86, "total_tokens": 20702608} {"current_steps": 35905, "total_steps": 67140, "loss": 0.4475, "lr": 2.6329036454653588e-05, "epoch": 5.347780756627942, "percentage": 53.48, "elapsed_time": "2:28:52", "remaining_time": "2:09:31", "throughput": 2317.88, "total_tokens": 20705424} {"current_steps": 35910, "total_steps": 67140, "loss": 0.7438, "lr": 2.632254675673047e-05, "epoch": 5.348525469168901, "percentage": 53.49, "elapsed_time": "2:28:53", "remaining_time": "2:09:29", "throughput": 2317.9, "total_tokens": 20708112} {"current_steps": 35915, "total_steps": 67140, "loss": 0.6383, "lr": 2.6316056969435022e-05, "epoch": 5.34927018170986, "percentage": 53.49, "elapsed_time": "2:28:55", "remaining_time": "2:09:28", "throughput": 2317.95, "total_tokens": 20711312} {"current_steps": 35920, "total_steps": 67140, "loss": 0.4709, "lr": 2.6309567093205784e-05, "epoch": 5.350014894250819, "percentage": 53.5, "elapsed_time": "2:28:56", "remaining_time": "2:09:27", "throughput": 2317.98, "total_tokens": 20714288} {"current_steps": 35925, "total_steps": 67140, "loss": 0.8393, "lr": 2.6303077128481335e-05, "epoch": 5.350759606791779, "percentage": 53.51, "elapsed_time": "2:28:57", "remaining_time": "2:09:25", "throughput": 2318.02, "total_tokens": 20717296} {"current_steps": 35930, "total_steps": 67140, "loss": 0.5636, "lr": 2.629658707570023e-05, "epoch": 5.351504319332737, "percentage": 53.52, "elapsed_time": "2:28:58", "remaining_time": "2:09:24", "throughput": 2318.06, "total_tokens": 20720240} {"current_steps": 35935, "total_steps": 67140, "loss": 0.6192, "lr": 2.6290096935301034e-05, "epoch": 5.352249031873697, "percentage": 53.52, "elapsed_time": "2:28:59", "remaining_time": "2:09:23", "throughput": 2318.08, "total_tokens": 20723120} {"current_steps": 35940, "total_steps": 67140, "loss": 0.7813, "lr": 2.6283606707722336e-05, "epoch": 5.352993744414656, "percentage": 53.53, "elapsed_time": "2:29:00", "remaining_time": "2:09:21", "throughput": 2318.12, "total_tokens": 20726096} {"current_steps": 35945, "total_steps": 67140, "loss": 0.6954, "lr": 2.6277116393402718e-05, "epoch": 5.3537384569556155, "percentage": 53.54, "elapsed_time": "2:29:02", "remaining_time": "2:09:20", "throughput": 2318.14, "total_tokens": 20728976} {"current_steps": 35950, "total_steps": 67140, "loss": 0.672, "lr": 2.6270625992780772e-05, "epoch": 5.354483169496574, "percentage": 53.54, "elapsed_time": "2:29:03", "remaining_time": "2:09:19", "throughput": 2318.16, "total_tokens": 20731728} {"current_steps": 35955, "total_steps": 67140, "loss": 0.5678, "lr": 2.626413550629508e-05, "epoch": 5.355227882037534, "percentage": 53.55, "elapsed_time": "2:29:04", "remaining_time": "2:09:17", "throughput": 2318.19, "total_tokens": 20734736} {"current_steps": 35960, "total_steps": 67140, "loss": 0.5915, "lr": 2.625764493438425e-05, "epoch": 5.355972594578493, "percentage": 53.56, "elapsed_time": "2:29:05", "remaining_time": "2:09:16", "throughput": 2318.22, "total_tokens": 20737488} {"current_steps": 35965, "total_steps": 67140, "loss": 0.5786, "lr": 2.625115427748689e-05, "epoch": 5.356717307119452, "percentage": 53.57, "elapsed_time": "2:29:06", "remaining_time": "2:09:15", "throughput": 2318.27, "total_tokens": 20740688} {"current_steps": 35970, "total_steps": 67140, "loss": 0.6202, "lr": 2.6244663536041614e-05, "epoch": 5.357462019660411, "percentage": 53.57, "elapsed_time": "2:29:07", "remaining_time": "2:09:13", "throughput": 2318.29, "total_tokens": 20743440} {"current_steps": 35975, "total_steps": 67140, "loss": 0.5778, "lr": 2.623817271048703e-05, "epoch": 5.358206732201371, "percentage": 53.58, "elapsed_time": "2:29:08", "remaining_time": "2:09:12", "throughput": 2318.32, "total_tokens": 20746384} {"current_steps": 35980, "total_steps": 67140, "loss": 0.5956, "lr": 2.623168180126177e-05, "epoch": 5.358951444742329, "percentage": 53.59, "elapsed_time": "2:29:10", "remaining_time": "2:09:11", "throughput": 2318.33, "total_tokens": 20749072} {"current_steps": 35985, "total_steps": 67140, "loss": 0.536, "lr": 2.6225190808804463e-05, "epoch": 5.359696157283288, "percentage": 53.6, "elapsed_time": "2:29:11", "remaining_time": "2:09:09", "throughput": 2318.36, "total_tokens": 20751952} {"current_steps": 35990, "total_steps": 67140, "loss": 0.6467, "lr": 2.6218699733553742e-05, "epoch": 5.360440869824248, "percentage": 53.6, "elapsed_time": "2:29:12", "remaining_time": "2:09:08", "throughput": 2318.4, "total_tokens": 20755024} {"current_steps": 35995, "total_steps": 67140, "loss": 0.6679, "lr": 2.6212208575948257e-05, "epoch": 5.3611855823652075, "percentage": 53.61, "elapsed_time": "2:29:13", "remaining_time": "2:09:07", "throughput": 2318.43, "total_tokens": 20757840} {"current_steps": 36000, "total_steps": 67140, "loss": 0.5033, "lr": 2.6205717336426632e-05, "epoch": 5.361930294906166, "percentage": 53.62, "elapsed_time": "2:29:14", "remaining_time": "2:09:05", "throughput": 2318.47, "total_tokens": 20760944} {"current_steps": 36005, "total_steps": 67140, "loss": 0.6323, "lr": 2.6199226015427532e-05, "epoch": 5.362675007447125, "percentage": 53.63, "elapsed_time": "2:29:15", "remaining_time": "2:09:04", "throughput": 2318.49, "total_tokens": 20763728} {"current_steps": 36010, "total_steps": 67140, "loss": 0.457, "lr": 2.619273461338962e-05, "epoch": 5.363419719988085, "percentage": 53.63, "elapsed_time": "2:29:16", "remaining_time": "2:09:03", "throughput": 2318.53, "total_tokens": 20766736} {"current_steps": 36015, "total_steps": 67140, "loss": 0.6455, "lr": 2.6186243130751554e-05, "epoch": 5.364164432529043, "percentage": 53.64, "elapsed_time": "2:29:18", "remaining_time": "2:09:01", "throughput": 2318.56, "total_tokens": 20769680} {"current_steps": 36020, "total_steps": 67140, "loss": 0.7154, "lr": 2.6179751567951992e-05, "epoch": 5.364909145070003, "percentage": 53.65, "elapsed_time": "2:29:19", "remaining_time": "2:09:00", "throughput": 2318.59, "total_tokens": 20772592} {"current_steps": 36025, "total_steps": 67140, "loss": 0.6524, "lr": 2.617325992542962e-05, "epoch": 5.365653857610962, "percentage": 53.66, "elapsed_time": "2:29:20", "remaining_time": "2:08:59", "throughput": 2318.61, "total_tokens": 20775376} {"current_steps": 36030, "total_steps": 67140, "loss": 0.5616, "lr": 2.616676820362311e-05, "epoch": 5.3663985701519215, "percentage": 53.66, "elapsed_time": "2:29:21", "remaining_time": "2:08:57", "throughput": 2318.66, "total_tokens": 20778544} {"current_steps": 36035, "total_steps": 67140, "loss": 0.6234, "lr": 2.6160276402971153e-05, "epoch": 5.36714328269288, "percentage": 53.67, "elapsed_time": "2:29:22", "remaining_time": "2:08:56", "throughput": 2318.7, "total_tokens": 20781584} {"current_steps": 36040, "total_steps": 67140, "loss": 0.4587, "lr": 2.615378452391243e-05, "epoch": 5.36788799523384, "percentage": 53.68, "elapsed_time": "2:29:23", "remaining_time": "2:08:55", "throughput": 2318.72, "total_tokens": 20784400} {"current_steps": 36045, "total_steps": 67140, "loss": 0.7195, "lr": 2.614729256688564e-05, "epoch": 5.368632707774799, "percentage": 53.69, "elapsed_time": "2:29:24", "remaining_time": "2:08:53", "throughput": 2318.74, "total_tokens": 20787248} {"current_steps": 36050, "total_steps": 67140, "loss": 0.5969, "lr": 2.6140800532329486e-05, "epoch": 5.369377420315758, "percentage": 53.69, "elapsed_time": "2:29:25", "remaining_time": "2:08:52", "throughput": 2318.76, "total_tokens": 20789936} {"current_steps": 36055, "total_steps": 67140, "loss": 0.6218, "lr": 2.6134308420682667e-05, "epoch": 5.370122132856717, "percentage": 53.7, "elapsed_time": "2:29:27", "remaining_time": "2:08:51", "throughput": 2318.82, "total_tokens": 20793200} {"current_steps": 36060, "total_steps": 67140, "loss": 0.422, "lr": 2.61278162323839e-05, "epoch": 5.370866845397677, "percentage": 53.71, "elapsed_time": "2:29:28", "remaining_time": "2:08:49", "throughput": 2318.86, "total_tokens": 20796240} {"current_steps": 36065, "total_steps": 67140, "loss": 0.4968, "lr": 2.612132396787189e-05, "epoch": 5.371611557938635, "percentage": 53.72, "elapsed_time": "2:29:29", "remaining_time": "2:08:48", "throughput": 2318.87, "total_tokens": 20798960} {"current_steps": 36070, "total_steps": 67140, "loss": 0.5476, "lr": 2.6114831627585367e-05, "epoch": 5.372356270479595, "percentage": 53.72, "elapsed_time": "2:29:30", "remaining_time": "2:08:47", "throughput": 2318.9, "total_tokens": 20801872} {"current_steps": 36075, "total_steps": 67140, "loss": 0.6353, "lr": 2.610833921196306e-05, "epoch": 5.373100983020554, "percentage": 53.73, "elapsed_time": "2:29:31", "remaining_time": "2:08:45", "throughput": 2318.93, "total_tokens": 20804784} {"current_steps": 36080, "total_steps": 67140, "loss": 0.6413, "lr": 2.61018467214437e-05, "epoch": 5.3738456955615135, "percentage": 53.74, "elapsed_time": "2:29:32", "remaining_time": "2:08:44", "throughput": 2318.97, "total_tokens": 20807856} {"current_steps": 36085, "total_steps": 67140, "loss": 0.6173, "lr": 2.609535415646601e-05, "epoch": 5.374590408102472, "percentage": 53.75, "elapsed_time": "2:29:33", "remaining_time": "2:08:43", "throughput": 2318.99, "total_tokens": 20810544} {"current_steps": 36090, "total_steps": 67140, "loss": 0.6836, "lr": 2.6088861517468745e-05, "epoch": 5.375335120643432, "percentage": 53.75, "elapsed_time": "2:29:35", "remaining_time": "2:08:41", "throughput": 2319.01, "total_tokens": 20813360} {"current_steps": 36095, "total_steps": 67140, "loss": 0.8279, "lr": 2.6082368804890644e-05, "epoch": 5.376079833184391, "percentage": 53.76, "elapsed_time": "2:29:36", "remaining_time": "2:08:40", "throughput": 2319.04, "total_tokens": 20816272} {"current_steps": 36100, "total_steps": 67140, "loss": 0.5853, "lr": 2.6075876019170453e-05, "epoch": 5.37682454572535, "percentage": 53.77, "elapsed_time": "2:29:37", "remaining_time": "2:08:39", "throughput": 2319.06, "total_tokens": 20819088} {"current_steps": 36105, "total_steps": 67140, "loss": 0.7541, "lr": 2.606938316074694e-05, "epoch": 5.377569258266309, "percentage": 53.78, "elapsed_time": "2:29:38", "remaining_time": "2:08:37", "throughput": 2319.09, "total_tokens": 20822000} {"current_steps": 36110, "total_steps": 67140, "loss": 0.4206, "lr": 2.606289023005886e-05, "epoch": 5.378313970807269, "percentage": 53.78, "elapsed_time": "2:29:39", "remaining_time": "2:08:36", "throughput": 2319.11, "total_tokens": 20824784} {"current_steps": 36115, "total_steps": 67140, "loss": 0.6657, "lr": 2.6056397227544988e-05, "epoch": 5.3790586833482275, "percentage": 53.79, "elapsed_time": "2:29:40", "remaining_time": "2:08:35", "throughput": 2319.13, "total_tokens": 20827536} {"current_steps": 36120, "total_steps": 67140, "loss": 0.6661, "lr": 2.6049904153644072e-05, "epoch": 5.379803395889187, "percentage": 53.8, "elapsed_time": "2:29:41", "remaining_time": "2:08:33", "throughput": 2319.17, "total_tokens": 20830512} {"current_steps": 36125, "total_steps": 67140, "loss": 0.5997, "lr": 2.6043411008794915e-05, "epoch": 5.380548108430146, "percentage": 53.81, "elapsed_time": "2:29:42", "remaining_time": "2:08:32", "throughput": 2319.18, "total_tokens": 20833168} {"current_steps": 36130, "total_steps": 67140, "loss": 0.4776, "lr": 2.603691779343627e-05, "epoch": 5.3812928209711055, "percentage": 53.81, "elapsed_time": "2:29:44", "remaining_time": "2:08:30", "throughput": 2319.2, "total_tokens": 20835920} {"current_steps": 36135, "total_steps": 67140, "loss": 0.5471, "lr": 2.603042450800695e-05, "epoch": 5.382037533512064, "percentage": 53.82, "elapsed_time": "2:29:45", "remaining_time": "2:08:29", "throughput": 2319.23, "total_tokens": 20838896} {"current_steps": 36140, "total_steps": 67140, "loss": 0.6208, "lr": 2.6023931152945725e-05, "epoch": 5.382782246053024, "percentage": 53.83, "elapsed_time": "2:29:46", "remaining_time": "2:08:28", "throughput": 2319.25, "total_tokens": 20841712} {"current_steps": 36145, "total_steps": 67140, "loss": 0.6074, "lr": 2.6017437728691396e-05, "epoch": 5.383526958593983, "percentage": 53.84, "elapsed_time": "2:29:47", "remaining_time": "2:08:27", "throughput": 2319.3, "total_tokens": 20844848} {"current_steps": 36150, "total_steps": 67140, "loss": 0.6558, "lr": 2.601094423568276e-05, "epoch": 5.384271671134942, "percentage": 53.84, "elapsed_time": "2:29:48", "remaining_time": "2:08:25", "throughput": 2319.34, "total_tokens": 20847888} {"current_steps": 36155, "total_steps": 67140, "loss": 0.6957, "lr": 2.6004450674358628e-05, "epoch": 5.385016383675901, "percentage": 53.85, "elapsed_time": "2:29:49", "remaining_time": "2:08:24", "throughput": 2319.36, "total_tokens": 20850672} {"current_steps": 36160, "total_steps": 67140, "loss": 0.5466, "lr": 2.59979570451578e-05, "epoch": 5.385761096216861, "percentage": 53.86, "elapsed_time": "2:29:50", "remaining_time": "2:08:22", "throughput": 2319.37, "total_tokens": 20853392} {"current_steps": 36165, "total_steps": 67140, "loss": 0.6267, "lr": 2.599146334851909e-05, "epoch": 5.3865058087578195, "percentage": 53.87, "elapsed_time": "2:29:52", "remaining_time": "2:08:21", "throughput": 2319.39, "total_tokens": 20856176} {"current_steps": 36170, "total_steps": 67140, "loss": 0.5237, "lr": 2.598496958488132e-05, "epoch": 5.387250521298778, "percentage": 53.87, "elapsed_time": "2:29:53", "remaining_time": "2:08:20", "throughput": 2319.43, "total_tokens": 20859152} {"current_steps": 36175, "total_steps": 67140, "loss": 0.663, "lr": 2.5978475754683307e-05, "epoch": 5.387995233839738, "percentage": 53.88, "elapsed_time": "2:29:54", "remaining_time": "2:08:18", "throughput": 2319.46, "total_tokens": 20862096} {"current_steps": 36180, "total_steps": 67140, "loss": 0.5364, "lr": 2.5971981858363886e-05, "epoch": 5.388739946380697, "percentage": 53.89, "elapsed_time": "2:29:55", "remaining_time": "2:08:17", "throughput": 2319.5, "total_tokens": 20865200} {"current_steps": 36185, "total_steps": 67140, "loss": 0.5117, "lr": 2.5965487896361878e-05, "epoch": 5.389484658921656, "percentage": 53.89, "elapsed_time": "2:29:56", "remaining_time": "2:08:16", "throughput": 2319.52, "total_tokens": 20867920} {"current_steps": 36190, "total_steps": 67140, "loss": 0.787, "lr": 2.5958993869116134e-05, "epoch": 5.390229371462615, "percentage": 53.9, "elapsed_time": "2:29:57", "remaining_time": "2:08:14", "throughput": 2319.53, "total_tokens": 20870576} {"current_steps": 36195, "total_steps": 67140, "loss": 0.7208, "lr": 2.5952499777065474e-05, "epoch": 5.390974084003575, "percentage": 53.91, "elapsed_time": "2:29:58", "remaining_time": "2:08:13", "throughput": 2319.55, "total_tokens": 20873328} {"current_steps": 36200, "total_steps": 67140, "loss": 0.6784, "lr": 2.594600562064875e-05, "epoch": 5.3917187965445335, "percentage": 53.92, "elapsed_time": "2:30:00", "remaining_time": "2:08:12", "throughput": 2319.6, "total_tokens": 20876496} {"current_steps": 36205, "total_steps": 67140, "loss": 0.6035, "lr": 2.593951140030481e-05, "epoch": 5.392463509085493, "percentage": 53.92, "elapsed_time": "2:30:01", "remaining_time": "2:08:11", "throughput": 2319.64, "total_tokens": 20879600} {"current_steps": 36210, "total_steps": 67140, "loss": 0.6025, "lr": 2.593301711647252e-05, "epoch": 5.393208221626452, "percentage": 53.93, "elapsed_time": "2:30:02", "remaining_time": "2:08:09", "throughput": 2319.66, "total_tokens": 20882448} {"current_steps": 36215, "total_steps": 67140, "loss": 0.6012, "lr": 2.592652276959072e-05, "epoch": 5.3939529341674115, "percentage": 53.94, "elapsed_time": "2:30:03", "remaining_time": "2:08:08", "throughput": 2319.7, "total_tokens": 20885424} {"current_steps": 36220, "total_steps": 67140, "loss": 0.5514, "lr": 2.592002836009828e-05, "epoch": 5.39469764670837, "percentage": 53.95, "elapsed_time": "2:30:04", "remaining_time": "2:08:06", "throughput": 2319.71, "total_tokens": 20888080} {"current_steps": 36225, "total_steps": 67140, "loss": 0.402, "lr": 2.5913533888434067e-05, "epoch": 5.39544235924933, "percentage": 53.95, "elapsed_time": "2:30:05", "remaining_time": "2:08:05", "throughput": 2319.74, "total_tokens": 20891024} {"current_steps": 36230, "total_steps": 67140, "loss": 0.67, "lr": 2.5907039355036944e-05, "epoch": 5.396187071790289, "percentage": 53.96, "elapsed_time": "2:30:06", "remaining_time": "2:08:04", "throughput": 2319.78, "total_tokens": 20894064} {"current_steps": 36235, "total_steps": 67140, "loss": 0.4952, "lr": 2.590054476034579e-05, "epoch": 5.396931784331248, "percentage": 53.97, "elapsed_time": "2:30:08", "remaining_time": "2:08:03", "throughput": 2319.81, "total_tokens": 20896976} {"current_steps": 36240, "total_steps": 67140, "loss": 0.5975, "lr": 2.5894050104799477e-05, "epoch": 5.397676496872207, "percentage": 53.98, "elapsed_time": "2:30:09", "remaining_time": "2:08:01", "throughput": 2319.85, "total_tokens": 20899984} {"current_steps": 36245, "total_steps": 67140, "loss": 0.6546, "lr": 2.5887555388836905e-05, "epoch": 5.398421209413167, "percentage": 53.98, "elapsed_time": "2:30:10", "remaining_time": "2:08:00", "throughput": 2319.88, "total_tokens": 20902992} {"current_steps": 36250, "total_steps": 67140, "loss": 0.8199, "lr": 2.5881060612896936e-05, "epoch": 5.3991659219541255, "percentage": 53.99, "elapsed_time": "2:30:11", "remaining_time": "2:07:59", "throughput": 2319.89, "total_tokens": 20905552} {"current_steps": 36255, "total_steps": 67140, "loss": 0.6154, "lr": 2.587456577741848e-05, "epoch": 5.399910634495085, "percentage": 54.0, "elapsed_time": "2:30:12", "remaining_time": "2:07:57", "throughput": 2319.92, "total_tokens": 20908528} {"current_steps": 36260, "total_steps": 67140, "loss": 0.5338, "lr": 2.5868070882840423e-05, "epoch": 5.400655347036044, "percentage": 54.01, "elapsed_time": "2:30:13", "remaining_time": "2:07:56", "throughput": 2319.95, "total_tokens": 20911376} {"current_steps": 36265, "total_steps": 67140, "loss": 0.6352, "lr": 2.5861575929601663e-05, "epoch": 5.4014000595770035, "percentage": 54.01, "elapsed_time": "2:30:14", "remaining_time": "2:07:54", "throughput": 2319.98, "total_tokens": 20914256} {"current_steps": 36270, "total_steps": 67140, "loss": 0.6972, "lr": 2.5855080918141107e-05, "epoch": 5.402144772117962, "percentage": 54.02, "elapsed_time": "2:30:15", "remaining_time": "2:07:53", "throughput": 2319.99, "total_tokens": 20916944} {"current_steps": 36275, "total_steps": 67140, "loss": 0.4735, "lr": 2.5848585848897654e-05, "epoch": 5.402889484658922, "percentage": 54.03, "elapsed_time": "2:30:17", "remaining_time": "2:07:52", "throughput": 2320.0, "total_tokens": 20919536} {"current_steps": 36280, "total_steps": 67140, "loss": 0.6043, "lr": 2.584209072231023e-05, "epoch": 5.403634197199881, "percentage": 54.04, "elapsed_time": "2:30:18", "remaining_time": "2:07:50", "throughput": 2320.02, "total_tokens": 20922288} {"current_steps": 36285, "total_steps": 67140, "loss": 0.5708, "lr": 2.583559553881773e-05, "epoch": 5.40437890974084, "percentage": 54.04, "elapsed_time": "2:30:19", "remaining_time": "2:07:49", "throughput": 2320.04, "total_tokens": 20925104} {"current_steps": 36290, "total_steps": 67140, "loss": 0.6128, "lr": 2.582910029885909e-05, "epoch": 5.405123622281799, "percentage": 54.05, "elapsed_time": "2:30:20", "remaining_time": "2:07:48", "throughput": 2320.06, "total_tokens": 20927856} {"current_steps": 36295, "total_steps": 67140, "loss": 0.609, "lr": 2.5822605002873213e-05, "epoch": 5.405868334822759, "percentage": 54.06, "elapsed_time": "2:30:21", "remaining_time": "2:07:46", "throughput": 2320.09, "total_tokens": 20930864} {"current_steps": 36300, "total_steps": 67140, "loss": 0.6711, "lr": 2.5816109651299035e-05, "epoch": 5.4066130473637175, "percentage": 54.07, "elapsed_time": "2:30:22", "remaining_time": "2:07:45", "throughput": 2320.16, "total_tokens": 20934288} {"current_steps": 36305, "total_steps": 67140, "loss": 0.6505, "lr": 2.5809614244575488e-05, "epoch": 5.407357759904677, "percentage": 54.07, "elapsed_time": "2:30:23", "remaining_time": "2:07:44", "throughput": 2320.17, "total_tokens": 20937040} {"current_steps": 36310, "total_steps": 67140, "loss": 0.6543, "lr": 2.58031187831415e-05, "epoch": 5.408102472445636, "percentage": 54.08, "elapsed_time": "2:30:25", "remaining_time": "2:07:42", "throughput": 2320.2, "total_tokens": 20939920} {"current_steps": 36315, "total_steps": 67140, "loss": 0.7486, "lr": 2.5796623267436016e-05, "epoch": 5.408847184986596, "percentage": 54.09, "elapsed_time": "2:30:26", "remaining_time": "2:07:41", "throughput": 2320.24, "total_tokens": 20942992} {"current_steps": 36320, "total_steps": 67140, "loss": 0.6513, "lr": 2.579012769789796e-05, "epoch": 5.409591897527554, "percentage": 54.1, "elapsed_time": "2:30:27", "remaining_time": "2:07:40", "throughput": 2320.26, "total_tokens": 20945712} {"current_steps": 36325, "total_steps": 67140, "loss": 0.4757, "lr": 2.5783632074966298e-05, "epoch": 5.410336610068514, "percentage": 54.1, "elapsed_time": "2:30:28", "remaining_time": "2:07:38", "throughput": 2320.26, "total_tokens": 20948208} {"current_steps": 36330, "total_steps": 67140, "loss": 0.6654, "lr": 2.5777136399079955e-05, "epoch": 5.411081322609473, "percentage": 54.11, "elapsed_time": "2:30:29", "remaining_time": "2:07:37", "throughput": 2320.3, "total_tokens": 20951280} {"current_steps": 36335, "total_steps": 67140, "loss": 0.7413, "lr": 2.5770640670677902e-05, "epoch": 5.4118260351504315, "percentage": 54.12, "elapsed_time": "2:30:30", "remaining_time": "2:07:36", "throughput": 2320.32, "total_tokens": 20954000} {"current_steps": 36340, "total_steps": 67140, "loss": 0.5159, "lr": 2.5764144890199078e-05, "epoch": 5.412570747691391, "percentage": 54.13, "elapsed_time": "2:30:31", "remaining_time": "2:07:34", "throughput": 2320.35, "total_tokens": 20956976} {"current_steps": 36345, "total_steps": 67140, "loss": 0.6621, "lr": 2.5757649058082455e-05, "epoch": 5.413315460232351, "percentage": 54.13, "elapsed_time": "2:30:32", "remaining_time": "2:07:33", "throughput": 2320.39, "total_tokens": 20960016} {"current_steps": 36350, "total_steps": 67140, "loss": 0.5287, "lr": 2.5751153174766983e-05, "epoch": 5.4140601727733095, "percentage": 54.14, "elapsed_time": "2:30:34", "remaining_time": "2:07:32", "throughput": 2320.4, "total_tokens": 20962672} {"current_steps": 36355, "total_steps": 67140, "loss": 0.4842, "lr": 2.5744657240691646e-05, "epoch": 5.414804885314268, "percentage": 54.15, "elapsed_time": "2:30:35", "remaining_time": "2:07:30", "throughput": 2320.43, "total_tokens": 20965584} {"current_steps": 36360, "total_steps": 67140, "loss": 0.648, "lr": 2.5738161256295396e-05, "epoch": 5.415549597855228, "percentage": 54.16, "elapsed_time": "2:30:36", "remaining_time": "2:07:29", "throughput": 2320.47, "total_tokens": 20968656} {"current_steps": 36365, "total_steps": 67140, "loss": 0.6192, "lr": 2.5731665222017202e-05, "epoch": 5.416294310396187, "percentage": 54.16, "elapsed_time": "2:30:37", "remaining_time": "2:07:28", "throughput": 2320.51, "total_tokens": 20971760} {"current_steps": 36370, "total_steps": 67140, "loss": 0.6808, "lr": 2.5725169138296046e-05, "epoch": 5.417039022937146, "percentage": 54.17, "elapsed_time": "2:30:38", "remaining_time": "2:07:27", "throughput": 2320.56, "total_tokens": 20974864} {"current_steps": 36375, "total_steps": 67140, "loss": 0.5392, "lr": 2.571867300557092e-05, "epoch": 5.417783735478105, "percentage": 54.18, "elapsed_time": "2:30:39", "remaining_time": "2:07:25", "throughput": 2320.56, "total_tokens": 20977456} {"current_steps": 36380, "total_steps": 67140, "loss": 0.6127, "lr": 2.5712176824280787e-05, "epoch": 5.418528448019065, "percentage": 54.19, "elapsed_time": "2:30:40", "remaining_time": "2:07:24", "throughput": 2320.58, "total_tokens": 20980208} {"current_steps": 36385, "total_steps": 67140, "loss": 0.6201, "lr": 2.5705680594864634e-05, "epoch": 5.4192731605600235, "percentage": 54.19, "elapsed_time": "2:30:42", "remaining_time": "2:07:22", "throughput": 2320.61, "total_tokens": 20983152} {"current_steps": 36390, "total_steps": 67140, "loss": 0.8036, "lr": 2.5699184317761465e-05, "epoch": 5.420017873100983, "percentage": 54.2, "elapsed_time": "2:30:43", "remaining_time": "2:07:21", "throughput": 2320.65, "total_tokens": 20986128} {"current_steps": 36395, "total_steps": 67140, "loss": 0.7022, "lr": 2.5692687993410263e-05, "epoch": 5.420762585641942, "percentage": 54.21, "elapsed_time": "2:30:44", "remaining_time": "2:07:20", "throughput": 2320.67, "total_tokens": 20989040} {"current_steps": 36400, "total_steps": 67140, "loss": 0.5829, "lr": 2.5686191622250017e-05, "epoch": 5.421507298182902, "percentage": 54.22, "elapsed_time": "2:30:45", "remaining_time": "2:07:18", "throughput": 2320.69, "total_tokens": 20991792} {"current_steps": 36405, "total_steps": 67140, "loss": 0.6845, "lr": 2.567969520471973e-05, "epoch": 5.42225201072386, "percentage": 54.22, "elapsed_time": "2:30:46", "remaining_time": "2:07:17", "throughput": 2320.71, "total_tokens": 20994576} {"current_steps": 36410, "total_steps": 67140, "loss": 0.6344, "lr": 2.5673198741258408e-05, "epoch": 5.42299672326482, "percentage": 54.23, "elapsed_time": "2:30:47", "remaining_time": "2:07:16", "throughput": 2320.71, "total_tokens": 20996976} {"current_steps": 36415, "total_steps": 67140, "loss": 0.4553, "lr": 2.5666702232305055e-05, "epoch": 5.423741435805779, "percentage": 54.24, "elapsed_time": "2:30:48", "remaining_time": "2:07:14", "throughput": 2320.73, "total_tokens": 20999760} {"current_steps": 36420, "total_steps": 67140, "loss": 0.4995, "lr": 2.5660205678298664e-05, "epoch": 5.424486148346738, "percentage": 54.24, "elapsed_time": "2:30:49", "remaining_time": "2:07:13", "throughput": 2320.76, "total_tokens": 21002704} {"current_steps": 36425, "total_steps": 67140, "loss": 0.6528, "lr": 2.5653709079678274e-05, "epoch": 5.425230860887697, "percentage": 54.25, "elapsed_time": "2:30:51", "remaining_time": "2:07:12", "throughput": 2320.78, "total_tokens": 21005456} {"current_steps": 36430, "total_steps": 67140, "loss": 0.6517, "lr": 2.5647212436882867e-05, "epoch": 5.425975573428657, "percentage": 54.26, "elapsed_time": "2:30:52", "remaining_time": "2:07:10", "throughput": 2320.79, "total_tokens": 21008144} {"current_steps": 36435, "total_steps": 67140, "loss": 0.7405, "lr": 2.5640715750351486e-05, "epoch": 5.4267202859696155, "percentage": 54.27, "elapsed_time": "2:30:53", "remaining_time": "2:07:09", "throughput": 2320.81, "total_tokens": 21010864} {"current_steps": 36440, "total_steps": 67140, "loss": 0.5853, "lr": 2.5634219020523132e-05, "epoch": 5.427464998510575, "percentage": 54.27, "elapsed_time": "2:30:54", "remaining_time": "2:07:08", "throughput": 2320.85, "total_tokens": 21013936} {"current_steps": 36445, "total_steps": 67140, "loss": 0.5993, "lr": 2.5627722247836838e-05, "epoch": 5.428209711051534, "percentage": 54.28, "elapsed_time": "2:30:55", "remaining_time": "2:07:06", "throughput": 2320.85, "total_tokens": 21016496} {"current_steps": 36450, "total_steps": 67140, "loss": 0.6035, "lr": 2.5621225432731626e-05, "epoch": 5.428954423592494, "percentage": 54.29, "elapsed_time": "2:30:56", "remaining_time": "2:07:05", "throughput": 2320.88, "total_tokens": 21019376} {"current_steps": 36455, "total_steps": 67140, "loss": 0.5776, "lr": 2.561472857564653e-05, "epoch": 5.429699136133452, "percentage": 54.3, "elapsed_time": "2:30:57", "remaining_time": "2:07:04", "throughput": 2320.9, "total_tokens": 21022224} {"current_steps": 36460, "total_steps": 67140, "loss": 0.5165, "lr": 2.560823167702057e-05, "epoch": 5.430443848674412, "percentage": 54.3, "elapsed_time": "2:30:58", "remaining_time": "2:07:02", "throughput": 2320.93, "total_tokens": 21025072} {"current_steps": 36465, "total_steps": 67140, "loss": 0.6602, "lr": 2.5601734737292787e-05, "epoch": 5.431188561215371, "percentage": 54.31, "elapsed_time": "2:31:00", "remaining_time": "2:07:01", "throughput": 2320.96, "total_tokens": 21027920} {"current_steps": 36470, "total_steps": 67140, "loss": 0.6513, "lr": 2.5595237756902217e-05, "epoch": 5.43193327375633, "percentage": 54.32, "elapsed_time": "2:31:01", "remaining_time": "2:07:00", "throughput": 2320.98, "total_tokens": 21030832} {"current_steps": 36475, "total_steps": 67140, "loss": 0.6775, "lr": 2.558874073628791e-05, "epoch": 5.432677986297289, "percentage": 54.33, "elapsed_time": "2:31:02", "remaining_time": "2:06:58", "throughput": 2321.0, "total_tokens": 21033552} {"current_steps": 36480, "total_steps": 67140, "loss": 0.5596, "lr": 2.5582243675888885e-05, "epoch": 5.433422698838249, "percentage": 54.33, "elapsed_time": "2:31:03", "remaining_time": "2:06:57", "throughput": 2321.01, "total_tokens": 21036240} {"current_steps": 36485, "total_steps": 67140, "loss": 0.6354, "lr": 2.55757465761442e-05, "epoch": 5.434167411379208, "percentage": 54.34, "elapsed_time": "2:31:04", "remaining_time": "2:06:56", "throughput": 2321.04, "total_tokens": 21039248} {"current_steps": 36490, "total_steps": 67140, "loss": 0.5294, "lr": 2.5569249437492903e-05, "epoch": 5.434912123920167, "percentage": 54.35, "elapsed_time": "2:31:05", "remaining_time": "2:06:54", "throughput": 2321.12, "total_tokens": 21042864} {"current_steps": 36495, "total_steps": 67140, "loss": 0.6926, "lr": 2.5562752260374053e-05, "epoch": 5.435656836461126, "percentage": 54.36, "elapsed_time": "2:31:06", "remaining_time": "2:06:53", "throughput": 2321.15, "total_tokens": 21045744} {"current_steps": 36500, "total_steps": 67140, "loss": 0.7802, "lr": 2.555625504522668e-05, "epoch": 5.436401549002086, "percentage": 54.36, "elapsed_time": "2:31:08", "remaining_time": "2:06:52", "throughput": 2321.17, "total_tokens": 21048560} {"current_steps": 36505, "total_steps": 67140, "loss": 0.7, "lr": 2.5549757792489853e-05, "epoch": 5.437146261543044, "percentage": 54.37, "elapsed_time": "2:31:09", "remaining_time": "2:06:50", "throughput": 2321.19, "total_tokens": 21051344} {"current_steps": 36510, "total_steps": 67140, "loss": 0.7623, "lr": 2.554326050260264e-05, "epoch": 5.437890974084004, "percentage": 54.38, "elapsed_time": "2:31:10", "remaining_time": "2:06:49", "throughput": 2321.21, "total_tokens": 21054096} {"current_steps": 36515, "total_steps": 67140, "loss": 0.6874, "lr": 2.5536763176004086e-05, "epoch": 5.438635686624963, "percentage": 54.39, "elapsed_time": "2:31:11", "remaining_time": "2:06:48", "throughput": 2321.24, "total_tokens": 21056912} {"current_steps": 36520, "total_steps": 67140, "loss": 0.5739, "lr": 2.553026581313326e-05, "epoch": 5.4393803991659215, "percentage": 54.39, "elapsed_time": "2:31:12", "remaining_time": "2:06:46", "throughput": 2321.25, "total_tokens": 21059664} {"current_steps": 36525, "total_steps": 67140, "loss": 0.7617, "lr": 2.5523768414429227e-05, "epoch": 5.440125111706881, "percentage": 54.4, "elapsed_time": "2:31:13", "remaining_time": "2:06:45", "throughput": 2321.29, "total_tokens": 21062672} {"current_steps": 36530, "total_steps": 67140, "loss": 0.6196, "lr": 2.551727098033105e-05, "epoch": 5.44086982424784, "percentage": 54.41, "elapsed_time": "2:31:14", "remaining_time": "2:06:44", "throughput": 2321.31, "total_tokens": 21065488} {"current_steps": 36535, "total_steps": 67140, "loss": 0.6338, "lr": 2.5510773511277804e-05, "epoch": 5.4416145367888, "percentage": 54.42, "elapsed_time": "2:31:15", "remaining_time": "2:06:42", "throughput": 2321.34, "total_tokens": 21068432} {"current_steps": 36540, "total_steps": 67140, "loss": 0.5845, "lr": 2.5504276007708566e-05, "epoch": 5.442359249329758, "percentage": 54.42, "elapsed_time": "2:31:17", "remaining_time": "2:06:41", "throughput": 2321.37, "total_tokens": 21071216} {"current_steps": 36545, "total_steps": 67140, "loss": 0.5876, "lr": 2.54977784700624e-05, "epoch": 5.443103961870718, "percentage": 54.43, "elapsed_time": "2:31:18", "remaining_time": "2:06:40", "throughput": 2321.38, "total_tokens": 21073840} {"current_steps": 36550, "total_steps": 67140, "loss": 0.4703, "lr": 2.5491280898778386e-05, "epoch": 5.443848674411677, "percentage": 54.44, "elapsed_time": "2:31:19", "remaining_time": "2:06:38", "throughput": 2321.41, "total_tokens": 21076880} {"current_steps": 36555, "total_steps": 67140, "loss": 0.5702, "lr": 2.548478329429561e-05, "epoch": 5.444593386952636, "percentage": 54.45, "elapsed_time": "2:31:20", "remaining_time": "2:06:37", "throughput": 2321.45, "total_tokens": 21079920} {"current_steps": 36560, "total_steps": 67140, "loss": 0.6923, "lr": 2.547828565705316e-05, "epoch": 5.445338099493595, "percentage": 54.45, "elapsed_time": "2:31:21", "remaining_time": "2:06:36", "throughput": 2321.47, "total_tokens": 21082672} {"current_steps": 36565, "total_steps": 67140, "loss": 0.6783, "lr": 2.5471787987490092e-05, "epoch": 5.446082812034555, "percentage": 54.46, "elapsed_time": "2:31:22", "remaining_time": "2:06:34", "throughput": 2321.48, "total_tokens": 21085360} {"current_steps": 36570, "total_steps": 67140, "loss": 0.519, "lr": 2.5465290286045518e-05, "epoch": 5.446827524575514, "percentage": 54.47, "elapsed_time": "2:31:23", "remaining_time": "2:06:33", "throughput": 2321.51, "total_tokens": 21088272} {"current_steps": 36575, "total_steps": 67140, "loss": 0.5252, "lr": 2.5458792553158518e-05, "epoch": 5.447572237116473, "percentage": 54.48, "elapsed_time": "2:31:24", "remaining_time": "2:06:32", "throughput": 2321.53, "total_tokens": 21091088} {"current_steps": 36580, "total_steps": 67140, "loss": 0.5848, "lr": 2.5452294789268187e-05, "epoch": 5.448316949657432, "percentage": 54.48, "elapsed_time": "2:31:26", "remaining_time": "2:06:30", "throughput": 2321.58, "total_tokens": 21094160} {"current_steps": 36585, "total_steps": 67140, "loss": 0.7184, "lr": 2.544579699481361e-05, "epoch": 5.449061662198392, "percentage": 54.49, "elapsed_time": "2:31:27", "remaining_time": "2:06:29", "throughput": 2321.6, "total_tokens": 21097072} {"current_steps": 36590, "total_steps": 67140, "loss": 0.7713, "lr": 2.5439299170233883e-05, "epoch": 5.44980637473935, "percentage": 54.5, "elapsed_time": "2:31:28", "remaining_time": "2:06:28", "throughput": 2321.64, "total_tokens": 21100112} {"current_steps": 36595, "total_steps": 67140, "loss": 0.4275, "lr": 2.54328013159681e-05, "epoch": 5.45055108728031, "percentage": 54.51, "elapsed_time": "2:31:29", "remaining_time": "2:06:26", "throughput": 2321.67, "total_tokens": 21103088} {"current_steps": 36600, "total_steps": 67140, "loss": 0.8787, "lr": 2.5426303432455374e-05, "epoch": 5.451295799821269, "percentage": 54.51, "elapsed_time": "2:31:30", "remaining_time": "2:06:25", "throughput": 2321.71, "total_tokens": 21106064} {"current_steps": 36605, "total_steps": 67140, "loss": 0.6675, "lr": 2.5419805520134788e-05, "epoch": 5.452040512362228, "percentage": 54.52, "elapsed_time": "2:31:31", "remaining_time": "2:06:24", "throughput": 2321.73, "total_tokens": 21108880} {"current_steps": 36610, "total_steps": 67140, "loss": 0.6283, "lr": 2.5413307579445456e-05, "epoch": 5.452785224903187, "percentage": 54.53, "elapsed_time": "2:31:33", "remaining_time": "2:06:22", "throughput": 2321.75, "total_tokens": 21111760} {"current_steps": 36615, "total_steps": 67140, "loss": 0.5654, "lr": 2.540680961082647e-05, "epoch": 5.453529937444147, "percentage": 54.54, "elapsed_time": "2:31:34", "remaining_time": "2:06:21", "throughput": 2321.75, "total_tokens": 21114352} {"current_steps": 36620, "total_steps": 67140, "loss": 0.7693, "lr": 2.5400311614716955e-05, "epoch": 5.454274649985106, "percentage": 54.54, "elapsed_time": "2:31:35", "remaining_time": "2:06:20", "throughput": 2321.76, "total_tokens": 21116976} {"current_steps": 36625, "total_steps": 67140, "loss": 0.6387, "lr": 2.5393813591556002e-05, "epoch": 5.455019362526065, "percentage": 54.55, "elapsed_time": "2:31:36", "remaining_time": "2:06:18", "throughput": 2321.8, "total_tokens": 21120080} {"current_steps": 36630, "total_steps": 67140, "loss": 0.7543, "lr": 2.538731554178273e-05, "epoch": 5.455764075067024, "percentage": 54.56, "elapsed_time": "2:31:37", "remaining_time": "2:06:17", "throughput": 2321.83, "total_tokens": 21122960} {"current_steps": 36635, "total_steps": 67140, "loss": 0.6782, "lr": 2.5380817465836245e-05, "epoch": 5.456508787607984, "percentage": 54.57, "elapsed_time": "2:31:38", "remaining_time": "2:06:16", "throughput": 2321.88, "total_tokens": 21126192} {"current_steps": 36640, "total_steps": 67140, "loss": 0.6183, "lr": 2.5374319364155673e-05, "epoch": 5.457253500148942, "percentage": 54.57, "elapsed_time": "2:31:39", "remaining_time": "2:06:14", "throughput": 2321.91, "total_tokens": 21129136} {"current_steps": 36645, "total_steps": 67140, "loss": 0.739, "lr": 2.536782123718011e-05, "epoch": 5.457998212689902, "percentage": 54.58, "elapsed_time": "2:31:41", "remaining_time": "2:06:13", "throughput": 2321.92, "total_tokens": 21131824} {"current_steps": 36650, "total_steps": 67140, "loss": 0.7395, "lr": 2.5361323085348687e-05, "epoch": 5.458742925230861, "percentage": 54.59, "elapsed_time": "2:31:42", "remaining_time": "2:06:12", "throughput": 2321.95, "total_tokens": 21134704} {"current_steps": 36655, "total_steps": 67140, "loss": 0.7025, "lr": 2.5354824909100522e-05, "epoch": 5.4594876377718204, "percentage": 54.59, "elapsed_time": "2:31:43", "remaining_time": "2:06:10", "throughput": 2321.98, "total_tokens": 21137552} {"current_steps": 36660, "total_steps": 67140, "loss": 0.5793, "lr": 2.5348326708874732e-05, "epoch": 5.460232350312779, "percentage": 54.6, "elapsed_time": "2:31:44", "remaining_time": "2:06:09", "throughput": 2322.0, "total_tokens": 21140304} {"current_steps": 36665, "total_steps": 67140, "loss": 0.8049, "lr": 2.5341828485110435e-05, "epoch": 5.460977062853739, "percentage": 54.61, "elapsed_time": "2:31:45", "remaining_time": "2:06:08", "throughput": 2322.04, "total_tokens": 21143504} {"current_steps": 36670, "total_steps": 67140, "loss": 0.5252, "lr": 2.5335330238246756e-05, "epoch": 5.461721775394698, "percentage": 54.62, "elapsed_time": "2:31:46", "remaining_time": "2:06:06", "throughput": 2322.08, "total_tokens": 21146512} {"current_steps": 36675, "total_steps": 67140, "loss": 0.9003, "lr": 2.532883196872283e-05, "epoch": 5.462466487935657, "percentage": 54.62, "elapsed_time": "2:31:47", "remaining_time": "2:06:05", "throughput": 2322.11, "total_tokens": 21149520} {"current_steps": 36680, "total_steps": 67140, "loss": 0.595, "lr": 2.5322333676977778e-05, "epoch": 5.463211200476616, "percentage": 54.63, "elapsed_time": "2:31:49", "remaining_time": "2:06:04", "throughput": 2322.14, "total_tokens": 21152432} {"current_steps": 36685, "total_steps": 67140, "loss": 0.5773, "lr": 2.531583536345072e-05, "epoch": 5.463955913017575, "percentage": 54.64, "elapsed_time": "2:31:50", "remaining_time": "2:06:03", "throughput": 2322.19, "total_tokens": 21155632} {"current_steps": 36690, "total_steps": 67140, "loss": 0.7592, "lr": 2.5309337028580792e-05, "epoch": 5.464700625558534, "percentage": 54.65, "elapsed_time": "2:31:51", "remaining_time": "2:06:01", "throughput": 2322.23, "total_tokens": 21158640} {"current_steps": 36695, "total_steps": 67140, "loss": 0.5534, "lr": 2.5302838672807128e-05, "epoch": 5.465445338099494, "percentage": 54.65, "elapsed_time": "2:31:52", "remaining_time": "2:06:00", "throughput": 2322.26, "total_tokens": 21161552} {"current_steps": 36700, "total_steps": 67140, "loss": 0.6642, "lr": 2.529634029656886e-05, "epoch": 5.466190050640453, "percentage": 54.66, "elapsed_time": "2:31:53", "remaining_time": "2:05:59", "throughput": 2322.26, "total_tokens": 21164112} {"current_steps": 36705, "total_steps": 67140, "loss": 0.7525, "lr": 2.528984190030512e-05, "epoch": 5.466934763181412, "percentage": 54.67, "elapsed_time": "2:31:54", "remaining_time": "2:05:57", "throughput": 2322.3, "total_tokens": 21167216} {"current_steps": 36710, "total_steps": 67140, "loss": 0.5677, "lr": 2.5283343484455036e-05, "epoch": 5.467679475722371, "percentage": 54.68, "elapsed_time": "2:31:55", "remaining_time": "2:05:56", "throughput": 2322.33, "total_tokens": 21170064} {"current_steps": 36715, "total_steps": 67140, "loss": 0.6416, "lr": 2.5276845049457754e-05, "epoch": 5.46842418826333, "percentage": 54.68, "elapsed_time": "2:31:57", "remaining_time": "2:05:55", "throughput": 2322.36, "total_tokens": 21172944} {"current_steps": 36720, "total_steps": 67140, "loss": 0.6473, "lr": 2.5270346595752414e-05, "epoch": 5.46916890080429, "percentage": 54.69, "elapsed_time": "2:31:58", "remaining_time": "2:05:53", "throughput": 2322.39, "total_tokens": 21175888} {"current_steps": 36725, "total_steps": 67140, "loss": 0.6013, "lr": 2.526384812377815e-05, "epoch": 5.469913613345248, "percentage": 54.7, "elapsed_time": "2:31:59", "remaining_time": "2:05:52", "throughput": 2322.42, "total_tokens": 21178832} {"current_steps": 36730, "total_steps": 67140, "loss": 0.451, "lr": 2.525734963397409e-05, "epoch": 5.470658325886208, "percentage": 54.71, "elapsed_time": "2:32:00", "remaining_time": "2:05:51", "throughput": 2322.45, "total_tokens": 21181840} {"current_steps": 36735, "total_steps": 67140, "loss": 0.6912, "lr": 2.5250851126779397e-05, "epoch": 5.471403038427167, "percentage": 54.71, "elapsed_time": "2:32:01", "remaining_time": "2:05:49", "throughput": 2322.5, "total_tokens": 21185008} {"current_steps": 36740, "total_steps": 67140, "loss": 0.8321, "lr": 2.5244352602633215e-05, "epoch": 5.4721477509681264, "percentage": 54.72, "elapsed_time": "2:32:02", "remaining_time": "2:05:48", "throughput": 2322.54, "total_tokens": 21188176} {"current_steps": 36745, "total_steps": 67140, "loss": 0.6341, "lr": 2.5237854061974665e-05, "epoch": 5.472892463509085, "percentage": 54.73, "elapsed_time": "2:32:03", "remaining_time": "2:05:47", "throughput": 2322.56, "total_tokens": 21190992} {"current_steps": 36750, "total_steps": 67140, "loss": 0.6225, "lr": 2.5231355505242906e-05, "epoch": 5.473637176050045, "percentage": 54.74, "elapsed_time": "2:32:05", "remaining_time": "2:05:45", "throughput": 2322.59, "total_tokens": 21193904} {"current_steps": 36755, "total_steps": 67140, "loss": 0.682, "lr": 2.5224856932877083e-05, "epoch": 5.474381888591004, "percentage": 54.74, "elapsed_time": "2:32:06", "remaining_time": "2:05:44", "throughput": 2322.62, "total_tokens": 21196752} {"current_steps": 36760, "total_steps": 67140, "loss": 0.6751, "lr": 2.5218358345316346e-05, "epoch": 5.475126601131963, "percentage": 54.75, "elapsed_time": "2:32:07", "remaining_time": "2:05:43", "throughput": 2322.64, "total_tokens": 21199536} {"current_steps": 36765, "total_steps": 67140, "loss": 0.3399, "lr": 2.521185974299983e-05, "epoch": 5.475871313672922, "percentage": 54.76, "elapsed_time": "2:32:08", "remaining_time": "2:05:41", "throughput": 2322.67, "total_tokens": 21202512} {"current_steps": 36770, "total_steps": 67140, "loss": 0.5843, "lr": 2.52053611263667e-05, "epoch": 5.476616026213882, "percentage": 54.77, "elapsed_time": "2:32:09", "remaining_time": "2:05:40", "throughput": 2322.7, "total_tokens": 21205424} {"current_steps": 36775, "total_steps": 67140, "loss": 0.6318, "lr": 2.5198862495856106e-05, "epoch": 5.47736073875484, "percentage": 54.77, "elapsed_time": "2:32:10", "remaining_time": "2:05:39", "throughput": 2322.73, "total_tokens": 21208400} {"current_steps": 36780, "total_steps": 67140, "loss": 0.6811, "lr": 2.519236385190719e-05, "epoch": 5.4781054512958, "percentage": 54.78, "elapsed_time": "2:32:11", "remaining_time": "2:05:37", "throughput": 2322.73, "total_tokens": 21210960} {"current_steps": 36785, "total_steps": 67140, "loss": 0.5435, "lr": 2.5185865194959103e-05, "epoch": 5.478850163836759, "percentage": 54.79, "elapsed_time": "2:32:13", "remaining_time": "2:05:36", "throughput": 2322.76, "total_tokens": 21213776} {"current_steps": 36790, "total_steps": 67140, "loss": 0.6836, "lr": 2.517936652545101e-05, "epoch": 5.4795948763777185, "percentage": 54.8, "elapsed_time": "2:32:14", "remaining_time": "2:05:35", "throughput": 2322.77, "total_tokens": 21216464} {"current_steps": 36795, "total_steps": 67140, "loss": 0.5762, "lr": 2.5172867843822046e-05, "epoch": 5.480339588918677, "percentage": 54.8, "elapsed_time": "2:32:15", "remaining_time": "2:05:33", "throughput": 2322.79, "total_tokens": 21219248} {"current_steps": 36800, "total_steps": 67140, "loss": 0.5974, "lr": 2.516636915051138e-05, "epoch": 5.481084301459637, "percentage": 54.81, "elapsed_time": "2:32:16", "remaining_time": "2:05:32", "throughput": 2322.81, "total_tokens": 21222096} {"current_steps": 36805, "total_steps": 67140, "loss": 0.5997, "lr": 2.515987044595817e-05, "epoch": 5.481829014000596, "percentage": 54.82, "elapsed_time": "2:32:17", "remaining_time": "2:05:31", "throughput": 2322.83, "total_tokens": 21224752} {"current_steps": 36810, "total_steps": 67140, "loss": 0.666, "lr": 2.5153371730601556e-05, "epoch": 5.482573726541555, "percentage": 54.83, "elapsed_time": "2:32:18", "remaining_time": "2:05:29", "throughput": 2322.85, "total_tokens": 21227664} {"current_steps": 36815, "total_steps": 67140, "loss": 0.6151, "lr": 2.51468730048807e-05, "epoch": 5.483318439082514, "percentage": 54.83, "elapsed_time": "2:32:19", "remaining_time": "2:05:28", "throughput": 2322.88, "total_tokens": 21230512} {"current_steps": 36820, "total_steps": 67140, "loss": 0.7202, "lr": 2.5140374269234772e-05, "epoch": 5.484063151623474, "percentage": 54.84, "elapsed_time": "2:32:20", "remaining_time": "2:05:27", "throughput": 2322.9, "total_tokens": 21233328} {"current_steps": 36825, "total_steps": 67140, "loss": 0.4693, "lr": 2.5133875524102922e-05, "epoch": 5.4848078641644324, "percentage": 54.85, "elapsed_time": "2:32:22", "remaining_time": "2:05:25", "throughput": 2322.93, "total_tokens": 21236240} {"current_steps": 36830, "total_steps": 67140, "loss": 0.6141, "lr": 2.5127376769924306e-05, "epoch": 5.485552576705392, "percentage": 54.86, "elapsed_time": "2:32:23", "remaining_time": "2:05:24", "throughput": 2322.94, "total_tokens": 21239024} {"current_steps": 36835, "total_steps": 67140, "loss": 0.6056, "lr": 2.512087800713808e-05, "epoch": 5.486297289246351, "percentage": 54.86, "elapsed_time": "2:32:24", "remaining_time": "2:05:23", "throughput": 2322.97, "total_tokens": 21241936} {"current_steps": 36840, "total_steps": 67140, "loss": 0.5053, "lr": 2.511437923618343e-05, "epoch": 5.4870420017873105, "percentage": 54.87, "elapsed_time": "2:32:25", "remaining_time": "2:05:21", "throughput": 2323.01, "total_tokens": 21244880} {"current_steps": 36845, "total_steps": 67140, "loss": 0.6644, "lr": 2.510788045749948e-05, "epoch": 5.487786714328269, "percentage": 54.88, "elapsed_time": "2:32:26", "remaining_time": "2:05:20", "throughput": 2323.02, "total_tokens": 21247536} {"current_steps": 36850, "total_steps": 67140, "loss": 0.5807, "lr": 2.5101381671525404e-05, "epoch": 5.488531426869228, "percentage": 54.89, "elapsed_time": "2:32:27", "remaining_time": "2:05:19", "throughput": 2323.08, "total_tokens": 21250992} {"current_steps": 36855, "total_steps": 67140, "loss": 0.5734, "lr": 2.5094882878700372e-05, "epoch": 5.489276139410188, "percentage": 54.89, "elapsed_time": "2:32:28", "remaining_time": "2:05:17", "throughput": 2323.1, "total_tokens": 21253776} {"current_steps": 36860, "total_steps": 67140, "loss": 0.6536, "lr": 2.5088384079463544e-05, "epoch": 5.490020851951147, "percentage": 54.9, "elapsed_time": "2:32:29", "remaining_time": "2:05:16", "throughput": 2323.11, "total_tokens": 21256432} {"current_steps": 36865, "total_steps": 67140, "loss": 0.5421, "lr": 2.5081885274254076e-05, "epoch": 5.490765564492106, "percentage": 54.91, "elapsed_time": "2:32:31", "remaining_time": "2:05:15", "throughput": 2323.13, "total_tokens": 21259216} {"current_steps": 36870, "total_steps": 67140, "loss": 0.6099, "lr": 2.5075386463511135e-05, "epoch": 5.491510277033065, "percentage": 54.92, "elapsed_time": "2:32:32", "remaining_time": "2:05:13", "throughput": 2323.18, "total_tokens": 21262352} {"current_steps": 36875, "total_steps": 67140, "loss": 0.6006, "lr": 2.5068887647673878e-05, "epoch": 5.4922549895740245, "percentage": 54.92, "elapsed_time": "2:32:33", "remaining_time": "2:05:12", "throughput": 2323.2, "total_tokens": 21265136} {"current_steps": 36880, "total_steps": 67140, "loss": 0.6293, "lr": 2.5062388827181483e-05, "epoch": 5.492999702114983, "percentage": 54.93, "elapsed_time": "2:32:34", "remaining_time": "2:05:11", "throughput": 2323.22, "total_tokens": 21267920} {"current_steps": 36885, "total_steps": 67140, "loss": 0.6628, "lr": 2.5055890002473097e-05, "epoch": 5.493744414655943, "percentage": 54.94, "elapsed_time": "2:32:35", "remaining_time": "2:05:09", "throughput": 2323.24, "total_tokens": 21270736} {"current_steps": 36890, "total_steps": 67140, "loss": 0.618, "lr": 2.5049391173987896e-05, "epoch": 5.494489127196902, "percentage": 54.94, "elapsed_time": "2:32:36", "remaining_time": "2:05:08", "throughput": 2323.27, "total_tokens": 21273776} {"current_steps": 36895, "total_steps": 67140, "loss": 0.54, "lr": 2.5042892342165036e-05, "epoch": 5.495233839737861, "percentage": 54.95, "elapsed_time": "2:32:37", "remaining_time": "2:05:07", "throughput": 2323.3, "total_tokens": 21276688} {"current_steps": 36900, "total_steps": 67140, "loss": 0.5514, "lr": 2.5036393507443694e-05, "epoch": 5.49597855227882, "percentage": 54.96, "elapsed_time": "2:32:39", "remaining_time": "2:05:05", "throughput": 2323.32, "total_tokens": 21279376} {"current_steps": 36905, "total_steps": 67140, "loss": 0.599, "lr": 2.5029894670263025e-05, "epoch": 5.49672326481978, "percentage": 54.97, "elapsed_time": "2:32:40", "remaining_time": "2:05:04", "throughput": 2323.33, "total_tokens": 21282096} {"current_steps": 36910, "total_steps": 67140, "loss": 0.7126, "lr": 2.502339583106219e-05, "epoch": 5.4974679773607384, "percentage": 54.97, "elapsed_time": "2:32:41", "remaining_time": "2:05:03", "throughput": 2323.39, "total_tokens": 21285456} {"current_steps": 36915, "total_steps": 67140, "loss": 0.7365, "lr": 2.5016896990280357e-05, "epoch": 5.498212689901698, "percentage": 54.98, "elapsed_time": "2:32:42", "remaining_time": "2:05:02", "throughput": 2323.42, "total_tokens": 21288464} {"current_steps": 36920, "total_steps": 67140, "loss": 0.7768, "lr": 2.50103981483567e-05, "epoch": 5.498957402442657, "percentage": 54.99, "elapsed_time": "2:32:43", "remaining_time": "2:05:00", "throughput": 2323.46, "total_tokens": 21291472} {"current_steps": 36925, "total_steps": 67140, "loss": 0.4672, "lr": 2.5003899305730383e-05, "epoch": 5.4997021149836165, "percentage": 55.0, "elapsed_time": "2:32:44", "remaining_time": "2:04:59", "throughput": 2323.48, "total_tokens": 21294256} {"current_steps": 36927, "total_steps": 67140, "eval_loss": 0.6592589616775513, "epoch": 5.5, "percentage": 55.0, "elapsed_time": "2:33:59", "remaining_time": "2:05:59", "throughput": 2304.79, "total_tokens": 21295472} {"current_steps": 36930, "total_steps": 67140, "loss": 0.6886, "lr": 2.499740046284056e-05, "epoch": 5.500446827524575, "percentage": 55.0, "elapsed_time": "2:34:02", "remaining_time": "2:06:00", "throughput": 2304.41, "total_tokens": 21297424} {"current_steps": 36935, "total_steps": 67140, "loss": 0.5999, "lr": 2.49909016201264e-05, "epoch": 5.501191540065535, "percentage": 55.01, "elapsed_time": "2:34:03", "remaining_time": "2:05:58", "throughput": 2304.44, "total_tokens": 21300368} {"current_steps": 36940, "total_steps": 67140, "loss": 0.4958, "lr": 2.498440277802708e-05, "epoch": 5.501936252606494, "percentage": 55.02, "elapsed_time": "2:34:04", "remaining_time": "2:05:57", "throughput": 2304.46, "total_tokens": 21303152} {"current_steps": 36945, "total_steps": 67140, "loss": 0.5292, "lr": 2.497790393698175e-05, "epoch": 5.502680965147453, "percentage": 55.03, "elapsed_time": "2:34:05", "remaining_time": "2:05:56", "throughput": 2304.5, "total_tokens": 21306256} {"current_steps": 36950, "total_steps": 67140, "loss": 0.4821, "lr": 2.4971405097429595e-05, "epoch": 5.503425677688412, "percentage": 55.03, "elapsed_time": "2:34:06", "remaining_time": "2:05:54", "throughput": 2304.51, "total_tokens": 21308880} {"current_steps": 36955, "total_steps": 67140, "loss": 0.6783, "lr": 2.4964906259809754e-05, "epoch": 5.504170390229372, "percentage": 55.04, "elapsed_time": "2:34:07", "remaining_time": "2:05:53", "throughput": 2304.53, "total_tokens": 21311536} {"current_steps": 36960, "total_steps": 67140, "loss": 0.6875, "lr": 2.495840742456141e-05, "epoch": 5.5049151027703305, "percentage": 55.05, "elapsed_time": "2:34:08", "remaining_time": "2:05:52", "throughput": 2304.55, "total_tokens": 21314352} {"current_steps": 36965, "total_steps": 67140, "loss": 0.3848, "lr": 2.495190859212372e-05, "epoch": 5.50565981531129, "percentage": 55.06, "elapsed_time": "2:34:09", "remaining_time": "2:05:50", "throughput": 2304.56, "total_tokens": 21317008} {"current_steps": 36970, "total_steps": 67140, "loss": 0.5121, "lr": 2.4945409762935855e-05, "epoch": 5.506404527852249, "percentage": 55.06, "elapsed_time": "2:34:11", "remaining_time": "2:05:49", "throughput": 2304.61, "total_tokens": 21320080} {"current_steps": 36975, "total_steps": 67140, "loss": 0.7067, "lr": 2.4938910937436974e-05, "epoch": 5.5071492403932085, "percentage": 55.07, "elapsed_time": "2:34:12", "remaining_time": "2:05:48", "throughput": 2304.62, "total_tokens": 21322672} {"current_steps": 36980, "total_steps": 67140, "loss": 0.6563, "lr": 2.4932412116066243e-05, "epoch": 5.507893952934167, "percentage": 55.08, "elapsed_time": "2:34:13", "remaining_time": "2:05:46", "throughput": 2304.67, "total_tokens": 21325840} {"current_steps": 36985, "total_steps": 67140, "loss": 0.5481, "lr": 2.492591329926283e-05, "epoch": 5.508638665475127, "percentage": 55.09, "elapsed_time": "2:34:14", "remaining_time": "2:05:45", "throughput": 2304.7, "total_tokens": 21328720} {"current_steps": 36990, "total_steps": 67140, "loss": 0.6746, "lr": 2.49194144874659e-05, "epoch": 5.509383378016086, "percentage": 55.09, "elapsed_time": "2:34:15", "remaining_time": "2:05:44", "throughput": 2304.72, "total_tokens": 21331472} {"current_steps": 36995, "total_steps": 67140, "loss": 0.5855, "lr": 2.4912915681114603e-05, "epoch": 5.510128090557045, "percentage": 55.1, "elapsed_time": "2:34:16", "remaining_time": "2:05:42", "throughput": 2304.76, "total_tokens": 21334608} {"current_steps": 37000, "total_steps": 67140, "loss": 0.5853, "lr": 2.490641688064811e-05, "epoch": 5.510872803098004, "percentage": 55.11, "elapsed_time": "2:34:17", "remaining_time": "2:05:41", "throughput": 2304.79, "total_tokens": 21337392} {"current_steps": 37005, "total_steps": 67140, "loss": 0.537, "lr": 2.4899918086505585e-05, "epoch": 5.511617515638964, "percentage": 55.12, "elapsed_time": "2:34:18", "remaining_time": "2:05:40", "throughput": 2304.8, "total_tokens": 21339984} {"current_steps": 37010, "total_steps": 67140, "loss": 0.5708, "lr": 2.489341929912619e-05, "epoch": 5.5123622281799225, "percentage": 55.12, "elapsed_time": "2:34:20", "remaining_time": "2:05:38", "throughput": 2304.8, "total_tokens": 21342512} {"current_steps": 37015, "total_steps": 67140, "loss": 0.644, "lr": 2.488692051894908e-05, "epoch": 5.513106940720881, "percentage": 55.13, "elapsed_time": "2:34:21", "remaining_time": "2:05:37", "throughput": 2304.84, "total_tokens": 21345552} {"current_steps": 37020, "total_steps": 67140, "loss": 0.5467, "lr": 2.488042174641343e-05, "epoch": 5.513851653261841, "percentage": 55.14, "elapsed_time": "2:34:22", "remaining_time": "2:05:35", "throughput": 2304.86, "total_tokens": 21348336} {"current_steps": 37025, "total_steps": 67140, "loss": 0.4946, "lr": 2.4873922981958383e-05, "epoch": 5.5145963658028005, "percentage": 55.15, "elapsed_time": "2:34:23", "remaining_time": "2:05:34", "throughput": 2304.88, "total_tokens": 21351120} {"current_steps": 37030, "total_steps": 67140, "loss": 0.6472, "lr": 2.4867424226023123e-05, "epoch": 5.515341078343759, "percentage": 55.15, "elapsed_time": "2:34:24", "remaining_time": "2:05:33", "throughput": 2304.91, "total_tokens": 21353968} {"current_steps": 37035, "total_steps": 67140, "loss": 0.5705, "lr": 2.486092547904678e-05, "epoch": 5.516085790884718, "percentage": 55.16, "elapsed_time": "2:34:25", "remaining_time": "2:05:31", "throughput": 2304.92, "total_tokens": 21356688} {"current_steps": 37040, "total_steps": 67140, "loss": 0.6724, "lr": 2.4854426741468537e-05, "epoch": 5.516830503425678, "percentage": 55.17, "elapsed_time": "2:34:26", "remaining_time": "2:05:30", "throughput": 2304.97, "total_tokens": 21359856} {"current_steps": 37045, "total_steps": 67140, "loss": 0.6013, "lr": 2.4847928013727537e-05, "epoch": 5.517575215966637, "percentage": 55.18, "elapsed_time": "2:34:28", "remaining_time": "2:05:29", "throughput": 2305.01, "total_tokens": 21362896} {"current_steps": 37050, "total_steps": 67140, "loss": 0.5766, "lr": 2.484142929626294e-05, "epoch": 5.518319928507596, "percentage": 55.18, "elapsed_time": "2:34:29", "remaining_time": "2:05:27", "throughput": 2305.04, "total_tokens": 21365776} {"current_steps": 37055, "total_steps": 67140, "loss": 0.6587, "lr": 2.4834930589513915e-05, "epoch": 5.519064641048555, "percentage": 55.19, "elapsed_time": "2:34:30", "remaining_time": "2:05:26", "throughput": 2305.1, "total_tokens": 21369136} {"current_steps": 37060, "total_steps": 67140, "loss": 0.5296, "lr": 2.4828431893919608e-05, "epoch": 5.5198093535895145, "percentage": 55.2, "elapsed_time": "2:34:31", "remaining_time": "2:05:25", "throughput": 2305.14, "total_tokens": 21372144} {"current_steps": 37065, "total_steps": 67140, "loss": 0.5295, "lr": 2.482193320991917e-05, "epoch": 5.520554066130473, "percentage": 55.21, "elapsed_time": "2:34:32", "remaining_time": "2:05:23", "throughput": 2305.15, "total_tokens": 21374768} {"current_steps": 37070, "total_steps": 67140, "loss": 0.6373, "lr": 2.4815434537951773e-05, "epoch": 5.521298778671433, "percentage": 55.21, "elapsed_time": "2:34:33", "remaining_time": "2:05:22", "throughput": 2305.17, "total_tokens": 21377552} {"current_steps": 37075, "total_steps": 67140, "loss": 0.6664, "lr": 2.4808935878456556e-05, "epoch": 5.522043491212392, "percentage": 55.22, "elapsed_time": "2:34:34", "remaining_time": "2:05:21", "throughput": 2305.22, "total_tokens": 21380816} {"current_steps": 37080, "total_steps": 67140, "loss": 0.702, "lr": 2.480243723187267e-05, "epoch": 5.522788203753351, "percentage": 55.23, "elapsed_time": "2:34:36", "remaining_time": "2:05:19", "throughput": 2305.24, "total_tokens": 21383472} {"current_steps": 37085, "total_steps": 67140, "loss": 0.5293, "lr": 2.4795938598639273e-05, "epoch": 5.52353291629431, "percentage": 55.24, "elapsed_time": "2:34:37", "remaining_time": "2:05:18", "throughput": 2305.28, "total_tokens": 21386608} {"current_steps": 37090, "total_steps": 67140, "loss": 0.5726, "lr": 2.478943997919552e-05, "epoch": 5.52427762883527, "percentage": 55.24, "elapsed_time": "2:34:38", "remaining_time": "2:05:17", "throughput": 2305.31, "total_tokens": 21389456} {"current_steps": 37095, "total_steps": 67140, "loss": 0.5648, "lr": 2.4782941373980552e-05, "epoch": 5.5250223413762285, "percentage": 55.25, "elapsed_time": "2:34:39", "remaining_time": "2:05:15", "throughput": 2305.36, "total_tokens": 21392624} {"current_steps": 37100, "total_steps": 67140, "loss": 0.5232, "lr": 2.4776442783433523e-05, "epoch": 5.525767053917188, "percentage": 55.26, "elapsed_time": "2:34:40", "remaining_time": "2:05:14", "throughput": 2305.38, "total_tokens": 21395504} {"current_steps": 37105, "total_steps": 67140, "loss": 0.6212, "lr": 2.476994420799359e-05, "epoch": 5.526511766458147, "percentage": 55.27, "elapsed_time": "2:34:41", "remaining_time": "2:05:13", "throughput": 2305.39, "total_tokens": 21398064} {"current_steps": 37110, "total_steps": 67140, "loss": 0.7065, "lr": 2.4763445648099894e-05, "epoch": 5.5272564789991065, "percentage": 55.27, "elapsed_time": "2:34:42", "remaining_time": "2:05:11", "throughput": 2305.44, "total_tokens": 21401296} {"current_steps": 37115, "total_steps": 67140, "loss": 0.4205, "lr": 2.4756947104191573e-05, "epoch": 5.528001191540065, "percentage": 55.28, "elapsed_time": "2:34:44", "remaining_time": "2:05:10", "throughput": 2305.46, "total_tokens": 21403952} {"current_steps": 37120, "total_steps": 67140, "loss": 0.7208, "lr": 2.4750448576707773e-05, "epoch": 5.528745904081025, "percentage": 55.29, "elapsed_time": "2:34:45", "remaining_time": "2:05:09", "throughput": 2305.47, "total_tokens": 21406608} {"current_steps": 37125, "total_steps": 67140, "loss": 0.4289, "lr": 2.474395006608765e-05, "epoch": 5.529490616621984, "percentage": 55.29, "elapsed_time": "2:34:46", "remaining_time": "2:05:07", "throughput": 2305.49, "total_tokens": 21409424} {"current_steps": 37130, "total_steps": 67140, "loss": 0.571, "lr": 2.4737451572770337e-05, "epoch": 5.530235329162943, "percentage": 55.3, "elapsed_time": "2:34:47", "remaining_time": "2:05:06", "throughput": 2305.51, "total_tokens": 21412176} {"current_steps": 37135, "total_steps": 67140, "loss": 0.6225, "lr": 2.4730953097194987e-05, "epoch": 5.530980041703902, "percentage": 55.31, "elapsed_time": "2:34:48", "remaining_time": "2:05:05", "throughput": 2305.55, "total_tokens": 21415152} {"current_steps": 37140, "total_steps": 67140, "loss": 0.6458, "lr": 2.4724454639800724e-05, "epoch": 5.531724754244862, "percentage": 55.32, "elapsed_time": "2:34:49", "remaining_time": "2:05:03", "throughput": 2305.6, "total_tokens": 21418384} {"current_steps": 37145, "total_steps": 67140, "loss": 0.8471, "lr": 2.4717956201026694e-05, "epoch": 5.5324694667858205, "percentage": 55.32, "elapsed_time": "2:34:50", "remaining_time": "2:05:02", "throughput": 2305.64, "total_tokens": 21421392} {"current_steps": 37150, "total_steps": 67140, "loss": 0.4779, "lr": 2.4711457781312052e-05, "epoch": 5.53321417932678, "percentage": 55.33, "elapsed_time": "2:34:52", "remaining_time": "2:05:01", "throughput": 2305.67, "total_tokens": 21424272} {"current_steps": 37155, "total_steps": 67140, "loss": 0.6874, "lr": 2.4704959381095914e-05, "epoch": 5.533958891867739, "percentage": 55.34, "elapsed_time": "2:34:53", "remaining_time": "2:04:59", "throughput": 2305.72, "total_tokens": 21427472} {"current_steps": 37160, "total_steps": 67140, "loss": 0.7357, "lr": 2.4698461000817415e-05, "epoch": 5.534703604408699, "percentage": 55.35, "elapsed_time": "2:34:54", "remaining_time": "2:04:58", "throughput": 2305.75, "total_tokens": 21430480} {"current_steps": 37165, "total_steps": 67140, "loss": 0.5918, "lr": 2.46919626409157e-05, "epoch": 5.535448316949657, "percentage": 55.35, "elapsed_time": "2:34:55", "remaining_time": "2:04:57", "throughput": 2305.8, "total_tokens": 21433616} {"current_steps": 37170, "total_steps": 67140, "loss": 0.6364, "lr": 2.46854643018299e-05, "epoch": 5.536193029490617, "percentage": 55.36, "elapsed_time": "2:34:56", "remaining_time": "2:04:55", "throughput": 2305.82, "total_tokens": 21436432} {"current_steps": 37175, "total_steps": 67140, "loss": 0.6204, "lr": 2.4678965983999133e-05, "epoch": 5.536937742031576, "percentage": 55.37, "elapsed_time": "2:34:57", "remaining_time": "2:04:54", "throughput": 2305.86, "total_tokens": 21439376} {"current_steps": 37180, "total_steps": 67140, "loss": 0.6563, "lr": 2.4672467687862545e-05, "epoch": 5.537682454572535, "percentage": 55.38, "elapsed_time": "2:34:58", "remaining_time": "2:04:53", "throughput": 2305.88, "total_tokens": 21442224} {"current_steps": 37185, "total_steps": 67140, "loss": 0.6908, "lr": 2.4665969413859264e-05, "epoch": 5.538427167113494, "percentage": 55.38, "elapsed_time": "2:35:00", "remaining_time": "2:04:51", "throughput": 2305.9, "total_tokens": 21445040} {"current_steps": 37190, "total_steps": 67140, "loss": 0.6029, "lr": 2.4659471162428404e-05, "epoch": 5.539171879654454, "percentage": 55.39, "elapsed_time": "2:35:01", "remaining_time": "2:04:50", "throughput": 2305.92, "total_tokens": 21447728} {"current_steps": 37195, "total_steps": 67140, "loss": 0.6129, "lr": 2.4652972934009112e-05, "epoch": 5.5399165921954125, "percentage": 55.4, "elapsed_time": "2:35:02", "remaining_time": "2:04:49", "throughput": 2305.95, "total_tokens": 21450640} {"current_steps": 37200, "total_steps": 67140, "loss": 0.5387, "lr": 2.4646474729040486e-05, "epoch": 5.540661304736371, "percentage": 55.41, "elapsed_time": "2:35:03", "remaining_time": "2:04:47", "throughput": 2305.98, "total_tokens": 21453616} {"current_steps": 37205, "total_steps": 67140, "loss": 0.5947, "lr": 2.4639976547961665e-05, "epoch": 5.541406017277331, "percentage": 55.41, "elapsed_time": "2:35:04", "remaining_time": "2:04:46", "throughput": 2306.02, "total_tokens": 21456624} {"current_steps": 37210, "total_steps": 67140, "loss": 0.6194, "lr": 2.4633478391211762e-05, "epoch": 5.542150729818291, "percentage": 55.42, "elapsed_time": "2:35:05", "remaining_time": "2:04:45", "throughput": 2306.03, "total_tokens": 21459280} {"current_steps": 37215, "total_steps": 67140, "loss": 0.8001, "lr": 2.46269802592299e-05, "epoch": 5.542895442359249, "percentage": 55.43, "elapsed_time": "2:35:06", "remaining_time": "2:04:43", "throughput": 2306.07, "total_tokens": 21462192} {"current_steps": 37220, "total_steps": 67140, "loss": 0.5839, "lr": 2.4620482152455197e-05, "epoch": 5.543640154900208, "percentage": 55.44, "elapsed_time": "2:35:07", "remaining_time": "2:04:42", "throughput": 2306.09, "total_tokens": 21465008} {"current_steps": 37225, "total_steps": 67140, "loss": 0.5783, "lr": 2.4613984071326762e-05, "epoch": 5.544384867441168, "percentage": 55.44, "elapsed_time": "2:35:09", "remaining_time": "2:04:41", "throughput": 2306.11, "total_tokens": 21467760} {"current_steps": 37230, "total_steps": 67140, "loss": 0.7038, "lr": 2.4607486016283717e-05, "epoch": 5.5451295799821265, "percentage": 55.45, "elapsed_time": "2:35:10", "remaining_time": "2:04:39", "throughput": 2306.13, "total_tokens": 21470576} {"current_steps": 37235, "total_steps": 67140, "loss": 0.3802, "lr": 2.4600987987765183e-05, "epoch": 5.545874292523086, "percentage": 55.46, "elapsed_time": "2:35:11", "remaining_time": "2:04:38", "throughput": 2306.18, "total_tokens": 21473840} {"current_steps": 37240, "total_steps": 67140, "loss": 0.4973, "lr": 2.459448998621025e-05, "epoch": 5.546619005064045, "percentage": 55.47, "elapsed_time": "2:35:12", "remaining_time": "2:04:37", "throughput": 2306.22, "total_tokens": 21476848} {"current_steps": 37245, "total_steps": 67140, "loss": 0.8171, "lr": 2.458799201205803e-05, "epoch": 5.547363717605005, "percentage": 55.47, "elapsed_time": "2:35:13", "remaining_time": "2:04:35", "throughput": 2306.24, "total_tokens": 21479632} {"current_steps": 37250, "total_steps": 67140, "loss": 0.4878, "lr": 2.4581494065747634e-05, "epoch": 5.548108430145963, "percentage": 55.48, "elapsed_time": "2:35:14", "remaining_time": "2:04:34", "throughput": 2306.27, "total_tokens": 21482576} {"current_steps": 37255, "total_steps": 67140, "loss": 0.5079, "lr": 2.4574996147718175e-05, "epoch": 5.548853142686923, "percentage": 55.49, "elapsed_time": "2:35:15", "remaining_time": "2:04:33", "throughput": 2306.29, "total_tokens": 21485360} {"current_steps": 37260, "total_steps": 67140, "loss": 0.9374, "lr": 2.456849825840874e-05, "epoch": 5.549597855227882, "percentage": 55.5, "elapsed_time": "2:35:17", "remaining_time": "2:04:31", "throughput": 2306.32, "total_tokens": 21488144} {"current_steps": 37265, "total_steps": 67140, "loss": 0.5154, "lr": 2.4562000398258442e-05, "epoch": 5.550342567768841, "percentage": 55.5, "elapsed_time": "2:35:18", "remaining_time": "2:04:30", "throughput": 2306.34, "total_tokens": 21490960} {"current_steps": 37270, "total_steps": 67140, "loss": 0.711, "lr": 2.455550256770638e-05, "epoch": 5.5510872803098, "percentage": 55.51, "elapsed_time": "2:35:19", "remaining_time": "2:04:29", "throughput": 2306.39, "total_tokens": 21494192} {"current_steps": 37275, "total_steps": 67140, "loss": 0.5794, "lr": 2.454900476719165e-05, "epoch": 5.55183199285076, "percentage": 55.52, "elapsed_time": "2:35:20", "remaining_time": "2:04:27", "throughput": 2306.41, "total_tokens": 21497072} {"current_steps": 37280, "total_steps": 67140, "loss": 0.6596, "lr": 2.454250699715334e-05, "epoch": 5.5525767053917185, "percentage": 55.53, "elapsed_time": "2:35:21", "remaining_time": "2:04:26", "throughput": 2306.43, "total_tokens": 21499824} {"current_steps": 37285, "total_steps": 67140, "loss": 0.6461, "lr": 2.453600925803054e-05, "epoch": 5.553321417932678, "percentage": 55.53, "elapsed_time": "2:35:22", "remaining_time": "2:04:24", "throughput": 2306.46, "total_tokens": 21502640} {"current_steps": 37290, "total_steps": 67140, "loss": 0.8666, "lr": 2.4529511550262357e-05, "epoch": 5.554066130473637, "percentage": 55.54, "elapsed_time": "2:35:23", "remaining_time": "2:04:23", "throughput": 2306.5, "total_tokens": 21505680} {"current_steps": 37295, "total_steps": 67140, "loss": 0.4476, "lr": 2.4523013874287863e-05, "epoch": 5.554810843014597, "percentage": 55.55, "elapsed_time": "2:35:25", "remaining_time": "2:04:22", "throughput": 2306.54, "total_tokens": 21508720} {"current_steps": 37300, "total_steps": 67140, "loss": 0.5751, "lr": 2.451651623054616e-05, "epoch": 5.555555555555555, "percentage": 55.56, "elapsed_time": "2:35:26", "remaining_time": "2:04:20", "throughput": 2306.55, "total_tokens": 21511472} {"current_steps": 37305, "total_steps": 67140, "loss": 0.5118, "lr": 2.451001861947632e-05, "epoch": 5.556300268096515, "percentage": 55.56, "elapsed_time": "2:35:27", "remaining_time": "2:04:19", "throughput": 2306.58, "total_tokens": 21514320} {"current_steps": 37310, "total_steps": 67140, "loss": 0.637, "lr": 2.4503521041517426e-05, "epoch": 5.557044980637474, "percentage": 55.57, "elapsed_time": "2:35:28", "remaining_time": "2:04:18", "throughput": 2306.6, "total_tokens": 21517104} {"current_steps": 37315, "total_steps": 67140, "loss": 0.578, "lr": 2.4497023497108575e-05, "epoch": 5.557789693178433, "percentage": 55.58, "elapsed_time": "2:35:29", "remaining_time": "2:04:16", "throughput": 2306.62, "total_tokens": 21519984} {"current_steps": 37320, "total_steps": 67140, "loss": 0.6859, "lr": 2.4490525986688826e-05, "epoch": 5.558534405719392, "percentage": 55.59, "elapsed_time": "2:35:30", "remaining_time": "2:04:15", "throughput": 2306.67, "total_tokens": 21523120} {"current_steps": 37325, "total_steps": 67140, "loss": 0.6046, "lr": 2.4484028510697253e-05, "epoch": 5.559279118260352, "percentage": 55.59, "elapsed_time": "2:35:31", "remaining_time": "2:04:14", "throughput": 2306.69, "total_tokens": 21525872} {"current_steps": 37330, "total_steps": 67140, "loss": 0.5942, "lr": 2.4477531069572934e-05, "epoch": 5.560023830801311, "percentage": 55.6, "elapsed_time": "2:35:33", "remaining_time": "2:04:12", "throughput": 2306.71, "total_tokens": 21528752} {"current_steps": 37335, "total_steps": 67140, "loss": 0.6525, "lr": 2.447103366375495e-05, "epoch": 5.56076854334227, "percentage": 55.61, "elapsed_time": "2:35:34", "remaining_time": "2:04:11", "throughput": 2306.72, "total_tokens": 21531280} {"current_steps": 37340, "total_steps": 67140, "loss": 0.6359, "lr": 2.4464536293682353e-05, "epoch": 5.561513255883229, "percentage": 55.62, "elapsed_time": "2:35:35", "remaining_time": "2:04:10", "throughput": 2306.78, "total_tokens": 21534576} {"current_steps": 37345, "total_steps": 67140, "loss": 0.6865, "lr": 2.4458038959794218e-05, "epoch": 5.562257968424189, "percentage": 55.62, "elapsed_time": "2:35:36", "remaining_time": "2:04:08", "throughput": 2306.81, "total_tokens": 21537488} {"current_steps": 37350, "total_steps": 67140, "loss": 0.4761, "lr": 2.4451541662529605e-05, "epoch": 5.563002680965147, "percentage": 55.63, "elapsed_time": "2:35:37", "remaining_time": "2:04:07", "throughput": 2306.83, "total_tokens": 21540336} {"current_steps": 37355, "total_steps": 67140, "loss": 0.465, "lr": 2.444504440232759e-05, "epoch": 5.563747393506107, "percentage": 55.64, "elapsed_time": "2:35:38", "remaining_time": "2:04:06", "throughput": 2306.85, "total_tokens": 21543024} {"current_steps": 37360, "total_steps": 67140, "loss": 0.7162, "lr": 2.4438547179627203e-05, "epoch": 5.564492106047066, "percentage": 55.64, "elapsed_time": "2:35:39", "remaining_time": "2:04:04", "throughput": 2306.88, "total_tokens": 21545872} {"current_steps": 37365, "total_steps": 67140, "loss": 0.5972, "lr": 2.443204999486752e-05, "epoch": 5.5652368185880245, "percentage": 55.65, "elapsed_time": "2:35:41", "remaining_time": "2:04:03", "throughput": 2306.92, "total_tokens": 21549008} {"current_steps": 37370, "total_steps": 67140, "loss": 0.8129, "lr": 2.4425552848487588e-05, "epoch": 5.565981531128984, "percentage": 55.66, "elapsed_time": "2:35:42", "remaining_time": "2:04:02", "throughput": 2306.93, "total_tokens": 21551632} {"current_steps": 37375, "total_steps": 67140, "loss": 0.6687, "lr": 2.4419055740926456e-05, "epoch": 5.566726243669944, "percentage": 55.67, "elapsed_time": "2:35:43", "remaining_time": "2:04:00", "throughput": 2306.96, "total_tokens": 21554416} {"current_steps": 37380, "total_steps": 67140, "loss": 0.7506, "lr": 2.4412558672623177e-05, "epoch": 5.567470956210903, "percentage": 55.67, "elapsed_time": "2:35:44", "remaining_time": "2:03:59", "throughput": 2306.97, "total_tokens": 21557040} {"current_steps": 37385, "total_steps": 67140, "loss": 0.5274, "lr": 2.44060616440168e-05, "epoch": 5.568215668751861, "percentage": 55.68, "elapsed_time": "2:35:45", "remaining_time": "2:03:58", "throughput": 2306.99, "total_tokens": 21559888} {"current_steps": 37390, "total_steps": 67140, "loss": 0.6325, "lr": 2.4399564655546354e-05, "epoch": 5.568960381292821, "percentage": 55.69, "elapsed_time": "2:35:46", "remaining_time": "2:03:56", "throughput": 2307.04, "total_tokens": 21563088} {"current_steps": 37395, "total_steps": 67140, "loss": 0.5117, "lr": 2.43930677076509e-05, "epoch": 5.569705093833781, "percentage": 55.7, "elapsed_time": "2:35:47", "remaining_time": "2:03:55", "throughput": 2307.06, "total_tokens": 21565744} {"current_steps": 37400, "total_steps": 67140, "loss": 0.577, "lr": 2.4386570800769447e-05, "epoch": 5.570449806374739, "percentage": 55.7, "elapsed_time": "2:35:48", "remaining_time": "2:03:54", "throughput": 2307.08, "total_tokens": 21568496} {"current_steps": 37405, "total_steps": 67140, "loss": 0.5985, "lr": 2.438007393534106e-05, "epoch": 5.571194518915698, "percentage": 55.71, "elapsed_time": "2:35:49", "remaining_time": "2:03:52", "throughput": 2307.09, "total_tokens": 21571120} {"current_steps": 37410, "total_steps": 67140, "loss": 0.7462, "lr": 2.4373577111804744e-05, "epoch": 5.571939231456658, "percentage": 55.72, "elapsed_time": "2:35:51", "remaining_time": "2:03:51", "throughput": 2307.1, "total_tokens": 21573712} {"current_steps": 37415, "total_steps": 67140, "loss": 0.475, "lr": 2.436708033059954e-05, "epoch": 5.572683943997617, "percentage": 55.73, "elapsed_time": "2:35:52", "remaining_time": "2:03:49", "throughput": 2307.1, "total_tokens": 21576240} {"current_steps": 37420, "total_steps": 67140, "loss": 0.7115, "lr": 2.4360583592164483e-05, "epoch": 5.573428656538576, "percentage": 55.73, "elapsed_time": "2:35:53", "remaining_time": "2:03:48", "throughput": 2307.14, "total_tokens": 21579248} {"current_steps": 37425, "total_steps": 67140, "loss": 0.359, "lr": 2.435408689693858e-05, "epoch": 5.574173369079535, "percentage": 55.74, "elapsed_time": "2:35:54", "remaining_time": "2:03:47", "throughput": 2307.17, "total_tokens": 21582160} {"current_steps": 37430, "total_steps": 67140, "loss": 0.6467, "lr": 2.4347590245360857e-05, "epoch": 5.574918081620495, "percentage": 55.75, "elapsed_time": "2:35:55", "remaining_time": "2:03:45", "throughput": 2307.22, "total_tokens": 21585360} {"current_steps": 37435, "total_steps": 67140, "loss": 0.5769, "lr": 2.4341093637870345e-05, "epoch": 5.575662794161453, "percentage": 55.76, "elapsed_time": "2:35:56", "remaining_time": "2:03:44", "throughput": 2307.26, "total_tokens": 21588464} {"current_steps": 37440, "total_steps": 67140, "loss": 0.4329, "lr": 2.433459707490604e-05, "epoch": 5.576407506702413, "percentage": 55.76, "elapsed_time": "2:35:57", "remaining_time": "2:03:43", "throughput": 2307.3, "total_tokens": 21591504} {"current_steps": 37445, "total_steps": 67140, "loss": 0.7015, "lr": 2.4328100556906956e-05, "epoch": 5.577152219243372, "percentage": 55.77, "elapsed_time": "2:35:59", "remaining_time": "2:03:42", "throughput": 2307.34, "total_tokens": 21594672} {"current_steps": 37450, "total_steps": 67140, "loss": 0.6582, "lr": 2.4321604084312103e-05, "epoch": 5.577896931784331, "percentage": 55.78, "elapsed_time": "2:36:00", "remaining_time": "2:03:40", "throughput": 2307.38, "total_tokens": 21597712} {"current_steps": 37455, "total_steps": 67140, "loss": 0.5611, "lr": 2.4315107657560492e-05, "epoch": 5.57864164432529, "percentage": 55.79, "elapsed_time": "2:36:01", "remaining_time": "2:03:39", "throughput": 2307.42, "total_tokens": 21600656} {"current_steps": 37460, "total_steps": 67140, "loss": 0.3912, "lr": 2.4308611277091118e-05, "epoch": 5.57938635686625, "percentage": 55.79, "elapsed_time": "2:36:02", "remaining_time": "2:03:38", "throughput": 2307.43, "total_tokens": 21603312} {"current_steps": 37465, "total_steps": 67140, "loss": 0.6519, "lr": 2.4302114943342986e-05, "epoch": 5.580131069407209, "percentage": 55.8, "elapsed_time": "2:36:03", "remaining_time": "2:03:36", "throughput": 2307.43, "total_tokens": 21605872} {"current_steps": 37470, "total_steps": 67140, "loss": 0.6821, "lr": 2.4295618656755084e-05, "epoch": 5.580875781948168, "percentage": 55.81, "elapsed_time": "2:36:04", "remaining_time": "2:03:35", "throughput": 2307.45, "total_tokens": 21608624} {"current_steps": 37475, "total_steps": 67140, "loss": 0.6249, "lr": 2.4289122417766422e-05, "epoch": 5.581620494489127, "percentage": 55.82, "elapsed_time": "2:36:05", "remaining_time": "2:03:33", "throughput": 2307.47, "total_tokens": 21611408} {"current_steps": 37480, "total_steps": 67140, "loss": 0.5938, "lr": 2.4282626226815963e-05, "epoch": 5.582365207030087, "percentage": 55.82, "elapsed_time": "2:36:06", "remaining_time": "2:03:32", "throughput": 2307.49, "total_tokens": 21614192} {"current_steps": 37485, "total_steps": 67140, "loss": 0.6446, "lr": 2.4276130084342714e-05, "epoch": 5.583109919571045, "percentage": 55.83, "elapsed_time": "2:36:08", "remaining_time": "2:03:31", "throughput": 2307.53, "total_tokens": 21617200} {"current_steps": 37490, "total_steps": 67140, "loss": 0.6166, "lr": 2.4269633990785645e-05, "epoch": 5.583854632112005, "percentage": 55.84, "elapsed_time": "2:36:09", "remaining_time": "2:03:29", "throughput": 2307.55, "total_tokens": 21619984} {"current_steps": 37495, "total_steps": 67140, "loss": 0.5992, "lr": 2.4263137946583743e-05, "epoch": 5.584599344652964, "percentage": 55.85, "elapsed_time": "2:36:10", "remaining_time": "2:03:28", "throughput": 2307.58, "total_tokens": 21622832} {"current_steps": 37500, "total_steps": 67140, "loss": 0.6057, "lr": 2.4256641952175983e-05, "epoch": 5.5853440571939235, "percentage": 55.85, "elapsed_time": "2:36:11", "remaining_time": "2:03:27", "throughput": 2307.61, "total_tokens": 21625680} {"current_steps": 37505, "total_steps": 67140, "loss": 0.6987, "lr": 2.425014600800134e-05, "epoch": 5.586088769734882, "percentage": 55.86, "elapsed_time": "2:36:12", "remaining_time": "2:03:25", "throughput": 2307.62, "total_tokens": 21628336} {"current_steps": 37510, "total_steps": 67140, "loss": 0.6304, "lr": 2.4243650114498776e-05, "epoch": 5.586833482275842, "percentage": 55.87, "elapsed_time": "2:36:13", "remaining_time": "2:03:24", "throughput": 2307.65, "total_tokens": 21631280} {"current_steps": 37515, "total_steps": 67140, "loss": 0.7236, "lr": 2.4237154272107274e-05, "epoch": 5.587578194816801, "percentage": 55.88, "elapsed_time": "2:36:14", "remaining_time": "2:03:23", "throughput": 2307.69, "total_tokens": 21634224} {"current_steps": 37520, "total_steps": 67140, "loss": 0.6433, "lr": 2.423065848126578e-05, "epoch": 5.58832290735776, "percentage": 55.88, "elapsed_time": "2:36:16", "remaining_time": "2:03:21", "throughput": 2307.72, "total_tokens": 21637168} {"current_steps": 37525, "total_steps": 67140, "loss": 0.5505, "lr": 2.4224162742413252e-05, "epoch": 5.589067619898719, "percentage": 55.89, "elapsed_time": "2:36:17", "remaining_time": "2:03:20", "throughput": 2307.75, "total_tokens": 21640144} {"current_steps": 37530, "total_steps": 67140, "loss": 0.6794, "lr": 2.421766705598865e-05, "epoch": 5.589812332439678, "percentage": 55.9, "elapsed_time": "2:36:18", "remaining_time": "2:03:19", "throughput": 2307.77, "total_tokens": 21642896} {"current_steps": 37535, "total_steps": 67140, "loss": 0.6556, "lr": 2.4211171422430937e-05, "epoch": 5.590557044980637, "percentage": 55.91, "elapsed_time": "2:36:19", "remaining_time": "2:03:17", "throughput": 2307.82, "total_tokens": 21646160} {"current_steps": 37540, "total_steps": 67140, "loss": 0.6964, "lr": 2.4204675842179046e-05, "epoch": 5.591301757521597, "percentage": 55.91, "elapsed_time": "2:36:20", "remaining_time": "2:03:16", "throughput": 2307.85, "total_tokens": 21648976} {"current_steps": 37545, "total_steps": 67140, "loss": 0.683, "lr": 2.4198180315671927e-05, "epoch": 5.592046470062556, "percentage": 55.92, "elapsed_time": "2:36:21", "remaining_time": "2:03:15", "throughput": 2307.86, "total_tokens": 21651728} {"current_steps": 37550, "total_steps": 67140, "loss": 0.6794, "lr": 2.4191684843348524e-05, "epoch": 5.592791182603515, "percentage": 55.93, "elapsed_time": "2:36:22", "remaining_time": "2:03:13", "throughput": 2307.88, "total_tokens": 21654512} {"current_steps": 37555, "total_steps": 67140, "loss": 0.4025, "lr": 2.418518942564778e-05, "epoch": 5.593535895144474, "percentage": 55.94, "elapsed_time": "2:36:23", "remaining_time": "2:03:12", "throughput": 2307.91, "total_tokens": 21657296} {"current_steps": 37560, "total_steps": 67140, "loss": 0.6185, "lr": 2.4178694063008616e-05, "epoch": 5.594280607685434, "percentage": 55.94, "elapsed_time": "2:36:25", "remaining_time": "2:03:11", "throughput": 2307.93, "total_tokens": 21660176} {"current_steps": 37565, "total_steps": 67140, "loss": 0.7664, "lr": 2.4172198755869962e-05, "epoch": 5.595025320226393, "percentage": 55.95, "elapsed_time": "2:36:26", "remaining_time": "2:03:09", "throughput": 2307.98, "total_tokens": 21663440} {"current_steps": 37570, "total_steps": 67140, "loss": 0.7011, "lr": 2.4165703504670757e-05, "epoch": 5.595770032767351, "percentage": 55.96, "elapsed_time": "2:36:27", "remaining_time": "2:03:08", "throughput": 2308.0, "total_tokens": 21666224} {"current_steps": 37575, "total_steps": 67140, "loss": 0.6396, "lr": 2.4159208309849916e-05, "epoch": 5.596514745308311, "percentage": 55.97, "elapsed_time": "2:36:28", "remaining_time": "2:03:07", "throughput": 2308.03, "total_tokens": 21669104} {"current_steps": 37580, "total_steps": 67140, "loss": 0.4561, "lr": 2.4152713171846355e-05, "epoch": 5.59725945784927, "percentage": 55.97, "elapsed_time": "2:36:29", "remaining_time": "2:03:05", "throughput": 2308.05, "total_tokens": 21671888} {"current_steps": 37585, "total_steps": 67140, "loss": 0.7441, "lr": 2.4146218091099e-05, "epoch": 5.5980041703902295, "percentage": 55.98, "elapsed_time": "2:36:30", "remaining_time": "2:03:04", "throughput": 2308.08, "total_tokens": 21674832} {"current_steps": 37590, "total_steps": 67140, "loss": 0.6088, "lr": 2.413972306804675e-05, "epoch": 5.598748882931188, "percentage": 55.99, "elapsed_time": "2:36:31", "remaining_time": "2:03:03", "throughput": 2308.09, "total_tokens": 21677456} {"current_steps": 37595, "total_steps": 67140, "loss": 0.4449, "lr": 2.4133228103128526e-05, "epoch": 5.599493595472148, "percentage": 55.99, "elapsed_time": "2:36:33", "remaining_time": "2:03:01", "throughput": 2308.13, "total_tokens": 21680400} {"current_steps": 37600, "total_steps": 67140, "loss": 0.6593, "lr": 2.4126733196783214e-05, "epoch": 5.600238308013107, "percentage": 56.0, "elapsed_time": "2:36:34", "remaining_time": "2:03:00", "throughput": 2308.16, "total_tokens": 21683344} {"current_steps": 37605, "total_steps": 67140, "loss": 0.7041, "lr": 2.4120238349449728e-05, "epoch": 5.600983020554066, "percentage": 56.01, "elapsed_time": "2:36:35", "remaining_time": "2:02:59", "throughput": 2308.18, "total_tokens": 21686192} {"current_steps": 37610, "total_steps": 67140, "loss": 0.6012, "lr": 2.411374356156695e-05, "epoch": 5.601727733095025, "percentage": 56.02, "elapsed_time": "2:36:36", "remaining_time": "2:02:57", "throughput": 2308.21, "total_tokens": 21689008} {"current_steps": 37615, "total_steps": 67140, "loss": 0.5547, "lr": 2.410724883357378e-05, "epoch": 5.602472445635985, "percentage": 56.02, "elapsed_time": "2:36:37", "remaining_time": "2:02:56", "throughput": 2308.22, "total_tokens": 21691600} {"current_steps": 37620, "total_steps": 67140, "loss": 0.7528, "lr": 2.4100754165909108e-05, "epoch": 5.603217158176943, "percentage": 56.03, "elapsed_time": "2:36:38", "remaining_time": "2:02:55", "throughput": 2308.23, "total_tokens": 21694288} {"current_steps": 37625, "total_steps": 67140, "loss": 0.5462, "lr": 2.4094259559011813e-05, "epoch": 5.603961870717903, "percentage": 56.04, "elapsed_time": "2:36:39", "remaining_time": "2:02:53", "throughput": 2308.26, "total_tokens": 21697232} {"current_steps": 37630, "total_steps": 67140, "loss": 0.5346, "lr": 2.4087765013320776e-05, "epoch": 5.604706583258862, "percentage": 56.05, "elapsed_time": "2:36:40", "remaining_time": "2:02:52", "throughput": 2308.28, "total_tokens": 21699984} {"current_steps": 37635, "total_steps": 67140, "loss": 0.6819, "lr": 2.408127052927487e-05, "epoch": 5.6054512957998215, "percentage": 56.05, "elapsed_time": "2:36:42", "remaining_time": "2:02:51", "throughput": 2308.3, "total_tokens": 21702832} {"current_steps": 37640, "total_steps": 67140, "loss": 0.6865, "lr": 2.407477610731297e-05, "epoch": 5.60619600834078, "percentage": 56.06, "elapsed_time": "2:36:43", "remaining_time": "2:02:49", "throughput": 2308.33, "total_tokens": 21705680} {"current_steps": 37645, "total_steps": 67140, "loss": 0.7127, "lr": 2.4068281747873927e-05, "epoch": 5.60694072088174, "percentage": 56.07, "elapsed_time": "2:36:44", "remaining_time": "2:02:48", "throughput": 2308.36, "total_tokens": 21708624} {"current_steps": 37650, "total_steps": 67140, "loss": 0.6553, "lr": 2.4061787451396626e-05, "epoch": 5.607685433422699, "percentage": 56.08, "elapsed_time": "2:36:45", "remaining_time": "2:02:46", "throughput": 2308.38, "total_tokens": 21711344} {"current_steps": 37655, "total_steps": 67140, "loss": 0.5969, "lr": 2.4055293218319907e-05, "epoch": 5.608430145963658, "percentage": 56.08, "elapsed_time": "2:36:46", "remaining_time": "2:02:45", "throughput": 2308.43, "total_tokens": 21714672} {"current_steps": 37660, "total_steps": 67140, "loss": 0.6125, "lr": 2.4048799049082632e-05, "epoch": 5.609174858504617, "percentage": 56.09, "elapsed_time": "2:36:47", "remaining_time": "2:02:44", "throughput": 2308.46, "total_tokens": 21717616} {"current_steps": 37665, "total_steps": 67140, "loss": 0.6056, "lr": 2.4042304944123654e-05, "epoch": 5.609919571045577, "percentage": 56.1, "elapsed_time": "2:36:48", "remaining_time": "2:02:43", "throughput": 2308.49, "total_tokens": 21720464} {"current_steps": 37670, "total_steps": 67140, "loss": 0.4977, "lr": 2.4035810903881813e-05, "epoch": 5.6106642835865355, "percentage": 56.11, "elapsed_time": "2:36:50", "remaining_time": "2:02:41", "throughput": 2308.52, "total_tokens": 21723312} {"current_steps": 37675, "total_steps": 67140, "loss": 0.7294, "lr": 2.4029316928795958e-05, "epoch": 5.611408996127495, "percentage": 56.11, "elapsed_time": "2:36:51", "remaining_time": "2:02:40", "throughput": 2308.56, "total_tokens": 21726384} {"current_steps": 37680, "total_steps": 67140, "loss": 0.696, "lr": 2.402282301930491e-05, "epoch": 5.612153708668454, "percentage": 56.12, "elapsed_time": "2:36:52", "remaining_time": "2:02:39", "throughput": 2308.58, "total_tokens": 21729296} {"current_steps": 37685, "total_steps": 67140, "loss": 0.5361, "lr": 2.4016329175847514e-05, "epoch": 5.6128984212094135, "percentage": 56.13, "elapsed_time": "2:36:53", "remaining_time": "2:02:37", "throughput": 2308.61, "total_tokens": 21732208} {"current_steps": 37690, "total_steps": 67140, "loss": 0.5637, "lr": 2.4009835398862588e-05, "epoch": 5.613643133750372, "percentage": 56.14, "elapsed_time": "2:36:54", "remaining_time": "2:02:36", "throughput": 2308.63, "total_tokens": 21734960} {"current_steps": 37695, "total_steps": 67140, "loss": 0.8136, "lr": 2.4003341688788958e-05, "epoch": 5.614387846291332, "percentage": 56.14, "elapsed_time": "2:36:55", "remaining_time": "2:02:35", "throughput": 2308.65, "total_tokens": 21737744} {"current_steps": 37700, "total_steps": 67140, "loss": 0.6566, "lr": 2.399684804606545e-05, "epoch": 5.615132558832291, "percentage": 56.15, "elapsed_time": "2:36:56", "remaining_time": "2:02:33", "throughput": 2308.68, "total_tokens": 21740592} {"current_steps": 37705, "total_steps": 67140, "loss": 0.6448, "lr": 2.3990354471130873e-05, "epoch": 5.61587727137325, "percentage": 56.16, "elapsed_time": "2:36:58", "remaining_time": "2:02:32", "throughput": 2308.71, "total_tokens": 21743440} {"current_steps": 37710, "total_steps": 67140, "loss": 0.5375, "lr": 2.398386096442403e-05, "epoch": 5.616621983914209, "percentage": 56.17, "elapsed_time": "2:36:59", "remaining_time": "2:02:30", "throughput": 2308.72, "total_tokens": 21746128} {"current_steps": 37715, "total_steps": 67140, "loss": 0.6296, "lr": 2.3977367526383744e-05, "epoch": 5.617366696455168, "percentage": 56.17, "elapsed_time": "2:37:00", "remaining_time": "2:02:29", "throughput": 2308.75, "total_tokens": 21749136} {"current_steps": 37720, "total_steps": 67140, "loss": 0.4822, "lr": 2.39708741574488e-05, "epoch": 5.6181114089961275, "percentage": 56.18, "elapsed_time": "2:37:01", "remaining_time": "2:02:28", "throughput": 2308.77, "total_tokens": 21751920} {"current_steps": 37725, "total_steps": 67140, "loss": 0.5568, "lr": 2.3964380858057985e-05, "epoch": 5.618856121537087, "percentage": 56.19, "elapsed_time": "2:37:02", "remaining_time": "2:02:26", "throughput": 2308.81, "total_tokens": 21754960} {"current_steps": 37730, "total_steps": 67140, "loss": 0.4774, "lr": 2.3957887628650104e-05, "epoch": 5.619600834078046, "percentage": 56.2, "elapsed_time": "2:37:03", "remaining_time": "2:02:25", "throughput": 2308.83, "total_tokens": 21757712} {"current_steps": 37735, "total_steps": 67140, "loss": 0.6351, "lr": 2.3951394469663946e-05, "epoch": 5.620345546619005, "percentage": 56.2, "elapsed_time": "2:37:04", "remaining_time": "2:02:24", "throughput": 2308.89, "total_tokens": 21760976} {"current_steps": 37740, "total_steps": 67140, "loss": 0.6191, "lr": 2.394490138153828e-05, "epoch": 5.621090259159964, "percentage": 56.21, "elapsed_time": "2:37:06", "remaining_time": "2:02:23", "throughput": 2308.92, "total_tokens": 21763952} {"current_steps": 37745, "total_steps": 67140, "loss": 0.7159, "lr": 2.393840836471189e-05, "epoch": 5.621834971700923, "percentage": 56.22, "elapsed_time": "2:37:07", "remaining_time": "2:02:21", "throughput": 2308.96, "total_tokens": 21766928} {"current_steps": 37750, "total_steps": 67140, "loss": 0.6139, "lr": 2.3931915419623552e-05, "epoch": 5.622579684241883, "percentage": 56.23, "elapsed_time": "2:37:08", "remaining_time": "2:02:20", "throughput": 2308.99, "total_tokens": 21769904} {"current_steps": 37755, "total_steps": 67140, "loss": 0.6807, "lr": 2.3925422546712032e-05, "epoch": 5.6233243967828415, "percentage": 56.23, "elapsed_time": "2:37:09", "remaining_time": "2:02:19", "throughput": 2309.02, "total_tokens": 21772720} {"current_steps": 37760, "total_steps": 67140, "loss": 0.5637, "lr": 2.3918929746416077e-05, "epoch": 5.624069109323801, "percentage": 56.24, "elapsed_time": "2:37:10", "remaining_time": "2:02:17", "throughput": 2309.04, "total_tokens": 21775568} {"current_steps": 37765, "total_steps": 67140, "loss": 0.6337, "lr": 2.3912437019174454e-05, "epoch": 5.62481382186476, "percentage": 56.25, "elapsed_time": "2:37:11", "remaining_time": "2:02:16", "throughput": 2309.07, "total_tokens": 21778512} {"current_steps": 37770, "total_steps": 67140, "loss": 0.6915, "lr": 2.3905944365425922e-05, "epoch": 5.6255585344057195, "percentage": 56.26, "elapsed_time": "2:37:12", "remaining_time": "2:02:14", "throughput": 2309.1, "total_tokens": 21781360} {"current_steps": 37775, "total_steps": 67140, "loss": 0.7824, "lr": 2.3899451785609218e-05, "epoch": 5.626303246946678, "percentage": 56.26, "elapsed_time": "2:37:14", "remaining_time": "2:02:13", "throughput": 2309.14, "total_tokens": 21784464} {"current_steps": 37780, "total_steps": 67140, "loss": 0.4372, "lr": 2.3892959280163084e-05, "epoch": 5.627047959487638, "percentage": 56.27, "elapsed_time": "2:37:15", "remaining_time": "2:02:12", "throughput": 2309.17, "total_tokens": 21787312} {"current_steps": 37785, "total_steps": 67140, "loss": 0.623, "lr": 2.388646684952627e-05, "epoch": 5.627792672028597, "percentage": 56.28, "elapsed_time": "2:37:16", "remaining_time": "2:02:11", "throughput": 2309.19, "total_tokens": 21790256} {"current_steps": 37790, "total_steps": 67140, "loss": 0.6117, "lr": 2.3879974494137487e-05, "epoch": 5.628537384569556, "percentage": 56.29, "elapsed_time": "2:37:17", "remaining_time": "2:02:09", "throughput": 2309.21, "total_tokens": 21793008} {"current_steps": 37795, "total_steps": 67140, "loss": 0.4301, "lr": 2.3873482214435486e-05, "epoch": 5.629282097110515, "percentage": 56.29, "elapsed_time": "2:37:18", "remaining_time": "2:02:08", "throughput": 2309.25, "total_tokens": 21795984} {"current_steps": 37800, "total_steps": 67140, "loss": 0.564, "lr": 2.3866990010858976e-05, "epoch": 5.630026809651475, "percentage": 56.3, "elapsed_time": "2:37:19", "remaining_time": "2:02:07", "throughput": 2309.28, "total_tokens": 21798960} {"current_steps": 37805, "total_steps": 67140, "loss": 0.6431, "lr": 2.386049788384667e-05, "epoch": 5.6307715221924335, "percentage": 56.31, "elapsed_time": "2:37:20", "remaining_time": "2:02:05", "throughput": 2309.3, "total_tokens": 21801744} {"current_steps": 37810, "total_steps": 67140, "loss": 0.7561, "lr": 2.3854005833837285e-05, "epoch": 5.631516234733393, "percentage": 56.32, "elapsed_time": "2:37:21", "remaining_time": "2:02:04", "throughput": 2309.33, "total_tokens": 21804560} {"current_steps": 37815, "total_steps": 67140, "loss": 0.6376, "lr": 2.384751386126953e-05, "epoch": 5.632260947274352, "percentage": 56.32, "elapsed_time": "2:37:23", "remaining_time": "2:02:02", "throughput": 2309.34, "total_tokens": 21807344} {"current_steps": 37820, "total_steps": 67140, "loss": 0.4963, "lr": 2.3841021966582095e-05, "epoch": 5.6330056598153115, "percentage": 56.33, "elapsed_time": "2:37:24", "remaining_time": "2:02:01", "throughput": 2309.36, "total_tokens": 21810032} {"current_steps": 37825, "total_steps": 67140, "loss": 0.4711, "lr": 2.3834530150213686e-05, "epoch": 5.63375037235627, "percentage": 56.34, "elapsed_time": "2:37:25", "remaining_time": "2:02:00", "throughput": 2309.38, "total_tokens": 21812816} {"current_steps": 37830, "total_steps": 67140, "loss": 0.5228, "lr": 2.3828038412602993e-05, "epoch": 5.63449508489723, "percentage": 56.34, "elapsed_time": "2:37:26", "remaining_time": "2:01:58", "throughput": 2309.38, "total_tokens": 21815312} {"current_steps": 37835, "total_steps": 67140, "loss": 0.645, "lr": 2.3821546754188698e-05, "epoch": 5.635239797438189, "percentage": 56.35, "elapsed_time": "2:37:27", "remaining_time": "2:01:57", "throughput": 2309.42, "total_tokens": 21818256} {"current_steps": 37840, "total_steps": 67140, "loss": 0.7109, "lr": 2.381505517540949e-05, "epoch": 5.635984509979148, "percentage": 56.36, "elapsed_time": "2:37:28", "remaining_time": "2:01:56", "throughput": 2309.43, "total_tokens": 21820976} {"current_steps": 37845, "total_steps": 67140, "loss": 0.726, "lr": 2.3808563676704027e-05, "epoch": 5.636729222520107, "percentage": 56.37, "elapsed_time": "2:37:29", "remaining_time": "2:01:54", "throughput": 2309.47, "total_tokens": 21823984} {"current_steps": 37850, "total_steps": 67140, "loss": 0.7929, "lr": 2.3802072258510986e-05, "epoch": 5.637473935061067, "percentage": 56.37, "elapsed_time": "2:37:30", "remaining_time": "2:01:53", "throughput": 2309.52, "total_tokens": 21827120} {"current_steps": 37855, "total_steps": 67140, "loss": 0.5427, "lr": 2.3795580921269034e-05, "epoch": 5.6382186476020255, "percentage": 56.38, "elapsed_time": "2:37:32", "remaining_time": "2:01:52", "throughput": 2309.54, "total_tokens": 21830000} {"current_steps": 37860, "total_steps": 67140, "loss": 0.536, "lr": 2.378908966541682e-05, "epoch": 5.638963360142985, "percentage": 56.39, "elapsed_time": "2:37:33", "remaining_time": "2:01:50", "throughput": 2309.57, "total_tokens": 21832880} {"current_steps": 37865, "total_steps": 67140, "loss": 0.6833, "lr": 2.3782598491393014e-05, "epoch": 5.639708072683944, "percentage": 56.4, "elapsed_time": "2:37:34", "remaining_time": "2:01:49", "throughput": 2309.6, "total_tokens": 21835792} {"current_steps": 37870, "total_steps": 67140, "loss": 0.7052, "lr": 2.3776107399636247e-05, "epoch": 5.640452785224904, "percentage": 56.4, "elapsed_time": "2:37:35", "remaining_time": "2:01:48", "throughput": 2309.62, "total_tokens": 21838608} {"current_steps": 37875, "total_steps": 67140, "loss": 0.6632, "lr": 2.376961639058516e-05, "epoch": 5.641197497765862, "percentage": 56.41, "elapsed_time": "2:37:36", "remaining_time": "2:01:46", "throughput": 2309.64, "total_tokens": 21841264} {"current_steps": 37880, "total_steps": 67140, "loss": 0.5914, "lr": 2.3763125464678414e-05, "epoch": 5.641942210306821, "percentage": 56.42, "elapsed_time": "2:37:37", "remaining_time": "2:01:45", "throughput": 2309.68, "total_tokens": 21844336} {"current_steps": 37885, "total_steps": 67140, "loss": 0.6269, "lr": 2.3756634622354607e-05, "epoch": 5.642686922847781, "percentage": 56.43, "elapsed_time": "2:37:38", "remaining_time": "2:01:44", "throughput": 2309.69, "total_tokens": 21847056} {"current_steps": 37890, "total_steps": 67140, "loss": 0.671, "lr": 2.3750143864052376e-05, "epoch": 5.64343163538874, "percentage": 56.43, "elapsed_time": "2:37:39", "remaining_time": "2:01:42", "throughput": 2309.7, "total_tokens": 21849680} {"current_steps": 37895, "total_steps": 67140, "loss": 0.7038, "lr": 2.374365319021034e-05, "epoch": 5.644176347929699, "percentage": 56.44, "elapsed_time": "2:37:41", "remaining_time": "2:01:41", "throughput": 2309.72, "total_tokens": 21852432} {"current_steps": 37900, "total_steps": 67140, "loss": 0.634, "lr": 2.373716260126712e-05, "epoch": 5.644921060470658, "percentage": 56.45, "elapsed_time": "2:37:42", "remaining_time": "2:01:40", "throughput": 2309.74, "total_tokens": 21855184} {"current_steps": 37905, "total_steps": 67140, "loss": 0.6649, "lr": 2.373067209766131e-05, "epoch": 5.6456657730116175, "percentage": 56.46, "elapsed_time": "2:37:43", "remaining_time": "2:01:38", "throughput": 2309.75, "total_tokens": 21857936} {"current_steps": 37910, "total_steps": 67140, "loss": 0.6153, "lr": 2.372418167983152e-05, "epoch": 5.646410485552577, "percentage": 56.46, "elapsed_time": "2:37:44", "remaining_time": "2:01:37", "throughput": 2309.78, "total_tokens": 21860752} {"current_steps": 37915, "total_steps": 67140, "loss": 0.4255, "lr": 2.371769134821635e-05, "epoch": 5.647155198093536, "percentage": 56.47, "elapsed_time": "2:37:45", "remaining_time": "2:01:36", "throughput": 2309.81, "total_tokens": 21863728} {"current_steps": 37920, "total_steps": 67140, "loss": 0.7053, "lr": 2.371120110325439e-05, "epoch": 5.647899910634495, "percentage": 56.48, "elapsed_time": "2:37:46", "remaining_time": "2:01:34", "throughput": 2309.85, "total_tokens": 21866768} {"current_steps": 37925, "total_steps": 67140, "loss": 0.7719, "lr": 2.370471094538421e-05, "epoch": 5.648644623175454, "percentage": 56.49, "elapsed_time": "2:37:47", "remaining_time": "2:01:33", "throughput": 2309.89, "total_tokens": 21869904} {"current_steps": 37930, "total_steps": 67140, "loss": 0.6487, "lr": 2.3698220875044396e-05, "epoch": 5.649389335716413, "percentage": 56.49, "elapsed_time": "2:37:49", "remaining_time": "2:01:32", "throughput": 2309.92, "total_tokens": 21872784} {"current_steps": 37935, "total_steps": 67140, "loss": 0.5447, "lr": 2.369173089267353e-05, "epoch": 5.650134048257373, "percentage": 56.5, "elapsed_time": "2:37:50", "remaining_time": "2:01:30", "throughput": 2309.93, "total_tokens": 21875472} {"current_steps": 37940, "total_steps": 67140, "loss": 0.5113, "lr": 2.3685240998710166e-05, "epoch": 5.6508787607983315, "percentage": 56.51, "elapsed_time": "2:37:51", "remaining_time": "2:01:29", "throughput": 2309.97, "total_tokens": 21878512} {"current_steps": 37945, "total_steps": 67140, "loss": 0.5116, "lr": 2.367875119359287e-05, "epoch": 5.651623473339291, "percentage": 56.52, "elapsed_time": "2:37:52", "remaining_time": "2:01:28", "throughput": 2309.99, "total_tokens": 21881264} {"current_steps": 37950, "total_steps": 67140, "loss": 0.3965, "lr": 2.36722614777602e-05, "epoch": 5.65236818588025, "percentage": 56.52, "elapsed_time": "2:37:53", "remaining_time": "2:01:26", "throughput": 2309.99, "total_tokens": 21883760} {"current_steps": 37955, "total_steps": 67140, "loss": 0.7554, "lr": 2.3665771851650697e-05, "epoch": 5.65311289842121, "percentage": 56.53, "elapsed_time": "2:37:54", "remaining_time": "2:01:25", "throughput": 2310.01, "total_tokens": 21886480} {"current_steps": 37960, "total_steps": 67140, "loss": 0.4894, "lr": 2.3659282315702918e-05, "epoch": 5.653857610962168, "percentage": 56.54, "elapsed_time": "2:37:55", "remaining_time": "2:01:24", "throughput": 2310.04, "total_tokens": 21889456} {"current_steps": 37965, "total_steps": 67140, "loss": 0.5411, "lr": 2.365279287035538e-05, "epoch": 5.654602323503128, "percentage": 56.55, "elapsed_time": "2:37:56", "remaining_time": "2:01:22", "throughput": 2310.05, "total_tokens": 21892080} {"current_steps": 37970, "total_steps": 67140, "loss": 0.5919, "lr": 2.3646303516046626e-05, "epoch": 5.655347036044087, "percentage": 56.55, "elapsed_time": "2:37:58", "remaining_time": "2:01:21", "throughput": 2310.09, "total_tokens": 21895152} {"current_steps": 37975, "total_steps": 67140, "loss": 0.6133, "lr": 2.363981425321517e-05, "epoch": 5.656091748585046, "percentage": 56.56, "elapsed_time": "2:37:59", "remaining_time": "2:01:20", "throughput": 2310.14, "total_tokens": 21898320} {"current_steps": 37980, "total_steps": 67140, "loss": 0.612, "lr": 2.3633325082299545e-05, "epoch": 5.656836461126005, "percentage": 56.57, "elapsed_time": "2:38:00", "remaining_time": "2:01:18", "throughput": 2310.16, "total_tokens": 21901040} {"current_steps": 37985, "total_steps": 67140, "loss": 0.6955, "lr": 2.362683600373825e-05, "epoch": 5.657581173666965, "percentage": 56.58, "elapsed_time": "2:38:01", "remaining_time": "2:01:17", "throughput": 2310.17, "total_tokens": 21903664} {"current_steps": 37990, "total_steps": 67140, "loss": 0.5762, "lr": 2.362034701796979e-05, "epoch": 5.6583258862079235, "percentage": 56.58, "elapsed_time": "2:38:02", "remaining_time": "2:01:16", "throughput": 2310.19, "total_tokens": 21906416} {"current_steps": 37995, "total_steps": 67140, "loss": 0.6596, "lr": 2.3613858125432677e-05, "epoch": 5.659070598748883, "percentage": 56.59, "elapsed_time": "2:38:03", "remaining_time": "2:01:14", "throughput": 2310.19, "total_tokens": 21908880} {"current_steps": 38000, "total_steps": 67140, "loss": 0.7202, "lr": 2.3607369326565403e-05, "epoch": 5.659815311289842, "percentage": 56.6, "elapsed_time": "2:38:04", "remaining_time": "2:01:13", "throughput": 2310.21, "total_tokens": 21911728} {"current_steps": 38005, "total_steps": 67140, "loss": 0.5349, "lr": 2.3600880621806438e-05, "epoch": 5.660560023830802, "percentage": 56.61, "elapsed_time": "2:38:05", "remaining_time": "2:01:11", "throughput": 2310.25, "total_tokens": 21914736} {"current_steps": 38010, "total_steps": 67140, "loss": 0.4991, "lr": 2.359439201159427e-05, "epoch": 5.66130473637176, "percentage": 56.61, "elapsed_time": "2:38:06", "remaining_time": "2:01:10", "throughput": 2310.26, "total_tokens": 21917424} {"current_steps": 38015, "total_steps": 67140, "loss": 0.5655, "lr": 2.3587903496367382e-05, "epoch": 5.66204944891272, "percentage": 56.62, "elapsed_time": "2:38:08", "remaining_time": "2:01:09", "throughput": 2310.3, "total_tokens": 21920432} {"current_steps": 38020, "total_steps": 67140, "loss": 0.6024, "lr": 2.3581415076564225e-05, "epoch": 5.662794161453679, "percentage": 56.63, "elapsed_time": "2:38:09", "remaining_time": "2:01:07", "throughput": 2310.34, "total_tokens": 21923600} {"current_steps": 38025, "total_steps": 67140, "loss": 0.6948, "lr": 2.3574926752623276e-05, "epoch": 5.663538873994638, "percentage": 56.64, "elapsed_time": "2:38:10", "remaining_time": "2:01:06", "throughput": 2310.37, "total_tokens": 21926480} {"current_steps": 38030, "total_steps": 67140, "loss": 0.5688, "lr": 2.3568438524982984e-05, "epoch": 5.664283586535597, "percentage": 56.64, "elapsed_time": "2:38:11", "remaining_time": "2:01:05", "throughput": 2310.41, "total_tokens": 21929616} {"current_steps": 38035, "total_steps": 67140, "loss": 0.5234, "lr": 2.3561950394081793e-05, "epoch": 5.665028299076557, "percentage": 56.65, "elapsed_time": "2:38:12", "remaining_time": "2:01:04", "throughput": 2310.43, "total_tokens": 21932400} {"current_steps": 38040, "total_steps": 67140, "loss": 0.7071, "lr": 2.3555462360358154e-05, "epoch": 5.665773011617516, "percentage": 56.66, "elapsed_time": "2:38:13", "remaining_time": "2:01:02", "throughput": 2310.47, "total_tokens": 21935408} {"current_steps": 38045, "total_steps": 67140, "loss": 0.7685, "lr": 2.3548974424250492e-05, "epoch": 5.666517724158475, "percentage": 56.67, "elapsed_time": "2:38:15", "remaining_time": "2:01:01", "throughput": 2310.48, "total_tokens": 21938096} {"current_steps": 38050, "total_steps": 67140, "loss": 0.6384, "lr": 2.3542486586197237e-05, "epoch": 5.667262436699434, "percentage": 56.67, "elapsed_time": "2:38:16", "remaining_time": "2:01:00", "throughput": 2310.52, "total_tokens": 21941040} {"current_steps": 38055, "total_steps": 67140, "loss": 0.6376, "lr": 2.3535998846636815e-05, "epoch": 5.668007149240394, "percentage": 56.68, "elapsed_time": "2:38:17", "remaining_time": "2:00:58", "throughput": 2310.51, "total_tokens": 21943472} {"current_steps": 38060, "total_steps": 67140, "loss": 0.6966, "lr": 2.352951120600763e-05, "epoch": 5.668751861781352, "percentage": 56.69, "elapsed_time": "2:38:18", "remaining_time": "2:00:57", "throughput": 2310.54, "total_tokens": 21946352} {"current_steps": 38065, "total_steps": 67140, "loss": 0.6787, "lr": 2.352302366474811e-05, "epoch": 5.669496574322311, "percentage": 56.69, "elapsed_time": "2:38:19", "remaining_time": "2:00:55", "throughput": 2310.55, "total_tokens": 21948976} {"current_steps": 38070, "total_steps": 67140, "loss": 0.6482, "lr": 2.351653622329664e-05, "epoch": 5.670241286863271, "percentage": 56.7, "elapsed_time": "2:38:20", "remaining_time": "2:00:54", "throughput": 2310.57, "total_tokens": 21951824} {"current_steps": 38075, "total_steps": 67140, "loss": 0.5022, "lr": 2.351004888209162e-05, "epoch": 5.67098599940423, "percentage": 56.71, "elapsed_time": "2:38:21", "remaining_time": "2:00:53", "throughput": 2310.6, "total_tokens": 21954736} {"current_steps": 38080, "total_steps": 67140, "loss": 0.6071, "lr": 2.3503561641571455e-05, "epoch": 5.671730711945189, "percentage": 56.72, "elapsed_time": "2:38:22", "remaining_time": "2:00:51", "throughput": 2310.61, "total_tokens": 21957360} {"current_steps": 38085, "total_steps": 67140, "loss": 0.5809, "lr": 2.3497074502174495e-05, "epoch": 5.672475424486148, "percentage": 56.72, "elapsed_time": "2:38:23", "remaining_time": "2:00:50", "throughput": 2310.62, "total_tokens": 21959984} {"current_steps": 38090, "total_steps": 67140, "loss": 0.6495, "lr": 2.349058746433913e-05, "epoch": 5.673220137027108, "percentage": 56.73, "elapsed_time": "2:38:25", "remaining_time": "2:00:49", "throughput": 2310.64, "total_tokens": 21962768} {"current_steps": 38095, "total_steps": 67140, "loss": 0.5757, "lr": 2.348410052850373e-05, "epoch": 5.673964849568066, "percentage": 56.74, "elapsed_time": "2:38:26", "remaining_time": "2:00:47", "throughput": 2310.67, "total_tokens": 21965808} {"current_steps": 38100, "total_steps": 67140, "loss": 0.5974, "lr": 2.347761369510665e-05, "epoch": 5.674709562109026, "percentage": 56.75, "elapsed_time": "2:38:27", "remaining_time": "2:00:46", "throughput": 2310.7, "total_tokens": 21968688} {"current_steps": 38105, "total_steps": 67140, "loss": 0.5208, "lr": 2.3471126964586247e-05, "epoch": 5.675454274649985, "percentage": 56.75, "elapsed_time": "2:38:28", "remaining_time": "2:00:45", "throughput": 2310.74, "total_tokens": 21971664} {"current_steps": 38110, "total_steps": 67140, "loss": 0.5204, "lr": 2.3464640337380868e-05, "epoch": 5.676198987190944, "percentage": 56.76, "elapsed_time": "2:38:29", "remaining_time": "2:00:43", "throughput": 2310.78, "total_tokens": 21974800} {"current_steps": 38115, "total_steps": 67140, "loss": 0.5036, "lr": 2.3458153813928857e-05, "epoch": 5.676943699731903, "percentage": 56.77, "elapsed_time": "2:38:30", "remaining_time": "2:00:42", "throughput": 2310.8, "total_tokens": 21977584} {"current_steps": 38120, "total_steps": 67140, "loss": 0.6117, "lr": 2.345166739466855e-05, "epoch": 5.677688412272863, "percentage": 56.78, "elapsed_time": "2:38:31", "remaining_time": "2:00:41", "throughput": 2310.84, "total_tokens": 21980656} {"current_steps": 38125, "total_steps": 67140, "loss": 0.6266, "lr": 2.344518108003825e-05, "epoch": 5.678433124813822, "percentage": 56.78, "elapsed_time": "2:38:33", "remaining_time": "2:00:40", "throughput": 2310.89, "total_tokens": 21983888} {"current_steps": 38130, "total_steps": 67140, "loss": 0.7696, "lr": 2.3438694870476295e-05, "epoch": 5.679177837354781, "percentage": 56.79, "elapsed_time": "2:38:34", "remaining_time": "2:00:38", "throughput": 2310.91, "total_tokens": 21986800} {"current_steps": 38135, "total_steps": 67140, "loss": 0.5178, "lr": 2.3432208766421e-05, "epoch": 5.67992254989574, "percentage": 56.8, "elapsed_time": "2:38:35", "remaining_time": "2:00:37", "throughput": 2310.94, "total_tokens": 21989680} {"current_steps": 38140, "total_steps": 67140, "loss": 0.6673, "lr": 2.3425722768310652e-05, "epoch": 5.6806672624367, "percentage": 56.81, "elapsed_time": "2:38:36", "remaining_time": "2:00:36", "throughput": 2310.96, "total_tokens": 21992560} {"current_steps": 38145, "total_steps": 67140, "loss": 0.5297, "lr": 2.3419236876583568e-05, "epoch": 5.681411974977658, "percentage": 56.81, "elapsed_time": "2:38:37", "remaining_time": "2:00:34", "throughput": 2310.99, "total_tokens": 21995440} {"current_steps": 38150, "total_steps": 67140, "loss": 0.8135, "lr": 2.341275109167802e-05, "epoch": 5.682156687518618, "percentage": 56.82, "elapsed_time": "2:38:38", "remaining_time": "2:00:33", "throughput": 2311.02, "total_tokens": 21998416} {"current_steps": 38155, "total_steps": 67140, "loss": 0.741, "lr": 2.34062654140323e-05, "epoch": 5.682901400059577, "percentage": 56.83, "elapsed_time": "2:38:40", "remaining_time": "2:00:32", "throughput": 2311.06, "total_tokens": 22001424} {"current_steps": 38160, "total_steps": 67140, "loss": 0.6242, "lr": 2.33997798440847e-05, "epoch": 5.683646112600536, "percentage": 56.84, "elapsed_time": "2:38:41", "remaining_time": "2:00:30", "throughput": 2311.09, "total_tokens": 22004336} {"current_steps": 38165, "total_steps": 67140, "loss": 0.7287, "lr": 2.3393294382273462e-05, "epoch": 5.684390825141495, "percentage": 56.84, "elapsed_time": "2:38:42", "remaining_time": "2:00:29", "throughput": 2311.1, "total_tokens": 22007024} {"current_steps": 38170, "total_steps": 67140, "loss": 0.9222, "lr": 2.338680902903685e-05, "epoch": 5.685135537682455, "percentage": 56.85, "elapsed_time": "2:38:43", "remaining_time": "2:00:28", "throughput": 2311.14, "total_tokens": 22010032} {"current_steps": 38175, "total_steps": 67140, "loss": 0.5643, "lr": 2.338032378481313e-05, "epoch": 5.685880250223414, "percentage": 56.86, "elapsed_time": "2:38:44", "remaining_time": "2:00:26", "throughput": 2311.18, "total_tokens": 22013040} {"current_steps": 38180, "total_steps": 67140, "loss": 0.5023, "lr": 2.3373838650040548e-05, "epoch": 5.686624962764373, "percentage": 56.87, "elapsed_time": "2:38:45", "remaining_time": "2:00:25", "throughput": 2311.23, "total_tokens": 22016272} {"current_steps": 38185, "total_steps": 67140, "loss": 0.4945, "lr": 2.3367353625157333e-05, "epoch": 5.687369675305332, "percentage": 56.87, "elapsed_time": "2:38:46", "remaining_time": "2:00:24", "throughput": 2311.26, "total_tokens": 22019056} {"current_steps": 38190, "total_steps": 67140, "loss": 0.5882, "lr": 2.3360868710601717e-05, "epoch": 5.688114387846292, "percentage": 56.88, "elapsed_time": "2:38:48", "remaining_time": "2:00:22", "throughput": 2311.28, "total_tokens": 22021936} {"current_steps": 38195, "total_steps": 67140, "loss": 0.508, "lr": 2.335438390681194e-05, "epoch": 5.68885910038725, "percentage": 56.89, "elapsed_time": "2:38:49", "remaining_time": "2:00:21", "throughput": 2311.33, "total_tokens": 22025072} {"current_steps": 38200, "total_steps": 67140, "loss": 0.5848, "lr": 2.3347899214226214e-05, "epoch": 5.68960381292821, "percentage": 56.9, "elapsed_time": "2:38:50", "remaining_time": "2:00:20", "throughput": 2311.34, "total_tokens": 22027760} {"current_steps": 38205, "total_steps": 67140, "loss": 0.6593, "lr": 2.334141463328273e-05, "epoch": 5.690348525469169, "percentage": 56.9, "elapsed_time": "2:38:51", "remaining_time": "2:00:18", "throughput": 2311.35, "total_tokens": 22030512} {"current_steps": 38210, "total_steps": 67140, "loss": 0.7383, "lr": 2.33349301644197e-05, "epoch": 5.6910932380101285, "percentage": 56.91, "elapsed_time": "2:38:52", "remaining_time": "2:00:17", "throughput": 2311.4, "total_tokens": 22033616} {"current_steps": 38215, "total_steps": 67140, "loss": 0.7924, "lr": 2.332844580807533e-05, "epoch": 5.691837950551087, "percentage": 56.92, "elapsed_time": "2:38:53", "remaining_time": "2:00:16", "throughput": 2311.42, "total_tokens": 22036400} {"current_steps": 38220, "total_steps": 67140, "loss": 0.5616, "lr": 2.3321961564687787e-05, "epoch": 5.692582663092047, "percentage": 56.93, "elapsed_time": "2:38:54", "remaining_time": "2:00:14", "throughput": 2311.42, "total_tokens": 22038864} {"current_steps": 38225, "total_steps": 67140, "loss": 0.6812, "lr": 2.3315477434695256e-05, "epoch": 5.693327375633006, "percentage": 56.93, "elapsed_time": "2:38:55", "remaining_time": "2:00:13", "throughput": 2311.44, "total_tokens": 22041744} {"current_steps": 38230, "total_steps": 67140, "loss": 0.5845, "lr": 2.3308993418535924e-05, "epoch": 5.694072088173964, "percentage": 56.94, "elapsed_time": "2:38:57", "remaining_time": "2:00:12", "throughput": 2311.49, "total_tokens": 22044784} {"current_steps": 38235, "total_steps": 67140, "loss": 0.6252, "lr": 2.330250951664793e-05, "epoch": 5.694816800714924, "percentage": 56.95, "elapsed_time": "2:38:58", "remaining_time": "2:00:10", "throughput": 2311.5, "total_tokens": 22047536} {"current_steps": 38240, "total_steps": 67140, "loss": 0.5004, "lr": 2.3296025729469457e-05, "epoch": 5.695561513255884, "percentage": 56.96, "elapsed_time": "2:38:59", "remaining_time": "2:00:09", "throughput": 2311.54, "total_tokens": 22050640} {"current_steps": 38245, "total_steps": 67140, "loss": 0.6188, "lr": 2.3289542057438625e-05, "epoch": 5.696306225796842, "percentage": 56.96, "elapsed_time": "2:39:00", "remaining_time": "2:00:08", "throughput": 2311.56, "total_tokens": 22053328} {"current_steps": 38250, "total_steps": 67140, "loss": 0.5537, "lr": 2.3283058500993587e-05, "epoch": 5.697050938337801, "percentage": 56.97, "elapsed_time": "2:39:01", "remaining_time": "2:00:06", "throughput": 2311.6, "total_tokens": 22056368} {"current_steps": 38255, "total_steps": 67140, "loss": 0.6447, "lr": 2.3276575060572476e-05, "epoch": 5.697795650878761, "percentage": 56.98, "elapsed_time": "2:39:02", "remaining_time": "2:00:05", "throughput": 2311.64, "total_tokens": 22059472} {"current_steps": 38260, "total_steps": 67140, "loss": 0.7336, "lr": 2.3270091736613412e-05, "epoch": 5.6985403634197205, "percentage": 56.99, "elapsed_time": "2:39:03", "remaining_time": "2:00:04", "throughput": 2311.65, "total_tokens": 22062192} {"current_steps": 38265, "total_steps": 67140, "loss": 0.6954, "lr": 2.326360852955452e-05, "epoch": 5.699285075960679, "percentage": 56.99, "elapsed_time": "2:39:05", "remaining_time": "2:00:02", "throughput": 2311.67, "total_tokens": 22064976} {"current_steps": 38270, "total_steps": 67140, "loss": 0.7254, "lr": 2.3257125439833902e-05, "epoch": 5.700029788501638, "percentage": 57.0, "elapsed_time": "2:39:06", "remaining_time": "2:00:01", "throughput": 2311.72, "total_tokens": 22068208} {"current_steps": 38275, "total_steps": 67140, "loss": 0.6033, "lr": 2.325064246788966e-05, "epoch": 5.700774501042598, "percentage": 57.01, "elapsed_time": "2:39:07", "remaining_time": "2:00:00", "throughput": 2311.77, "total_tokens": 22071344} {"current_steps": 38280, "total_steps": 67140, "loss": 0.7534, "lr": 2.3244159614159898e-05, "epoch": 5.701519213583556, "percentage": 57.02, "elapsed_time": "2:39:08", "remaining_time": "1:59:58", "throughput": 2311.79, "total_tokens": 22074192} {"current_steps": 38285, "total_steps": 67140, "loss": 0.6461, "lr": 2.3237676879082682e-05, "epoch": 5.702263926124516, "percentage": 57.02, "elapsed_time": "2:39:09", "remaining_time": "1:59:57", "throughput": 2311.83, "total_tokens": 22077168} {"current_steps": 38290, "total_steps": 67140, "loss": 0.6054, "lr": 2.3231194263096096e-05, "epoch": 5.703008638665475, "percentage": 57.03, "elapsed_time": "2:39:10", "remaining_time": "1:59:56", "throughput": 2311.83, "total_tokens": 22079664} {"current_steps": 38295, "total_steps": 67140, "loss": 0.4092, "lr": 2.322471176663821e-05, "epoch": 5.7037533512064345, "percentage": 57.04, "elapsed_time": "2:39:11", "remaining_time": "1:59:54", "throughput": 2311.86, "total_tokens": 22082640} {"current_steps": 38300, "total_steps": 67140, "loss": 0.5669, "lr": 2.3218229390147086e-05, "epoch": 5.704498063747393, "percentage": 57.04, "elapsed_time": "2:39:13", "remaining_time": "1:59:53", "throughput": 2311.87, "total_tokens": 22085328} {"current_steps": 38305, "total_steps": 67140, "loss": 0.7431, "lr": 2.3211747134060774e-05, "epoch": 5.705242776288353, "percentage": 57.05, "elapsed_time": "2:39:14", "remaining_time": "1:59:52", "throughput": 2311.9, "total_tokens": 22088208} {"current_steps": 38310, "total_steps": 67140, "loss": 0.5458, "lr": 2.3205264998817326e-05, "epoch": 5.705987488829312, "percentage": 57.06, "elapsed_time": "2:39:15", "remaining_time": "1:59:50", "throughput": 2311.92, "total_tokens": 22090992} {"current_steps": 38315, "total_steps": 67140, "loss": 0.8951, "lr": 2.3198782984854765e-05, "epoch": 5.706732201370271, "percentage": 57.07, "elapsed_time": "2:39:16", "remaining_time": "1:59:49", "throughput": 2311.95, "total_tokens": 22093904} {"current_steps": 38320, "total_steps": 67140, "loss": 0.7424, "lr": 2.3192301092611138e-05, "epoch": 5.70747691391123, "percentage": 57.07, "elapsed_time": "2:39:17", "remaining_time": "1:59:48", "throughput": 2311.99, "total_tokens": 22097008} {"current_steps": 38325, "total_steps": 67140, "loss": 0.6715, "lr": 2.3185819322524443e-05, "epoch": 5.70822162645219, "percentage": 57.08, "elapsed_time": "2:39:18", "remaining_time": "1:59:46", "throughput": 2312.03, "total_tokens": 22100080} {"current_steps": 38330, "total_steps": 67140, "loss": 0.7193, "lr": 2.3179337675032707e-05, "epoch": 5.708966338993148, "percentage": 57.09, "elapsed_time": "2:39:19", "remaining_time": "1:59:45", "throughput": 2312.03, "total_tokens": 22102672} {"current_steps": 38335, "total_steps": 67140, "loss": 0.5369, "lr": 2.3172856150573926e-05, "epoch": 5.709711051534108, "percentage": 57.1, "elapsed_time": "2:39:20", "remaining_time": "1:59:44", "throughput": 2312.06, "total_tokens": 22105616} {"current_steps": 38340, "total_steps": 67140, "loss": 0.4043, "lr": 2.3166374749586094e-05, "epoch": 5.710455764075067, "percentage": 57.1, "elapsed_time": "2:39:22", "remaining_time": "1:59:42", "throughput": 2312.1, "total_tokens": 22108752} {"current_steps": 38345, "total_steps": 67140, "loss": 0.5553, "lr": 2.3159893472507212e-05, "epoch": 5.7112004766160265, "percentage": 57.11, "elapsed_time": "2:39:23", "remaining_time": "1:59:41", "throughput": 2312.13, "total_tokens": 22111600} {"current_steps": 38350, "total_steps": 67140, "loss": 0.6689, "lr": 2.315341231977524e-05, "epoch": 5.711945189156985, "percentage": 57.12, "elapsed_time": "2:39:24", "remaining_time": "1:59:40", "throughput": 2312.14, "total_tokens": 22114384} {"current_steps": 38355, "total_steps": 67140, "loss": 0.476, "lr": 2.314693129182815e-05, "epoch": 5.712689901697945, "percentage": 57.13, "elapsed_time": "2:39:25", "remaining_time": "1:59:38", "throughput": 2312.15, "total_tokens": 22116944} {"current_steps": 38360, "total_steps": 67140, "loss": 0.6879, "lr": 2.314045038910393e-05, "epoch": 5.713434614238904, "percentage": 57.13, "elapsed_time": "2:39:26", "remaining_time": "1:59:37", "throughput": 2312.17, "total_tokens": 22119760} {"current_steps": 38365, "total_steps": 67140, "loss": 0.4924, "lr": 2.3133969612040503e-05, "epoch": 5.714179326779863, "percentage": 57.14, "elapsed_time": "2:39:27", "remaining_time": "1:59:36", "throughput": 2312.21, "total_tokens": 22122928} {"current_steps": 38370, "total_steps": 67140, "loss": 0.5203, "lr": 2.3127488961075812e-05, "epoch": 5.714924039320822, "percentage": 57.15, "elapsed_time": "2:39:28", "remaining_time": "1:59:34", "throughput": 2312.23, "total_tokens": 22125616} {"current_steps": 38375, "total_steps": 67140, "loss": 0.7085, "lr": 2.312100843664781e-05, "epoch": 5.715668751861782, "percentage": 57.16, "elapsed_time": "2:39:30", "remaining_time": "1:59:33", "throughput": 2312.25, "total_tokens": 22128528} {"current_steps": 38380, "total_steps": 67140, "loss": 0.6542, "lr": 2.311452803919442e-05, "epoch": 5.7164134644027405, "percentage": 57.16, "elapsed_time": "2:39:31", "remaining_time": "1:59:32", "throughput": 2312.3, "total_tokens": 22131664} {"current_steps": 38385, "total_steps": 67140, "loss": 0.6429, "lr": 2.3108047769153558e-05, "epoch": 5.7171581769437, "percentage": 57.17, "elapsed_time": "2:39:32", "remaining_time": "1:59:30", "throughput": 2312.34, "total_tokens": 22134736} {"current_steps": 38390, "total_steps": 67140, "loss": 0.7731, "lr": 2.3101567626963138e-05, "epoch": 5.717902889484659, "percentage": 57.18, "elapsed_time": "2:39:33", "remaining_time": "1:59:29", "throughput": 2312.36, "total_tokens": 22137552} {"current_steps": 38395, "total_steps": 67140, "loss": 0.601, "lr": 2.3095087613061058e-05, "epoch": 5.718647602025618, "percentage": 57.19, "elapsed_time": "2:39:34", "remaining_time": "1:59:28", "throughput": 2312.38, "total_tokens": 22140400} {"current_steps": 38400, "total_steps": 67140, "loss": 0.657, "lr": 2.3088607727885207e-05, "epoch": 5.719392314566577, "percentage": 57.19, "elapsed_time": "2:39:35", "remaining_time": "1:59:26", "throughput": 2312.41, "total_tokens": 22143248} {"current_steps": 38405, "total_steps": 67140, "loss": 0.6527, "lr": 2.3082127971873492e-05, "epoch": 5.720137027107537, "percentage": 57.2, "elapsed_time": "2:39:36", "remaining_time": "1:59:25", "throughput": 2312.44, "total_tokens": 22146160} {"current_steps": 38410, "total_steps": 67140, "loss": 0.6365, "lr": 2.3075648345463754e-05, "epoch": 5.720881739648496, "percentage": 57.21, "elapsed_time": "2:39:38", "remaining_time": "1:59:24", "throughput": 2312.44, "total_tokens": 22148720} {"current_steps": 38415, "total_steps": 67140, "loss": 0.7259, "lr": 2.3069168849093885e-05, "epoch": 5.721626452189454, "percentage": 57.22, "elapsed_time": "2:39:39", "remaining_time": "1:59:22", "throughput": 2312.46, "total_tokens": 22151504} {"current_steps": 38420, "total_steps": 67140, "loss": 0.5923, "lr": 2.306268948320173e-05, "epoch": 5.722371164730414, "percentage": 57.22, "elapsed_time": "2:39:40", "remaining_time": "1:59:21", "throughput": 2312.48, "total_tokens": 22154224} {"current_steps": 38425, "total_steps": 67140, "loss": 0.6044, "lr": 2.305621024822514e-05, "epoch": 5.723115877271374, "percentage": 57.23, "elapsed_time": "2:39:41", "remaining_time": "1:59:20", "throughput": 2312.5, "total_tokens": 22157072} {"current_steps": 38430, "total_steps": 67140, "loss": 0.413, "lr": 2.3049731144601967e-05, "epoch": 5.7238605898123325, "percentage": 57.24, "elapsed_time": "2:39:42", "remaining_time": "1:59:18", "throughput": 2312.51, "total_tokens": 22159568} {"current_steps": 38435, "total_steps": 67140, "loss": 0.7943, "lr": 2.3043252172770027e-05, "epoch": 5.724605302353291, "percentage": 57.25, "elapsed_time": "2:39:43", "remaining_time": "1:59:17", "throughput": 2312.54, "total_tokens": 22162512} {"current_steps": 38440, "total_steps": 67140, "loss": 0.7266, "lr": 2.303677333316715e-05, "epoch": 5.725350014894251, "percentage": 57.25, "elapsed_time": "2:39:44", "remaining_time": "1:59:16", "throughput": 2312.59, "total_tokens": 22165840} {"current_steps": 38445, "total_steps": 67140, "loss": 0.6115, "lr": 2.3030294626231162e-05, "epoch": 5.72609472743521, "percentage": 57.26, "elapsed_time": "2:39:46", "remaining_time": "1:59:14", "throughput": 2312.63, "total_tokens": 22168976} {"current_steps": 38450, "total_steps": 67140, "loss": 0.5643, "lr": 2.302381605239985e-05, "epoch": 5.726839439976169, "percentage": 57.27, "elapsed_time": "2:39:47", "remaining_time": "1:59:13", "throughput": 2312.66, "total_tokens": 22171760} {"current_steps": 38455, "total_steps": 67140, "loss": 0.5943, "lr": 2.3017337612111007e-05, "epoch": 5.727584152517128, "percentage": 57.28, "elapsed_time": "2:39:48", "remaining_time": "1:59:12", "throughput": 2312.69, "total_tokens": 22174736} {"current_steps": 38460, "total_steps": 67140, "loss": 0.629, "lr": 2.3010859305802426e-05, "epoch": 5.728328865058088, "percentage": 57.28, "elapsed_time": "2:39:49", "remaining_time": "1:59:10", "throughput": 2312.72, "total_tokens": 22177680} {"current_steps": 38465, "total_steps": 67140, "loss": 0.6939, "lr": 2.300438113391189e-05, "epoch": 5.7290735775990465, "percentage": 57.29, "elapsed_time": "2:39:50", "remaining_time": "1:59:09", "throughput": 2312.75, "total_tokens": 22180656} {"current_steps": 38470, "total_steps": 67140, "loss": 0.6204, "lr": 2.2997903096877164e-05, "epoch": 5.729818290140006, "percentage": 57.3, "elapsed_time": "2:39:51", "remaining_time": "1:59:08", "throughput": 2312.79, "total_tokens": 22183600} {"current_steps": 38475, "total_steps": 67140, "loss": 0.848, "lr": 2.299142519513601e-05, "epoch": 5.730563002680965, "percentage": 57.31, "elapsed_time": "2:39:52", "remaining_time": "1:59:06", "throughput": 2312.82, "total_tokens": 22186544} {"current_steps": 38480, "total_steps": 67140, "loss": 0.6154, "lr": 2.298494742912617e-05, "epoch": 5.7313077152219245, "percentage": 57.31, "elapsed_time": "2:39:53", "remaining_time": "1:59:05", "throughput": 2312.83, "total_tokens": 22189136} {"current_steps": 38485, "total_steps": 67140, "loss": 0.6088, "lr": 2.2978469799285397e-05, "epoch": 5.732052427762883, "percentage": 57.32, "elapsed_time": "2:39:55", "remaining_time": "1:59:04", "throughput": 2312.87, "total_tokens": 22192208} {"current_steps": 38490, "total_steps": 67140, "loss": 0.6639, "lr": 2.297199230605141e-05, "epoch": 5.732797140303843, "percentage": 57.33, "elapsed_time": "2:39:56", "remaining_time": "1:59:02", "throughput": 2312.89, "total_tokens": 22195120} {"current_steps": 38495, "total_steps": 67140, "loss": 0.5077, "lr": 2.2965514949861938e-05, "epoch": 5.733541852844802, "percentage": 57.34, "elapsed_time": "2:39:57", "remaining_time": "1:59:01", "throughput": 2312.91, "total_tokens": 22197808} {"current_steps": 38500, "total_steps": 67140, "loss": 0.7272, "lr": 2.2959037731154692e-05, "epoch": 5.734286565385761, "percentage": 57.34, "elapsed_time": "2:39:58", "remaining_time": "1:59:00", "throughput": 2312.94, "total_tokens": 22200848} {"current_steps": 38505, "total_steps": 67140, "loss": 0.5174, "lr": 2.295256065036738e-05, "epoch": 5.73503127792672, "percentage": 57.35, "elapsed_time": "2:39:59", "remaining_time": "1:58:58", "throughput": 2312.94, "total_tokens": 22203408} {"current_steps": 38510, "total_steps": 67140, "loss": 0.6559, "lr": 2.2946083707937697e-05, "epoch": 5.73577599046768, "percentage": 57.36, "elapsed_time": "2:40:00", "remaining_time": "1:58:57", "throughput": 2312.99, "total_tokens": 22206640} {"current_steps": 38515, "total_steps": 67140, "loss": 0.6981, "lr": 2.293960690430332e-05, "epoch": 5.7365207030086385, "percentage": 57.37, "elapsed_time": "2:40:01", "remaining_time": "1:58:56", "throughput": 2313.02, "total_tokens": 22209488} {"current_steps": 38520, "total_steps": 67140, "loss": 0.5502, "lr": 2.2933130239901934e-05, "epoch": 5.737265415549598, "percentage": 57.37, "elapsed_time": "2:40:03", "remaining_time": "1:58:55", "throughput": 2313.05, "total_tokens": 22212528} {"current_steps": 38525, "total_steps": 67140, "loss": 0.5216, "lr": 2.2926653715171215e-05, "epoch": 5.738010128090557, "percentage": 57.38, "elapsed_time": "2:40:04", "remaining_time": "1:58:53", "throughput": 2313.1, "total_tokens": 22215632} {"current_steps": 38530, "total_steps": 67140, "loss": 0.5905, "lr": 2.2920177330548802e-05, "epoch": 5.7387548406315165, "percentage": 57.39, "elapsed_time": "2:40:05", "remaining_time": "1:58:52", "throughput": 2313.12, "total_tokens": 22218480} {"current_steps": 38535, "total_steps": 67140, "loss": 0.5301, "lr": 2.2913701086472343e-05, "epoch": 5.739499553172475, "percentage": 57.39, "elapsed_time": "2:40:06", "remaining_time": "1:58:51", "throughput": 2313.15, "total_tokens": 22221392} {"current_steps": 38540, "total_steps": 67140, "loss": 0.749, "lr": 2.290722498337948e-05, "epoch": 5.740244265713435, "percentage": 57.4, "elapsed_time": "2:40:07", "remaining_time": "1:58:49", "throughput": 2313.16, "total_tokens": 22224048} {"current_steps": 38545, "total_steps": 67140, "loss": 0.6275, "lr": 2.2900749021707855e-05, "epoch": 5.740988978254394, "percentage": 57.41, "elapsed_time": "2:40:08", "remaining_time": "1:58:48", "throughput": 2313.18, "total_tokens": 22226768} {"current_steps": 38550, "total_steps": 67140, "loss": 0.6619, "lr": 2.2894273201895068e-05, "epoch": 5.741733690795353, "percentage": 57.42, "elapsed_time": "2:40:09", "remaining_time": "1:58:47", "throughput": 2313.19, "total_tokens": 22229520} {"current_steps": 38555, "total_steps": 67140, "loss": 0.5017, "lr": 2.2887797524378734e-05, "epoch": 5.742478403336312, "percentage": 57.42, "elapsed_time": "2:40:11", "remaining_time": "1:58:45", "throughput": 2313.22, "total_tokens": 22232432} {"current_steps": 38560, "total_steps": 67140, "loss": 0.6252, "lr": 2.2881321989596464e-05, "epoch": 5.743223115877272, "percentage": 57.43, "elapsed_time": "2:40:12", "remaining_time": "1:58:44", "throughput": 2313.25, "total_tokens": 22235312} {"current_steps": 38565, "total_steps": 67140, "loss": 0.6454, "lr": 2.2874846597985842e-05, "epoch": 5.7439678284182305, "percentage": 57.44, "elapsed_time": "2:40:13", "remaining_time": "1:58:43", "throughput": 2313.28, "total_tokens": 22238288} {"current_steps": 38570, "total_steps": 67140, "loss": 0.8203, "lr": 2.2868371349984442e-05, "epoch": 5.74471254095919, "percentage": 57.45, "elapsed_time": "2:40:14", "remaining_time": "1:58:41", "throughput": 2313.28, "total_tokens": 22240816} {"current_steps": 38575, "total_steps": 67140, "loss": 0.7289, "lr": 2.2861896246029835e-05, "epoch": 5.745457253500149, "percentage": 57.45, "elapsed_time": "2:40:15", "remaining_time": "1:58:40", "throughput": 2313.31, "total_tokens": 22243792} {"current_steps": 38580, "total_steps": 67140, "loss": 0.6691, "lr": 2.2855421286559593e-05, "epoch": 5.746201966041108, "percentage": 57.46, "elapsed_time": "2:40:16", "remaining_time": "1:58:39", "throughput": 2313.33, "total_tokens": 22246544} {"current_steps": 38585, "total_steps": 67140, "loss": 0.5352, "lr": 2.2848946472011258e-05, "epoch": 5.746946678582067, "percentage": 57.47, "elapsed_time": "2:40:17", "remaining_time": "1:58:37", "throughput": 2313.36, "total_tokens": 22249456} {"current_steps": 38590, "total_steps": 67140, "loss": 0.6343, "lr": 2.2842471802822372e-05, "epoch": 5.747691391123027, "percentage": 57.48, "elapsed_time": "2:40:18", "remaining_time": "1:58:36", "throughput": 2313.38, "total_tokens": 22252368} {"current_steps": 38595, "total_steps": 67140, "loss": 0.6535, "lr": 2.2835997279430475e-05, "epoch": 5.748436103663986, "percentage": 57.48, "elapsed_time": "2:40:20", "remaining_time": "1:58:35", "throughput": 2313.4, "total_tokens": 22255152} {"current_steps": 38600, "total_steps": 67140, "loss": 0.5156, "lr": 2.282952290227308e-05, "epoch": 5.7491808162049445, "percentage": 57.49, "elapsed_time": "2:40:21", "remaining_time": "1:58:33", "throughput": 2313.45, "total_tokens": 22258288} {"current_steps": 38605, "total_steps": 67140, "loss": 0.5479, "lr": 2.2823048671787715e-05, "epoch": 5.749925528745904, "percentage": 57.5, "elapsed_time": "2:40:22", "remaining_time": "1:58:32", "throughput": 2313.46, "total_tokens": 22260976} {"current_steps": 38610, "total_steps": 67140, "loss": 0.5519, "lr": 2.2816574588411857e-05, "epoch": 5.750670241286863, "percentage": 57.51, "elapsed_time": "2:40:23", "remaining_time": "1:58:31", "throughput": 2313.48, "total_tokens": 22263760} {"current_steps": 38615, "total_steps": 67140, "loss": 0.6402, "lr": 2.2810100652583016e-05, "epoch": 5.7514149538278225, "percentage": 57.51, "elapsed_time": "2:40:24", "remaining_time": "1:58:29", "throughput": 2313.51, "total_tokens": 22266672} {"current_steps": 38620, "total_steps": 67140, "loss": 0.657, "lr": 2.2803626864738664e-05, "epoch": 5.752159666368781, "percentage": 57.52, "elapsed_time": "2:40:25", "remaining_time": "1:58:28", "throughput": 2313.53, "total_tokens": 22269424} {"current_steps": 38625, "total_steps": 67140, "loss": 0.5343, "lr": 2.279715322531628e-05, "epoch": 5.752904378909741, "percentage": 57.53, "elapsed_time": "2:40:26", "remaining_time": "1:58:27", "throughput": 2313.57, "total_tokens": 22272464} {"current_steps": 38630, "total_steps": 67140, "loss": 0.6779, "lr": 2.2790679734753327e-05, "epoch": 5.7536490914507, "percentage": 57.54, "elapsed_time": "2:40:27", "remaining_time": "1:58:25", "throughput": 2313.57, "total_tokens": 22275088} {"current_steps": 38635, "total_steps": 67140, "loss": 0.6652, "lr": 2.2784206393487256e-05, "epoch": 5.754393803991659, "percentage": 57.54, "elapsed_time": "2:40:29", "remaining_time": "1:58:24", "throughput": 2313.58, "total_tokens": 22277680} {"current_steps": 38640, "total_steps": 67140, "loss": 0.7261, "lr": 2.277773320195551e-05, "epoch": 5.755138516532618, "percentage": 57.55, "elapsed_time": "2:40:30", "remaining_time": "1:58:23", "throughput": 2313.61, "total_tokens": 22280624} {"current_steps": 38645, "total_steps": 67140, "loss": 0.629, "lr": 2.2771260160595516e-05, "epoch": 5.755883229073578, "percentage": 57.56, "elapsed_time": "2:40:31", "remaining_time": "1:58:21", "throughput": 2313.63, "total_tokens": 22283344} {"current_steps": 38650, "total_steps": 67140, "loss": 0.7589, "lr": 2.2764787269844704e-05, "epoch": 5.7566279416145365, "percentage": 57.57, "elapsed_time": "2:40:32", "remaining_time": "1:58:20", "throughput": 2313.69, "total_tokens": 22286704} {"current_steps": 38655, "total_steps": 67140, "loss": 0.6174, "lr": 2.2758314530140473e-05, "epoch": 5.757372654155496, "percentage": 57.57, "elapsed_time": "2:40:33", "remaining_time": "1:58:19", "throughput": 2313.74, "total_tokens": 22290000} {"current_steps": 38660, "total_steps": 67140, "loss": 0.6678, "lr": 2.2751841941920238e-05, "epoch": 5.758117366696455, "percentage": 57.58, "elapsed_time": "2:40:34", "remaining_time": "1:58:17", "throughput": 2313.78, "total_tokens": 22293104} {"current_steps": 38665, "total_steps": 67140, "loss": 0.6343, "lr": 2.274536950562138e-05, "epoch": 5.7588620792374146, "percentage": 57.59, "elapsed_time": "2:40:36", "remaining_time": "1:58:16", "throughput": 2313.81, "total_tokens": 22296048} {"current_steps": 38670, "total_steps": 67140, "loss": 0.6117, "lr": 2.2738897221681284e-05, "epoch": 5.759606791778373, "percentage": 57.6, "elapsed_time": "2:40:37", "remaining_time": "1:58:15", "throughput": 2313.84, "total_tokens": 22298992} {"current_steps": 38675, "total_steps": 67140, "loss": 0.8476, "lr": 2.2732425090537323e-05, "epoch": 5.760351504319333, "percentage": 57.6, "elapsed_time": "2:40:38", "remaining_time": "1:58:13", "throughput": 2313.89, "total_tokens": 22302160} {"current_steps": 38680, "total_steps": 67140, "loss": 0.7983, "lr": 2.272595311262685e-05, "epoch": 5.761096216860292, "percentage": 57.61, "elapsed_time": "2:40:39", "remaining_time": "1:58:12", "throughput": 2313.93, "total_tokens": 22305360} {"current_steps": 38685, "total_steps": 67140, "loss": 0.4981, "lr": 2.2719481288387234e-05, "epoch": 5.761840929401251, "percentage": 57.62, "elapsed_time": "2:40:40", "remaining_time": "1:58:11", "throughput": 2313.95, "total_tokens": 22308176} {"current_steps": 38690, "total_steps": 67140, "loss": 0.508, "lr": 2.2713009618255788e-05, "epoch": 5.76258564194221, "percentage": 57.63, "elapsed_time": "2:40:41", "remaining_time": "1:58:09", "throughput": 2313.98, "total_tokens": 22311056} {"current_steps": 38695, "total_steps": 67140, "loss": 0.5412, "lr": 2.270653810266986e-05, "epoch": 5.76333035448317, "percentage": 57.63, "elapsed_time": "2:40:43", "remaining_time": "1:58:08", "throughput": 2314.03, "total_tokens": 22314224} {"current_steps": 38700, "total_steps": 67140, "loss": 0.6598, "lr": 2.2700066742066754e-05, "epoch": 5.7640750670241285, "percentage": 57.64, "elapsed_time": "2:40:44", "remaining_time": "1:58:07", "throughput": 2314.05, "total_tokens": 22317104} {"current_steps": 38705, "total_steps": 67140, "loss": 0.6504, "lr": 2.2693595536883792e-05, "epoch": 5.764819779565088, "percentage": 57.65, "elapsed_time": "2:40:45", "remaining_time": "1:58:05", "throughput": 2314.08, "total_tokens": 22319952} {"current_steps": 38710, "total_steps": 67140, "loss": 0.4734, "lr": 2.2687124487558267e-05, "epoch": 5.765564492106047, "percentage": 57.66, "elapsed_time": "2:40:46", "remaining_time": "1:58:04", "throughput": 2314.11, "total_tokens": 22322864} {"current_steps": 38715, "total_steps": 67140, "loss": 0.5086, "lr": 2.268065359452746e-05, "epoch": 5.766309204647007, "percentage": 57.66, "elapsed_time": "2:40:47", "remaining_time": "1:58:03", "throughput": 2314.12, "total_tokens": 22325648} {"current_steps": 38720, "total_steps": 67140, "loss": 0.6051, "lr": 2.267418285822866e-05, "epoch": 5.767053917187965, "percentage": 57.67, "elapsed_time": "2:40:48", "remaining_time": "1:58:02", "throughput": 2314.18, "total_tokens": 22328976} {"current_steps": 38725, "total_steps": 67140, "loss": 0.4397, "lr": 2.266771227909913e-05, "epoch": 5.767798629728925, "percentage": 57.68, "elapsed_time": "2:40:49", "remaining_time": "1:58:00", "throughput": 2314.19, "total_tokens": 22331696} {"current_steps": 38730, "total_steps": 67140, "loss": 0.7529, "lr": 2.266124185757612e-05, "epoch": 5.768543342269884, "percentage": 57.69, "elapsed_time": "2:40:51", "remaining_time": "1:57:59", "throughput": 2314.22, "total_tokens": 22334608} {"current_steps": 38735, "total_steps": 67140, "loss": 0.5314, "lr": 2.265477159409687e-05, "epoch": 5.769288054810843, "percentage": 57.69, "elapsed_time": "2:40:52", "remaining_time": "1:57:58", "throughput": 2314.24, "total_tokens": 22337360} {"current_steps": 38740, "total_steps": 67140, "loss": 0.6973, "lr": 2.2648301489098624e-05, "epoch": 5.770032767351802, "percentage": 57.7, "elapsed_time": "2:40:53", "remaining_time": "1:57:56", "throughput": 2314.27, "total_tokens": 22340272} {"current_steps": 38745, "total_steps": 67140, "loss": 0.7334, "lr": 2.26418315430186e-05, "epoch": 5.770777479892761, "percentage": 57.71, "elapsed_time": "2:40:54", "remaining_time": "1:57:55", "throughput": 2314.29, "total_tokens": 22343184} {"current_steps": 38750, "total_steps": 67140, "loss": 0.6998, "lr": 2.2635361756294014e-05, "epoch": 5.7715221924337206, "percentage": 57.72, "elapsed_time": "2:40:55", "remaining_time": "1:57:54", "throughput": 2314.31, "total_tokens": 22345904} {"current_steps": 38755, "total_steps": 67140, "loss": 0.6548, "lr": 2.2628892129362064e-05, "epoch": 5.77226690497468, "percentage": 57.72, "elapsed_time": "2:40:56", "remaining_time": "1:57:52", "throughput": 2314.31, "total_tokens": 22348432} {"current_steps": 38760, "total_steps": 67140, "loss": 0.4445, "lr": 2.2622422662659952e-05, "epoch": 5.773011617515639, "percentage": 57.73, "elapsed_time": "2:40:57", "remaining_time": "1:57:51", "throughput": 2314.33, "total_tokens": 22351152} {"current_steps": 38765, "total_steps": 67140, "loss": 0.6955, "lr": 2.2615953356624852e-05, "epoch": 5.773756330056598, "percentage": 57.74, "elapsed_time": "2:40:58", "remaining_time": "1:57:50", "throughput": 2314.34, "total_tokens": 22353936} {"current_steps": 38770, "total_steps": 67140, "loss": 0.5749, "lr": 2.260948421169392e-05, "epoch": 5.774501042597557, "percentage": 57.75, "elapsed_time": "2:41:00", "remaining_time": "1:57:48", "throughput": 2314.38, "total_tokens": 22356976} {"current_steps": 38775, "total_steps": 67140, "loss": 0.8043, "lr": 2.260301522830433e-05, "epoch": 5.775245755138517, "percentage": 57.75, "elapsed_time": "2:41:01", "remaining_time": "1:57:47", "throughput": 2314.42, "total_tokens": 22360048} {"current_steps": 38780, "total_steps": 67140, "loss": 0.8935, "lr": 2.2596546406893227e-05, "epoch": 5.775990467679476, "percentage": 57.76, "elapsed_time": "2:41:02", "remaining_time": "1:57:46", "throughput": 2314.44, "total_tokens": 22362768} {"current_steps": 38785, "total_steps": 67140, "loss": 0.5685, "lr": 2.259007774789774e-05, "epoch": 5.7767351802204345, "percentage": 57.77, "elapsed_time": "2:41:03", "remaining_time": "1:57:44", "throughput": 2314.47, "total_tokens": 22365808} {"current_steps": 38790, "total_steps": 67140, "loss": 0.5129, "lr": 2.2583609251755004e-05, "epoch": 5.777479892761394, "percentage": 57.77, "elapsed_time": "2:41:04", "remaining_time": "1:57:43", "throughput": 2314.49, "total_tokens": 22368528} {"current_steps": 38795, "total_steps": 67140, "loss": 0.5177, "lr": 2.2577140918902135e-05, "epoch": 5.778224605302353, "percentage": 57.78, "elapsed_time": "2:41:05", "remaining_time": "1:57:42", "throughput": 2314.52, "total_tokens": 22371536} {"current_steps": 38800, "total_steps": 67140, "loss": 0.6213, "lr": 2.2570672749776222e-05, "epoch": 5.778969317843313, "percentage": 57.79, "elapsed_time": "2:41:06", "remaining_time": "1:57:40", "throughput": 2314.55, "total_tokens": 22374512} {"current_steps": 38805, "total_steps": 67140, "loss": 0.5821, "lr": 2.2564204744814384e-05, "epoch": 5.779714030384271, "percentage": 57.8, "elapsed_time": "2:41:08", "remaining_time": "1:57:39", "throughput": 2314.6, "total_tokens": 22377712} {"current_steps": 38810, "total_steps": 67140, "loss": 0.5735, "lr": 2.2557736904453674e-05, "epoch": 5.780458742925231, "percentage": 57.8, "elapsed_time": "2:41:09", "remaining_time": "1:57:38", "throughput": 2314.62, "total_tokens": 22380656} {"current_steps": 38815, "total_steps": 67140, "loss": 0.662, "lr": 2.255126922913118e-05, "epoch": 5.78120345546619, "percentage": 57.81, "elapsed_time": "2:41:10", "remaining_time": "1:57:36", "throughput": 2314.65, "total_tokens": 22383568} {"current_steps": 38820, "total_steps": 67140, "loss": 0.5542, "lr": 2.254480171928395e-05, "epoch": 5.781948168007149, "percentage": 57.82, "elapsed_time": "2:41:11", "remaining_time": "1:57:35", "throughput": 2314.67, "total_tokens": 22386320} {"current_steps": 38825, "total_steps": 67140, "loss": 0.6922, "lr": 2.2538334375349044e-05, "epoch": 5.782692880548108, "percentage": 57.83, "elapsed_time": "2:41:12", "remaining_time": "1:57:34", "throughput": 2314.7, "total_tokens": 22389264} {"current_steps": 38830, "total_steps": 67140, "loss": 0.5562, "lr": 2.2531867197763484e-05, "epoch": 5.783437593089068, "percentage": 57.83, "elapsed_time": "2:41:13", "remaining_time": "1:57:32", "throughput": 2314.73, "total_tokens": 22392144} {"current_steps": 38835, "total_steps": 67140, "loss": 0.7668, "lr": 2.2525400186964308e-05, "epoch": 5.7841823056300266, "percentage": 57.84, "elapsed_time": "2:41:14", "remaining_time": "1:57:31", "throughput": 2314.75, "total_tokens": 22395024} {"current_steps": 38840, "total_steps": 67140, "loss": 0.5592, "lr": 2.2518933343388528e-05, "epoch": 5.784927018170986, "percentage": 57.85, "elapsed_time": "2:41:16", "remaining_time": "1:57:30", "throughput": 2314.77, "total_tokens": 22397776} {"current_steps": 38845, "total_steps": 67140, "loss": 0.6296, "lr": 2.2512466667473152e-05, "epoch": 5.785671730711945, "percentage": 57.86, "elapsed_time": "2:41:17", "remaining_time": "1:57:28", "throughput": 2314.82, "total_tokens": 22400976} {"current_steps": 38850, "total_steps": 67140, "loss": 0.6363, "lr": 2.2506000159655158e-05, "epoch": 5.786416443252905, "percentage": 57.86, "elapsed_time": "2:41:18", "remaining_time": "1:57:27", "throughput": 2314.85, "total_tokens": 22403952} {"current_steps": 38855, "total_steps": 67140, "loss": 0.4629, "lr": 2.249953382037153e-05, "epoch": 5.787161155793863, "percentage": 57.87, "elapsed_time": "2:41:19", "remaining_time": "1:57:26", "throughput": 2314.88, "total_tokens": 22406960} {"current_steps": 38860, "total_steps": 67140, "loss": 0.7218, "lr": 2.2493067650059247e-05, "epoch": 5.787905868334823, "percentage": 57.88, "elapsed_time": "2:41:20", "remaining_time": "1:57:25", "throughput": 2314.92, "total_tokens": 22409968} {"current_steps": 38865, "total_steps": 67140, "loss": 0.5438, "lr": 2.248660164915525e-05, "epoch": 5.788650580875782, "percentage": 57.89, "elapsed_time": "2:41:21", "remaining_time": "1:57:23", "throughput": 2314.94, "total_tokens": 22412880} {"current_steps": 38870, "total_steps": 67140, "loss": 0.6107, "lr": 2.2480135818096497e-05, "epoch": 5.789395293416741, "percentage": 57.89, "elapsed_time": "2:41:22", "remaining_time": "1:57:22", "throughput": 2314.96, "total_tokens": 22415568} {"current_steps": 38875, "total_steps": 67140, "loss": 0.7577, "lr": 2.247367015731993e-05, "epoch": 5.7901400059577, "percentage": 57.9, "elapsed_time": "2:41:24", "remaining_time": "1:57:21", "throughput": 2314.99, "total_tokens": 22418512} {"current_steps": 38880, "total_steps": 67140, "loss": 0.6713, "lr": 2.2467204667262454e-05, "epoch": 5.79088471849866, "percentage": 57.91, "elapsed_time": "2:41:25", "remaining_time": "1:57:19", "throughput": 2315.02, "total_tokens": 22421424} {"current_steps": 38885, "total_steps": 67140, "loss": 0.554, "lr": 2.2460739348361e-05, "epoch": 5.791629431039619, "percentage": 57.92, "elapsed_time": "2:41:26", "remaining_time": "1:57:18", "throughput": 2315.06, "total_tokens": 22424592} {"current_steps": 38890, "total_steps": 67140, "loss": 0.4843, "lr": 2.2454274201052443e-05, "epoch": 5.792374143580578, "percentage": 57.92, "elapsed_time": "2:41:27", "remaining_time": "1:57:17", "throughput": 2315.09, "total_tokens": 22427440} {"current_steps": 38895, "total_steps": 67140, "loss": 0.6267, "lr": 2.2447809225773698e-05, "epoch": 5.793118856121537, "percentage": 57.93, "elapsed_time": "2:41:28", "remaining_time": "1:57:15", "throughput": 2315.12, "total_tokens": 22430384} {"current_steps": 38900, "total_steps": 67140, "loss": 0.5882, "lr": 2.2441344422961618e-05, "epoch": 5.793863568662497, "percentage": 57.94, "elapsed_time": "2:41:29", "remaining_time": "1:57:14", "throughput": 2315.14, "total_tokens": 22433232} {"current_steps": 38905, "total_steps": 67140, "loss": 0.601, "lr": 2.243487979305308e-05, "epoch": 5.794608281203455, "percentage": 57.95, "elapsed_time": "2:41:30", "remaining_time": "1:57:13", "throughput": 2315.17, "total_tokens": 22436144} {"current_steps": 38910, "total_steps": 67140, "loss": 0.7301, "lr": 2.2428415336484944e-05, "epoch": 5.795352993744415, "percentage": 57.95, "elapsed_time": "2:41:32", "remaining_time": "1:57:11", "throughput": 2315.22, "total_tokens": 22439472} {"current_steps": 38915, "total_steps": 67140, "loss": 0.5857, "lr": 2.2421951053694034e-05, "epoch": 5.796097706285374, "percentage": 57.96, "elapsed_time": "2:41:33", "remaining_time": "1:57:10", "throughput": 2315.25, "total_tokens": 22442320} {"current_steps": 38920, "total_steps": 67140, "loss": 0.5682, "lr": 2.2415486945117195e-05, "epoch": 5.796842418826333, "percentage": 57.97, "elapsed_time": "2:41:34", "remaining_time": "1:57:09", "throughput": 2315.25, "total_tokens": 22444880} {"current_steps": 38925, "total_steps": 67140, "loss": 0.579, "lr": 2.2409023011191248e-05, "epoch": 5.797587131367292, "percentage": 57.98, "elapsed_time": "2:41:35", "remaining_time": "1:57:07", "throughput": 2315.27, "total_tokens": 22447632} {"current_steps": 38930, "total_steps": 67140, "loss": 0.7684, "lr": 2.2402559252352988e-05, "epoch": 5.798331843908251, "percentage": 57.98, "elapsed_time": "2:41:36", "remaining_time": "1:57:06", "throughput": 2315.29, "total_tokens": 22450288} {"current_steps": 38935, "total_steps": 67140, "loss": 0.7139, "lr": 2.239609566903921e-05, "epoch": 5.799076556449211, "percentage": 57.99, "elapsed_time": "2:41:37", "remaining_time": "1:57:05", "throughput": 2315.31, "total_tokens": 22453136} {"current_steps": 38940, "total_steps": 67140, "loss": 0.7252, "lr": 2.23896322616867e-05, "epoch": 5.79982126899017, "percentage": 58.0, "elapsed_time": "2:41:38", "remaining_time": "1:57:03", "throughput": 2315.33, "total_tokens": 22455888} {"current_steps": 38945, "total_steps": 67140, "loss": 0.5106, "lr": 2.238316903073223e-05, "epoch": 5.800565981531129, "percentage": 58.01, "elapsed_time": "2:41:39", "remaining_time": "1:57:02", "throughput": 2315.36, "total_tokens": 22458896} {"current_steps": 38950, "total_steps": 67140, "loss": 0.6944, "lr": 2.2376705976612555e-05, "epoch": 5.801310694072088, "percentage": 58.01, "elapsed_time": "2:41:41", "remaining_time": "1:57:01", "throughput": 2315.39, "total_tokens": 22461776} {"current_steps": 38955, "total_steps": 67140, "loss": 0.5416, "lr": 2.2370243099764424e-05, "epoch": 5.802055406613047, "percentage": 58.02, "elapsed_time": "2:41:42", "remaining_time": "1:56:59", "throughput": 2315.42, "total_tokens": 22464656} {"current_steps": 38960, "total_steps": 67140, "loss": 0.5208, "lr": 2.2363780400624578e-05, "epoch": 5.802800119154006, "percentage": 58.03, "elapsed_time": "2:41:43", "remaining_time": "1:56:58", "throughput": 2315.44, "total_tokens": 22467536} {"current_steps": 38965, "total_steps": 67140, "loss": 0.6308, "lr": 2.235731787962973e-05, "epoch": 5.803544831694966, "percentage": 58.04, "elapsed_time": "2:41:44", "remaining_time": "1:56:57", "throughput": 2315.47, "total_tokens": 22470512} {"current_steps": 38970, "total_steps": 67140, "loss": 0.6201, "lr": 2.2350855537216603e-05, "epoch": 5.804289544235925, "percentage": 58.04, "elapsed_time": "2:41:45", "remaining_time": "1:56:55", "throughput": 2315.52, "total_tokens": 22473680} {"current_steps": 38975, "total_steps": 67140, "loss": 0.7119, "lr": 2.234439337382188e-05, "epoch": 5.805034256776884, "percentage": 58.05, "elapsed_time": "2:41:46", "remaining_time": "1:56:54", "throughput": 2315.55, "total_tokens": 22476656} {"current_steps": 38980, "total_steps": 67140, "loss": 0.6311, "lr": 2.2337931389882262e-05, "epoch": 5.805778969317843, "percentage": 58.06, "elapsed_time": "2:41:47", "remaining_time": "1:56:53", "throughput": 2315.58, "total_tokens": 22479568} {"current_steps": 38985, "total_steps": 67140, "loss": 0.706, "lr": 2.233146958583441e-05, "epoch": 5.806523681858803, "percentage": 58.07, "elapsed_time": "2:41:49", "remaining_time": "1:56:51", "throughput": 2315.61, "total_tokens": 22482576} {"current_steps": 38990, "total_steps": 67140, "loss": 0.8468, "lr": 2.2325007962115e-05, "epoch": 5.807268394399761, "percentage": 58.07, "elapsed_time": "2:41:50", "remaining_time": "1:56:50", "throughput": 2315.71, "total_tokens": 22486768} {"current_steps": 38995, "total_steps": 67140, "loss": 0.5842, "lr": 2.2318546519160672e-05, "epoch": 5.808013106940721, "percentage": 58.08, "elapsed_time": "2:41:51", "remaining_time": "1:56:49", "throughput": 2315.72, "total_tokens": 22489488} {"current_steps": 39000, "total_steps": 67140, "loss": 0.8199, "lr": 2.2312085257408066e-05, "epoch": 5.80875781948168, "percentage": 58.09, "elapsed_time": "2:41:52", "remaining_time": "1:56:48", "throughput": 2315.77, "total_tokens": 22492720} {"current_steps": 39005, "total_steps": 67140, "loss": 0.5283, "lr": 2.2305624177293816e-05, "epoch": 5.809502532022639, "percentage": 58.1, "elapsed_time": "2:41:53", "remaining_time": "1:56:46", "throughput": 2315.8, "total_tokens": 22495632} {"current_steps": 39010, "total_steps": 67140, "loss": 0.6722, "lr": 2.2299163279254535e-05, "epoch": 5.810247244563598, "percentage": 58.1, "elapsed_time": "2:41:55", "remaining_time": "1:56:45", "throughput": 2315.82, "total_tokens": 22498416} {"current_steps": 39015, "total_steps": 67140, "loss": 0.614, "lr": 2.229270256372681e-05, "epoch": 5.810991957104558, "percentage": 58.11, "elapsed_time": "2:41:56", "remaining_time": "1:56:44", "throughput": 2315.84, "total_tokens": 22501136} {"current_steps": 39020, "total_steps": 67140, "loss": 0.4703, "lr": 2.2286242031147236e-05, "epoch": 5.811736669645517, "percentage": 58.12, "elapsed_time": "2:41:57", "remaining_time": "1:56:42", "throughput": 2315.86, "total_tokens": 22503984} {"current_steps": 39025, "total_steps": 67140, "loss": 0.6252, "lr": 2.22797816819524e-05, "epoch": 5.812481382186476, "percentage": 58.12, "elapsed_time": "2:41:58", "remaining_time": "1:56:41", "throughput": 2315.9, "total_tokens": 22507088} {"current_steps": 39030, "total_steps": 67140, "loss": 0.5953, "lr": 2.227332151657885e-05, "epoch": 5.813226094727435, "percentage": 58.13, "elapsed_time": "2:41:59", "remaining_time": "1:56:40", "throughput": 2315.92, "total_tokens": 22509968} {"current_steps": 39035, "total_steps": 67140, "loss": 0.5595, "lr": 2.226686153546315e-05, "epoch": 5.813970807268395, "percentage": 58.14, "elapsed_time": "2:42:00", "remaining_time": "1:56:38", "throughput": 2315.96, "total_tokens": 22512976} {"current_steps": 39040, "total_steps": 67140, "loss": 0.5779, "lr": 2.2260401739041837e-05, "epoch": 5.814715519809353, "percentage": 58.15, "elapsed_time": "2:42:01", "remaining_time": "1:56:37", "throughput": 2315.99, "total_tokens": 22515952} {"current_steps": 39045, "total_steps": 67140, "loss": 0.7463, "lr": 2.2253942127751432e-05, "epoch": 5.815460232350313, "percentage": 58.15, "elapsed_time": "2:42:03", "remaining_time": "1:56:36", "throughput": 2316.02, "total_tokens": 22518864} {"current_steps": 39050, "total_steps": 67140, "loss": 0.5018, "lr": 2.2247482702028466e-05, "epoch": 5.816204944891272, "percentage": 58.16, "elapsed_time": "2:42:04", "remaining_time": "1:56:34", "throughput": 2316.03, "total_tokens": 22521520} {"current_steps": 39055, "total_steps": 67140, "loss": 0.6419, "lr": 2.2241023462309416e-05, "epoch": 5.8169496574322315, "percentage": 58.17, "elapsed_time": "2:42:05", "remaining_time": "1:56:33", "throughput": 2316.07, "total_tokens": 22524656} {"current_steps": 39060, "total_steps": 67140, "loss": 0.799, "lr": 2.2234564409030788e-05, "epoch": 5.81769436997319, "percentage": 58.18, "elapsed_time": "2:42:06", "remaining_time": "1:56:32", "throughput": 2316.1, "total_tokens": 22527536} {"current_steps": 39065, "total_steps": 67140, "loss": 0.6186, "lr": 2.2228105542629047e-05, "epoch": 5.81843908251415, "percentage": 58.18, "elapsed_time": "2:42:07", "remaining_time": "1:56:31", "throughput": 2316.12, "total_tokens": 22530416} {"current_steps": 39070, "total_steps": 67140, "loss": 0.6461, "lr": 2.2221646863540664e-05, "epoch": 5.819183795055109, "percentage": 58.19, "elapsed_time": "2:42:08", "remaining_time": "1:56:29", "throughput": 2316.15, "total_tokens": 22533296} {"current_steps": 39075, "total_steps": 67140, "loss": 0.6356, "lr": 2.2215188372202097e-05, "epoch": 5.819928507596068, "percentage": 58.2, "elapsed_time": "2:42:09", "remaining_time": "1:56:28", "throughput": 2316.17, "total_tokens": 22536176} {"current_steps": 39080, "total_steps": 67140, "loss": 0.7313, "lr": 2.2208730069049775e-05, "epoch": 5.820673220137027, "percentage": 58.21, "elapsed_time": "2:42:10", "remaining_time": "1:56:26", "throughput": 2316.18, "total_tokens": 22538768} {"current_steps": 39085, "total_steps": 67140, "loss": 0.7511, "lr": 2.220227195452012e-05, "epoch": 5.821417932677987, "percentage": 58.21, "elapsed_time": "2:42:12", "remaining_time": "1:56:25", "throughput": 2316.22, "total_tokens": 22541744} {"current_steps": 39090, "total_steps": 67140, "loss": 0.5959, "lr": 2.2195814029049568e-05, "epoch": 5.822162645218945, "percentage": 58.22, "elapsed_time": "2:42:13", "remaining_time": "1:56:24", "throughput": 2316.24, "total_tokens": 22544624} {"current_steps": 39095, "total_steps": 67140, "loss": 0.6431, "lr": 2.2189356293074495e-05, "epoch": 5.822907357759904, "percentage": 58.23, "elapsed_time": "2:42:14", "remaining_time": "1:56:22", "throughput": 2316.25, "total_tokens": 22547184} {"current_steps": 39100, "total_steps": 67140, "loss": 0.7139, "lr": 2.218289874703129e-05, "epoch": 5.823652070300864, "percentage": 58.24, "elapsed_time": "2:42:15", "remaining_time": "1:56:21", "throughput": 2316.26, "total_tokens": 22549872} {"current_steps": 39105, "total_steps": 67140, "loss": 0.5047, "lr": 2.2176441391356336e-05, "epoch": 5.8243967828418235, "percentage": 58.24, "elapsed_time": "2:42:16", "remaining_time": "1:56:20", "throughput": 2316.29, "total_tokens": 22552816} {"current_steps": 39110, "total_steps": 67140, "loss": 0.7976, "lr": 2.2169984226485998e-05, "epoch": 5.825141495382782, "percentage": 58.25, "elapsed_time": "2:42:17", "remaining_time": "1:56:19", "throughput": 2316.33, "total_tokens": 22555792} {"current_steps": 39115, "total_steps": 67140, "loss": 0.6322, "lr": 2.2163527252856614e-05, "epoch": 5.825886207923741, "percentage": 58.26, "elapsed_time": "2:42:18", "remaining_time": "1:56:17", "throughput": 2316.36, "total_tokens": 22558832} {"current_steps": 39120, "total_steps": 67140, "loss": 0.498, "lr": 2.2157070470904528e-05, "epoch": 5.826630920464701, "percentage": 58.27, "elapsed_time": "2:42:20", "remaining_time": "1:56:16", "throughput": 2316.39, "total_tokens": 22561744} {"current_steps": 39125, "total_steps": 67140, "loss": 0.7198, "lr": 2.2150613881066063e-05, "epoch": 5.82737563300566, "percentage": 58.27, "elapsed_time": "2:42:21", "remaining_time": "1:56:15", "throughput": 2316.41, "total_tokens": 22564528} {"current_steps": 39130, "total_steps": 67140, "loss": 0.6102, "lr": 2.2144157483777538e-05, "epoch": 5.828120345546619, "percentage": 58.28, "elapsed_time": "2:42:22", "remaining_time": "1:56:13", "throughput": 2316.45, "total_tokens": 22567696} {"current_steps": 39135, "total_steps": 67140, "loss": 0.4616, "lr": 2.2137701279475224e-05, "epoch": 5.828865058087578, "percentage": 58.29, "elapsed_time": "2:42:23", "remaining_time": "1:56:12", "throughput": 2316.47, "total_tokens": 22570384} {"current_steps": 39140, "total_steps": 67140, "loss": 0.5268, "lr": 2.213124526859542e-05, "epoch": 5.8296097706285375, "percentage": 58.3, "elapsed_time": "2:42:24", "remaining_time": "1:56:11", "throughput": 2316.5, "total_tokens": 22573360} {"current_steps": 39145, "total_steps": 67140, "loss": 0.6485, "lr": 2.2124789451574405e-05, "epoch": 5.830354483169496, "percentage": 58.3, "elapsed_time": "2:42:25", "remaining_time": "1:56:09", "throughput": 2316.53, "total_tokens": 22576304} {"current_steps": 39150, "total_steps": 67140, "loss": 0.5544, "lr": 2.2118333828848422e-05, "epoch": 5.831099195710456, "percentage": 58.31, "elapsed_time": "2:42:26", "remaining_time": "1:56:08", "throughput": 2316.54, "total_tokens": 22578960} {"current_steps": 39155, "total_steps": 67140, "loss": 0.5895, "lr": 2.2111878400853732e-05, "epoch": 5.831843908251415, "percentage": 58.32, "elapsed_time": "2:42:28", "remaining_time": "1:56:07", "throughput": 2316.58, "total_tokens": 22582160} {"current_steps": 39160, "total_steps": 67140, "loss": 0.6466, "lr": 2.2105423168026545e-05, "epoch": 5.832588620792374, "percentage": 58.33, "elapsed_time": "2:42:29", "remaining_time": "1:56:05", "throughput": 2316.6, "total_tokens": 22584912} {"current_steps": 39165, "total_steps": 67140, "loss": 0.635, "lr": 2.2098968130803096e-05, "epoch": 5.833333333333333, "percentage": 58.33, "elapsed_time": "2:42:30", "remaining_time": "1:56:04", "throughput": 2316.63, "total_tokens": 22587824} {"current_steps": 39170, "total_steps": 67140, "loss": 0.622, "lr": 2.2092513289619597e-05, "epoch": 5.834078045874293, "percentage": 58.34, "elapsed_time": "2:42:31", "remaining_time": "1:56:03", "throughput": 2316.66, "total_tokens": 22590736} {"current_steps": 39175, "total_steps": 67140, "loss": 0.7636, "lr": 2.208605864491222e-05, "epoch": 5.834822758415251, "percentage": 58.35, "elapsed_time": "2:42:32", "remaining_time": "1:56:01", "throughput": 2316.68, "total_tokens": 22593552} {"current_steps": 39180, "total_steps": 67140, "loss": 0.504, "lr": 2.2079604197117152e-05, "epoch": 5.835567470956211, "percentage": 58.36, "elapsed_time": "2:42:33", "remaining_time": "1:56:00", "throughput": 2316.72, "total_tokens": 22596752} {"current_steps": 39185, "total_steps": 67140, "loss": 0.5768, "lr": 2.2073149946670556e-05, "epoch": 5.83631218349717, "percentage": 58.36, "elapsed_time": "2:42:34", "remaining_time": "1:55:59", "throughput": 2316.73, "total_tokens": 22599376} {"current_steps": 39190, "total_steps": 67140, "loss": 0.7411, "lr": 2.2066695894008595e-05, "epoch": 5.8370568960381295, "percentage": 58.37, "elapsed_time": "2:42:35", "remaining_time": "1:55:57", "throughput": 2316.76, "total_tokens": 22602288} {"current_steps": 39195, "total_steps": 67140, "loss": 0.7213, "lr": 2.2060242039567393e-05, "epoch": 5.837801608579088, "percentage": 58.38, "elapsed_time": "2:42:37", "remaining_time": "1:55:56", "throughput": 2316.79, "total_tokens": 22605264} {"current_steps": 39200, "total_steps": 67140, "loss": 0.6387, "lr": 2.205378838378308e-05, "epoch": 5.838546321120048, "percentage": 58.39, "elapsed_time": "2:42:38", "remaining_time": "1:55:55", "throughput": 2316.82, "total_tokens": 22608208} {"current_steps": 39205, "total_steps": 67140, "loss": 0.4073, "lr": 2.204733492709178e-05, "epoch": 5.839291033661007, "percentage": 58.39, "elapsed_time": "2:42:39", "remaining_time": "1:55:53", "throughput": 2316.83, "total_tokens": 22610960} {"current_steps": 39210, "total_steps": 67140, "loss": 0.6423, "lr": 2.2040881669929582e-05, "epoch": 5.840035746201966, "percentage": 58.4, "elapsed_time": "2:42:40", "remaining_time": "1:55:52", "throughput": 2316.86, "total_tokens": 22613840} {"current_steps": 39215, "total_steps": 67140, "loss": 0.6283, "lr": 2.203442861273256e-05, "epoch": 5.840780458742925, "percentage": 58.41, "elapsed_time": "2:42:41", "remaining_time": "1:55:51", "throughput": 2316.88, "total_tokens": 22616592} {"current_steps": 39220, "total_steps": 67140, "loss": 0.6507, "lr": 2.202797575593679e-05, "epoch": 5.841525171283885, "percentage": 58.42, "elapsed_time": "2:42:42", "remaining_time": "1:55:49", "throughput": 2316.9, "total_tokens": 22619376} {"current_steps": 39225, "total_steps": 67140, "loss": 0.6101, "lr": 2.2021523099978347e-05, "epoch": 5.8422698838248435, "percentage": 58.42, "elapsed_time": "2:42:43", "remaining_time": "1:55:48", "throughput": 2316.91, "total_tokens": 22622160} {"current_steps": 39230, "total_steps": 67140, "loss": 0.7133, "lr": 2.2015070645293257e-05, "epoch": 5.843014596365803, "percentage": 58.43, "elapsed_time": "2:42:45", "remaining_time": "1:55:47", "throughput": 2316.92, "total_tokens": 22624816} {"current_steps": 39235, "total_steps": 67140, "loss": 0.5661, "lr": 2.2008618392317557e-05, "epoch": 5.843759308906762, "percentage": 58.44, "elapsed_time": "2:42:46", "remaining_time": "1:55:45", "throughput": 2316.94, "total_tokens": 22627568} {"current_steps": 39240, "total_steps": 67140, "loss": 0.4894, "lr": 2.2002166341487267e-05, "epoch": 5.8445040214477215, "percentage": 58.45, "elapsed_time": "2:42:47", "remaining_time": "1:55:44", "throughput": 2316.95, "total_tokens": 22630192} {"current_steps": 39245, "total_steps": 67140, "loss": 0.6503, "lr": 2.1995714493238383e-05, "epoch": 5.84524873398868, "percentage": 58.45, "elapsed_time": "2:42:48", "remaining_time": "1:55:43", "throughput": 2316.98, "total_tokens": 22633104} {"current_steps": 39250, "total_steps": 67140, "loss": 0.5641, "lr": 2.1989262848006912e-05, "epoch": 5.84599344652964, "percentage": 58.46, "elapsed_time": "2:42:49", "remaining_time": "1:55:41", "throughput": 2317.01, "total_tokens": 22636112} {"current_steps": 39255, "total_steps": 67140, "loss": 0.5274, "lr": 2.1982811406228805e-05, "epoch": 5.846738159070599, "percentage": 58.47, "elapsed_time": "2:42:50", "remaining_time": "1:55:40", "throughput": 2317.03, "total_tokens": 22638960} {"current_steps": 39260, "total_steps": 67140, "loss": 0.7373, "lr": 2.1976360168340042e-05, "epoch": 5.847482871611557, "percentage": 58.47, "elapsed_time": "2:42:51", "remaining_time": "1:55:39", "throughput": 2317.06, "total_tokens": 22641808} {"current_steps": 39265, "total_steps": 67140, "loss": 0.6312, "lr": 2.1969909134776555e-05, "epoch": 5.848227584152517, "percentage": 58.48, "elapsed_time": "2:42:52", "remaining_time": "1:55:37", "throughput": 2317.08, "total_tokens": 22644560} {"current_steps": 39270, "total_steps": 67140, "loss": 0.6023, "lr": 2.1963458305974297e-05, "epoch": 5.848972296693477, "percentage": 58.49, "elapsed_time": "2:42:54", "remaining_time": "1:55:36", "throughput": 2317.09, "total_tokens": 22647248} {"current_steps": 39275, "total_steps": 67140, "loss": 0.5235, "lr": 2.1957007682369182e-05, "epoch": 5.8497170092344355, "percentage": 58.5, "elapsed_time": "2:42:55", "remaining_time": "1:55:35", "throughput": 2317.1, "total_tokens": 22650000} {"current_steps": 39280, "total_steps": 67140, "loss": 0.4599, "lr": 2.195055726439711e-05, "epoch": 5.850461721775394, "percentage": 58.5, "elapsed_time": "2:42:56", "remaining_time": "1:55:33", "throughput": 2317.12, "total_tokens": 22652752} {"current_steps": 39285, "total_steps": 67140, "loss": 0.6045, "lr": 2.1944107052493984e-05, "epoch": 5.851206434316354, "percentage": 58.51, "elapsed_time": "2:42:57", "remaining_time": "1:55:32", "throughput": 2317.17, "total_tokens": 22655952} {"current_steps": 39290, "total_steps": 67140, "loss": 0.6646, "lr": 2.1937657047095687e-05, "epoch": 5.8519511468573135, "percentage": 58.52, "elapsed_time": "2:42:58", "remaining_time": "1:55:31", "throughput": 2317.17, "total_tokens": 22658480} {"current_steps": 39295, "total_steps": 67140, "loss": 0.7829, "lr": 2.193120724863807e-05, "epoch": 5.852695859398272, "percentage": 58.53, "elapsed_time": "2:42:59", "remaining_time": "1:55:30", "throughput": 2317.2, "total_tokens": 22661488} {"current_steps": 39300, "total_steps": 67140, "loss": 0.6433, "lr": 2.1924757657556986e-05, "epoch": 5.853440571939231, "percentage": 58.53, "elapsed_time": "2:43:00", "remaining_time": "1:55:28", "throughput": 2317.24, "total_tokens": 22664496} {"current_steps": 39305, "total_steps": 67140, "loss": 0.4742, "lr": 2.1918308274288278e-05, "epoch": 5.854185284480191, "percentage": 58.54, "elapsed_time": "2:43:01", "remaining_time": "1:55:27", "throughput": 2317.27, "total_tokens": 22667376} {"current_steps": 39310, "total_steps": 67140, "loss": 0.5738, "lr": 2.191185909926777e-05, "epoch": 5.8549299970211495, "percentage": 58.55, "elapsed_time": "2:43:03", "remaining_time": "1:55:26", "throughput": 2317.28, "total_tokens": 22670096} {"current_steps": 39315, "total_steps": 67140, "loss": 0.6715, "lr": 2.1905410132931263e-05, "epoch": 5.855674709562109, "percentage": 58.56, "elapsed_time": "2:43:04", "remaining_time": "1:55:24", "throughput": 2317.29, "total_tokens": 22672752} {"current_steps": 39320, "total_steps": 67140, "loss": 0.5776, "lr": 2.1898961375714567e-05, "epoch": 5.856419422103068, "percentage": 58.56, "elapsed_time": "2:43:05", "remaining_time": "1:55:23", "throughput": 2317.34, "total_tokens": 22676016} {"current_steps": 39325, "total_steps": 67140, "loss": 0.7316, "lr": 2.1892512828053443e-05, "epoch": 5.8571641346440275, "percentage": 58.57, "elapsed_time": "2:43:06", "remaining_time": "1:55:22", "throughput": 2317.38, "total_tokens": 22678992} {"current_steps": 39330, "total_steps": 67140, "loss": 0.6345, "lr": 2.1886064490383682e-05, "epoch": 5.857908847184986, "percentage": 58.58, "elapsed_time": "2:43:07", "remaining_time": "1:55:20", "throughput": 2317.4, "total_tokens": 22681840} {"current_steps": 39335, "total_steps": 67140, "loss": 0.8095, "lr": 2.1879616363141012e-05, "epoch": 5.858653559725946, "percentage": 58.59, "elapsed_time": "2:43:08", "remaining_time": "1:55:19", "throughput": 2317.42, "total_tokens": 22684624} {"current_steps": 39340, "total_steps": 67140, "loss": 0.4139, "lr": 2.1873168446761184e-05, "epoch": 5.859398272266905, "percentage": 58.59, "elapsed_time": "2:43:09", "remaining_time": "1:55:18", "throughput": 2317.43, "total_tokens": 22687280} {"current_steps": 39345, "total_steps": 67140, "loss": 0.721, "lr": 2.1866720741679918e-05, "epoch": 5.860142984807864, "percentage": 58.6, "elapsed_time": "2:43:11", "remaining_time": "1:55:16", "throughput": 2317.47, "total_tokens": 22690480} {"current_steps": 39350, "total_steps": 67140, "loss": 0.5604, "lr": 2.186027324833292e-05, "epoch": 5.860887697348823, "percentage": 58.61, "elapsed_time": "2:43:12", "remaining_time": "1:55:15", "throughput": 2317.52, "total_tokens": 22693744} {"current_steps": 39355, "total_steps": 67140, "loss": 0.6559, "lr": 2.18538259671559e-05, "epoch": 5.861632409889783, "percentage": 58.62, "elapsed_time": "2:43:13", "remaining_time": "1:55:14", "throughput": 2317.57, "total_tokens": 22696816} {"current_steps": 39360, "total_steps": 67140, "loss": 0.6097, "lr": 2.1847378898584524e-05, "epoch": 5.8623771224307415, "percentage": 58.62, "elapsed_time": "2:43:14", "remaining_time": "1:55:12", "throughput": 2317.59, "total_tokens": 22699632} {"current_steps": 39365, "total_steps": 67140, "loss": 0.6469, "lr": 2.184093204305446e-05, "epoch": 5.863121834971701, "percentage": 58.63, "elapsed_time": "2:43:15", "remaining_time": "1:55:11", "throughput": 2317.62, "total_tokens": 22702640} {"current_steps": 39370, "total_steps": 67140, "loss": 0.4626, "lr": 2.1834485401001384e-05, "epoch": 5.86386654751266, "percentage": 58.64, "elapsed_time": "2:43:16", "remaining_time": "1:55:10", "throughput": 2317.65, "total_tokens": 22705648} {"current_steps": 39375, "total_steps": 67140, "loss": 0.6796, "lr": 2.1828038972860904e-05, "epoch": 5.8646112600536195, "percentage": 58.65, "elapsed_time": "2:43:17", "remaining_time": "1:55:08", "throughput": 2317.65, "total_tokens": 22708144} {"current_steps": 39380, "total_steps": 67140, "loss": 0.6462, "lr": 2.182159275906865e-05, "epoch": 5.865355972594578, "percentage": 58.65, "elapsed_time": "2:43:19", "remaining_time": "1:55:07", "throughput": 2317.67, "total_tokens": 22710896} {"current_steps": 39385, "total_steps": 67140, "loss": 0.516, "lr": 2.1815146760060234e-05, "epoch": 5.866100685135538, "percentage": 58.66, "elapsed_time": "2:43:20", "remaining_time": "1:55:06", "throughput": 2317.7, "total_tokens": 22713872} {"current_steps": 39390, "total_steps": 67140, "loss": 0.4244, "lr": 2.1808700976271256e-05, "epoch": 5.866845397676497, "percentage": 58.67, "elapsed_time": "2:43:21", "remaining_time": "1:55:04", "throughput": 2317.73, "total_tokens": 22716688} {"current_steps": 39395, "total_steps": 67140, "loss": 0.7168, "lr": 2.1802255408137286e-05, "epoch": 5.867590110217456, "percentage": 58.68, "elapsed_time": "2:43:22", "remaining_time": "1:55:03", "throughput": 2317.74, "total_tokens": 22719344} {"current_steps": 39400, "total_steps": 67140, "loss": 0.7467, "lr": 2.1795810056093896e-05, "epoch": 5.868334822758415, "percentage": 58.68, "elapsed_time": "2:43:23", "remaining_time": "1:55:02", "throughput": 2317.75, "total_tokens": 22722032} {"current_steps": 39405, "total_steps": 67140, "loss": 0.5669, "lr": 2.178936492057664e-05, "epoch": 5.869079535299375, "percentage": 58.69, "elapsed_time": "2:43:24", "remaining_time": "1:55:00", "throughput": 2317.78, "total_tokens": 22724848} {"current_steps": 39410, "total_steps": 67140, "loss": 0.425, "lr": 2.1782920002021054e-05, "epoch": 5.8698242478403335, "percentage": 58.7, "elapsed_time": "2:43:25", "remaining_time": "1:54:59", "throughput": 2317.86, "total_tokens": 22728880} {"current_steps": 39415, "total_steps": 67140, "loss": 0.7606, "lr": 2.1776475300862646e-05, "epoch": 5.870568960381293, "percentage": 58.71, "elapsed_time": "2:43:27", "remaining_time": "1:54:58", "throughput": 2317.88, "total_tokens": 22731568} {"current_steps": 39420, "total_steps": 67140, "loss": 0.6313, "lr": 2.1770030817536928e-05, "epoch": 5.871313672922252, "percentage": 58.71, "elapsed_time": "2:43:28", "remaining_time": "1:54:57", "throughput": 2317.9, "total_tokens": 22734416} {"current_steps": 39425, "total_steps": 67140, "loss": 0.4779, "lr": 2.17635865524794e-05, "epoch": 5.872058385463212, "percentage": 58.72, "elapsed_time": "2:43:29", "remaining_time": "1:54:55", "throughput": 2317.93, "total_tokens": 22737392} {"current_steps": 39430, "total_steps": 67140, "loss": 0.5584, "lr": 2.1757142506125534e-05, "epoch": 5.87280309800417, "percentage": 58.73, "elapsed_time": "2:43:30", "remaining_time": "1:54:54", "throughput": 2317.93, "total_tokens": 22739920} {"current_steps": 39435, "total_steps": 67140, "loss": 0.6519, "lr": 2.1750698678910788e-05, "epoch": 5.87354781054513, "percentage": 58.74, "elapsed_time": "2:43:31", "remaining_time": "1:54:53", "throughput": 2317.97, "total_tokens": 22742992} {"current_steps": 39440, "total_steps": 67140, "loss": 0.6146, "lr": 2.174425507127062e-05, "epoch": 5.874292523086089, "percentage": 58.74, "elapsed_time": "2:43:32", "remaining_time": "1:54:51", "throughput": 2318.01, "total_tokens": 22746096} {"current_steps": 39445, "total_steps": 67140, "loss": 0.6381, "lr": 2.1737811683640455e-05, "epoch": 5.8750372356270475, "percentage": 58.75, "elapsed_time": "2:43:33", "remaining_time": "1:54:50", "throughput": 2318.05, "total_tokens": 22749200} {"current_steps": 39450, "total_steps": 67140, "loss": 0.5207, "lr": 2.1731368516455723e-05, "epoch": 5.875781948168007, "percentage": 58.76, "elapsed_time": "2:43:35", "remaining_time": "1:54:49", "throughput": 2318.07, "total_tokens": 22752080} {"current_steps": 39455, "total_steps": 67140, "loss": 0.6769, "lr": 2.1724925570151806e-05, "epoch": 5.876526660708967, "percentage": 58.77, "elapsed_time": "2:43:36", "remaining_time": "1:54:47", "throughput": 2318.11, "total_tokens": 22755152} {"current_steps": 39460, "total_steps": 67140, "loss": 0.7239, "lr": 2.171848284516411e-05, "epoch": 5.8772713732499255, "percentage": 58.77, "elapsed_time": "2:43:37", "remaining_time": "1:54:46", "throughput": 2318.13, "total_tokens": 22757968} {"current_steps": 39465, "total_steps": 67140, "loss": 0.6362, "lr": 2.1712040341927998e-05, "epoch": 5.878016085790884, "percentage": 58.78, "elapsed_time": "2:43:38", "remaining_time": "1:54:45", "throughput": 2318.17, "total_tokens": 22761008} {"current_steps": 39470, "total_steps": 67140, "loss": 0.6829, "lr": 2.170559806087883e-05, "epoch": 5.878760798331844, "percentage": 58.79, "elapsed_time": "2:43:39", "remaining_time": "1:54:43", "throughput": 2318.19, "total_tokens": 22763856} {"current_steps": 39475, "total_steps": 67140, "loss": 0.6808, "lr": 2.1699156002451954e-05, "epoch": 5.879505510872804, "percentage": 58.8, "elapsed_time": "2:43:40", "remaining_time": "1:54:42", "throughput": 2318.2, "total_tokens": 22766480} {"current_steps": 39480, "total_steps": 67140, "loss": 0.5651, "lr": 2.169271416708269e-05, "epoch": 5.880250223413762, "percentage": 58.8, "elapsed_time": "2:43:41", "remaining_time": "1:54:41", "throughput": 2318.21, "total_tokens": 22769072} {"current_steps": 39485, "total_steps": 67140, "loss": 0.6263, "lr": 2.1686272555206363e-05, "epoch": 5.880994935954721, "percentage": 58.81, "elapsed_time": "2:43:42", "remaining_time": "1:54:39", "throughput": 2318.23, "total_tokens": 22771888} {"current_steps": 39490, "total_steps": 67140, "loss": 0.7079, "lr": 2.1679831167258267e-05, "epoch": 5.881739648495681, "percentage": 58.82, "elapsed_time": "2:43:44", "remaining_time": "1:54:38", "throughput": 2318.25, "total_tokens": 22774768} {"current_steps": 39495, "total_steps": 67140, "loss": 0.6042, "lr": 2.1673390003673678e-05, "epoch": 5.8824843610366395, "percentage": 58.82, "elapsed_time": "2:43:45", "remaining_time": "1:54:37", "throughput": 2318.27, "total_tokens": 22777584} {"current_steps": 39500, "total_steps": 67140, "loss": 0.8487, "lr": 2.1666949064887862e-05, "epoch": 5.883229073577599, "percentage": 58.83, "elapsed_time": "2:43:46", "remaining_time": "1:54:35", "throughput": 2318.27, "total_tokens": 22780080} {"current_steps": 39505, "total_steps": 67140, "loss": 0.5763, "lr": 2.1660508351336086e-05, "epoch": 5.883973786118558, "percentage": 58.84, "elapsed_time": "2:43:47", "remaining_time": "1:54:34", "throughput": 2318.3, "total_tokens": 22782960} {"current_steps": 39510, "total_steps": 67140, "loss": 0.7407, "lr": 2.1654067863453568e-05, "epoch": 5.884718498659518, "percentage": 58.85, "elapsed_time": "2:43:48", "remaining_time": "1:54:33", "throughput": 2318.31, "total_tokens": 22785648} {"current_steps": 39515, "total_steps": 67140, "loss": 0.5982, "lr": 2.1647627601675542e-05, "epoch": 5.885463211200476, "percentage": 58.85, "elapsed_time": "2:43:49", "remaining_time": "1:54:31", "throughput": 2318.33, "total_tokens": 22788432} {"current_steps": 39520, "total_steps": 67140, "loss": 0.6973, "lr": 2.164118756643722e-05, "epoch": 5.886207923741436, "percentage": 58.86, "elapsed_time": "2:43:50", "remaining_time": "1:54:30", "throughput": 2318.37, "total_tokens": 22791504} {"current_steps": 39525, "total_steps": 67140, "loss": 0.7198, "lr": 2.163474775817378e-05, "epoch": 5.886952636282395, "percentage": 58.87, "elapsed_time": "2:43:51", "remaining_time": "1:54:29", "throughput": 2318.38, "total_tokens": 22794256} {"current_steps": 39530, "total_steps": 67140, "loss": 0.6892, "lr": 2.1628308177320418e-05, "epoch": 5.887697348823354, "percentage": 58.88, "elapsed_time": "2:43:53", "remaining_time": "1:54:27", "throughput": 2318.41, "total_tokens": 22797104} {"current_steps": 39535, "total_steps": 67140, "loss": 0.7224, "lr": 2.1621868824312264e-05, "epoch": 5.888442061364313, "percentage": 58.88, "elapsed_time": "2:43:54", "remaining_time": "1:54:26", "throughput": 2318.43, "total_tokens": 22799952} {"current_steps": 39540, "total_steps": 67140, "loss": 0.4216, "lr": 2.161542969958449e-05, "epoch": 5.889186773905273, "percentage": 58.89, "elapsed_time": "2:43:55", "remaining_time": "1:54:25", "throughput": 2318.44, "total_tokens": 22802608} {"current_steps": 39545, "total_steps": 67140, "loss": 0.5296, "lr": 2.160899080357221e-05, "epoch": 5.8899314864462315, "percentage": 58.9, "elapsed_time": "2:43:56", "remaining_time": "1:54:24", "throughput": 2318.49, "total_tokens": 22805936} {"current_steps": 39550, "total_steps": 67140, "loss": 0.5719, "lr": 2.1602552136710543e-05, "epoch": 5.890676198987191, "percentage": 58.91, "elapsed_time": "2:43:57", "remaining_time": "1:54:22", "throughput": 2318.52, "total_tokens": 22808848} {"current_steps": 39555, "total_steps": 67140, "loss": 0.6272, "lr": 2.1596113699434597e-05, "epoch": 5.89142091152815, "percentage": 58.91, "elapsed_time": "2:43:58", "remaining_time": "1:54:21", "throughput": 2318.54, "total_tokens": 22811696} {"current_steps": 39560, "total_steps": 67140, "loss": 0.4885, "lr": 2.1589675492179444e-05, "epoch": 5.89216562406911, "percentage": 58.92, "elapsed_time": "2:44:00", "remaining_time": "1:54:20", "throughput": 2318.58, "total_tokens": 22814864} {"current_steps": 39565, "total_steps": 67140, "loss": 0.7066, "lr": 2.1583237515380153e-05, "epoch": 5.892910336610068, "percentage": 58.93, "elapsed_time": "2:44:01", "remaining_time": "1:54:18", "throughput": 2318.61, "total_tokens": 22817872} {"current_steps": 39570, "total_steps": 67140, "loss": 0.7558, "lr": 2.1576799769471787e-05, "epoch": 5.893655049151028, "percentage": 58.94, "elapsed_time": "2:44:02", "remaining_time": "1:54:17", "throughput": 2318.64, "total_tokens": 22820720} {"current_steps": 39575, "total_steps": 67140, "loss": 0.6967, "lr": 2.157036225488938e-05, "epoch": 5.894399761691987, "percentage": 58.94, "elapsed_time": "2:44:03", "remaining_time": "1:54:16", "throughput": 2318.66, "total_tokens": 22823536} {"current_steps": 39580, "total_steps": 67140, "loss": 0.586, "lr": 2.1563924972067934e-05, "epoch": 5.895144474232946, "percentage": 58.95, "elapsed_time": "2:44:04", "remaining_time": "1:54:14", "throughput": 2318.7, "total_tokens": 22826608} {"current_steps": 39585, "total_steps": 67140, "loss": 0.645, "lr": 2.155748792144247e-05, "epoch": 5.895889186773905, "percentage": 58.96, "elapsed_time": "2:44:05", "remaining_time": "1:54:13", "throughput": 2318.72, "total_tokens": 22829488} {"current_steps": 39590, "total_steps": 67140, "loss": 0.55, "lr": 2.1551051103447982e-05, "epoch": 5.896633899314865, "percentage": 58.97, "elapsed_time": "2:44:06", "remaining_time": "1:54:12", "throughput": 2318.75, "total_tokens": 22832464} {"current_steps": 39595, "total_steps": 67140, "loss": 0.5326, "lr": 2.1544614518519434e-05, "epoch": 5.897378611855824, "percentage": 58.97, "elapsed_time": "2:44:07", "remaining_time": "1:54:10", "throughput": 2318.77, "total_tokens": 22835184} {"current_steps": 39600, "total_steps": 67140, "loss": 0.5866, "lr": 2.1538178167091787e-05, "epoch": 5.898123324396783, "percentage": 58.98, "elapsed_time": "2:44:09", "remaining_time": "1:54:09", "throughput": 2318.79, "total_tokens": 22838000} {"current_steps": 39605, "total_steps": 67140, "loss": 0.6154, "lr": 2.153174204959999e-05, "epoch": 5.898868036937742, "percentage": 58.99, "elapsed_time": "2:44:10", "remaining_time": "1:54:08", "throughput": 2318.81, "total_tokens": 22840880} {"current_steps": 39610, "total_steps": 67140, "loss": 0.4606, "lr": 2.1525306166478957e-05, "epoch": 5.899612749478701, "percentage": 59.0, "elapsed_time": "2:44:11", "remaining_time": "1:54:07", "throughput": 2318.86, "total_tokens": 22844176} {"current_steps": 39615, "total_steps": 67140, "loss": 0.5593, "lr": 2.151887051816362e-05, "epoch": 5.90035746201966, "percentage": 59.0, "elapsed_time": "2:44:12", "remaining_time": "1:54:05", "throughput": 2318.88, "total_tokens": 22846992} {"current_steps": 39620, "total_steps": 67140, "loss": 0.5118, "lr": 2.1512435105088847e-05, "epoch": 5.90110217456062, "percentage": 59.01, "elapsed_time": "2:44:13", "remaining_time": "1:54:04", "throughput": 2318.9, "total_tokens": 22849680} {"current_steps": 39625, "total_steps": 67140, "loss": 0.6528, "lr": 2.1505999927689536e-05, "epoch": 5.901846887101579, "percentage": 59.02, "elapsed_time": "2:44:14", "remaining_time": "1:54:03", "throughput": 2318.93, "total_tokens": 22852688} {"current_steps": 39630, "total_steps": 67140, "loss": 0.7666, "lr": 2.149956498640054e-05, "epoch": 5.9025915996425375, "percentage": 59.03, "elapsed_time": "2:44:16", "remaining_time": "1:54:01", "throughput": 2318.97, "total_tokens": 22855952} {"current_steps": 39635, "total_steps": 67140, "loss": 0.5883, "lr": 2.1493130281656708e-05, "epoch": 5.903336312183497, "percentage": 59.03, "elapsed_time": "2:44:17", "remaining_time": "1:54:00", "throughput": 2319.0, "total_tokens": 22858768} {"current_steps": 39640, "total_steps": 67140, "loss": 0.9395, "lr": 2.1486695813892883e-05, "epoch": 5.904081024724457, "percentage": 59.04, "elapsed_time": "2:44:18", "remaining_time": "1:53:59", "throughput": 2319.01, "total_tokens": 22861424} {"current_steps": 39645, "total_steps": 67140, "loss": 0.655, "lr": 2.1480261583543866e-05, "epoch": 5.904825737265416, "percentage": 59.05, "elapsed_time": "2:44:19", "remaining_time": "1:53:57", "throughput": 2319.04, "total_tokens": 22864336} {"current_steps": 39650, "total_steps": 67140, "loss": 0.639, "lr": 2.1473827591044464e-05, "epoch": 5.905570449806374, "percentage": 59.06, "elapsed_time": "2:44:20", "remaining_time": "1:53:56", "throughput": 2319.05, "total_tokens": 22867088} {"current_steps": 39655, "total_steps": 67140, "loss": 0.8247, "lr": 2.1467393836829454e-05, "epoch": 5.906315162347334, "percentage": 59.06, "elapsed_time": "2:44:21", "remaining_time": "1:53:55", "throughput": 2319.08, "total_tokens": 22869936} {"current_steps": 39660, "total_steps": 67140, "loss": 0.5592, "lr": 2.146096032133361e-05, "epoch": 5.907059874888293, "percentage": 59.07, "elapsed_time": "2:44:22", "remaining_time": "1:53:53", "throughput": 2319.11, "total_tokens": 22872976} {"current_steps": 39665, "total_steps": 67140, "loss": 0.5526, "lr": 2.1454527044991673e-05, "epoch": 5.907804587429252, "percentage": 59.08, "elapsed_time": "2:44:23", "remaining_time": "1:53:52", "throughput": 2319.13, "total_tokens": 22875824} {"current_steps": 39670, "total_steps": 67140, "loss": 0.5385, "lr": 2.144809400823839e-05, "epoch": 5.908549299970211, "percentage": 59.09, "elapsed_time": "2:44:25", "remaining_time": "1:53:51", "throughput": 2319.16, "total_tokens": 22878672} {"current_steps": 39675, "total_steps": 67140, "loss": 0.4583, "lr": 2.1441661211508465e-05, "epoch": 5.909294012511171, "percentage": 59.09, "elapsed_time": "2:44:26", "remaining_time": "1:53:49", "throughput": 2319.17, "total_tokens": 22881392} {"current_steps": 39680, "total_steps": 67140, "loss": 0.5749, "lr": 2.1435228655236608e-05, "epoch": 5.91003872505213, "percentage": 59.1, "elapsed_time": "2:44:27", "remaining_time": "1:53:48", "throughput": 2319.19, "total_tokens": 22884144} {"current_steps": 39685, "total_steps": 67140, "loss": 0.727, "lr": 2.1428796339857513e-05, "epoch": 5.910783437593089, "percentage": 59.11, "elapsed_time": "2:44:28", "remaining_time": "1:53:47", "throughput": 2319.21, "total_tokens": 22886960} {"current_steps": 39690, "total_steps": 67140, "loss": 0.67, "lr": 2.1422364265805832e-05, "epoch": 5.911528150134048, "percentage": 59.12, "elapsed_time": "2:44:29", "remaining_time": "1:53:45", "throughput": 2319.22, "total_tokens": 22889520} {"current_steps": 39695, "total_steps": 67140, "loss": 0.6575, "lr": 2.1415932433516243e-05, "epoch": 5.912272862675008, "percentage": 59.12, "elapsed_time": "2:44:30", "remaining_time": "1:53:44", "throughput": 2319.23, "total_tokens": 22892240} {"current_steps": 39700, "total_steps": 67140, "loss": 0.5243, "lr": 2.140950084342336e-05, "epoch": 5.913017575215966, "percentage": 59.13, "elapsed_time": "2:44:31", "remaining_time": "1:53:43", "throughput": 2319.25, "total_tokens": 22895024} {"current_steps": 39705, "total_steps": 67140, "loss": 0.5755, "lr": 2.1403069495961813e-05, "epoch": 5.913762287756926, "percentage": 59.14, "elapsed_time": "2:44:32", "remaining_time": "1:53:41", "throughput": 2319.28, "total_tokens": 22898000} {"current_steps": 39710, "total_steps": 67140, "loss": 0.5438, "lr": 2.13966383915662e-05, "epoch": 5.914507000297885, "percentage": 59.15, "elapsed_time": "2:44:34", "remaining_time": "1:53:40", "throughput": 2319.31, "total_tokens": 22900848} {"current_steps": 39715, "total_steps": 67140, "loss": 0.611, "lr": 2.1390207530671115e-05, "epoch": 5.915251712838844, "percentage": 59.15, "elapsed_time": "2:44:35", "remaining_time": "1:53:39", "throughput": 2319.33, "total_tokens": 22903728} {"current_steps": 39720, "total_steps": 67140, "loss": 0.5295, "lr": 2.1383776913711135e-05, "epoch": 5.915996425379803, "percentage": 59.16, "elapsed_time": "2:44:36", "remaining_time": "1:53:37", "throughput": 2319.35, "total_tokens": 22906480} {"current_steps": 39725, "total_steps": 67140, "loss": 0.5174, "lr": 2.1377346541120803e-05, "epoch": 5.916741137920763, "percentage": 59.17, "elapsed_time": "2:44:37", "remaining_time": "1:53:36", "throughput": 2319.35, "total_tokens": 22909072} {"current_steps": 39730, "total_steps": 67140, "loss": 0.618, "lr": 2.1370916413334663e-05, "epoch": 5.917485850461722, "percentage": 59.17, "elapsed_time": "2:44:38", "remaining_time": "1:53:35", "throughput": 2319.41, "total_tokens": 22912368} {"current_steps": 39735, "total_steps": 67140, "loss": 0.5714, "lr": 2.1364486530787247e-05, "epoch": 5.918230563002681, "percentage": 59.18, "elapsed_time": "2:44:39", "remaining_time": "1:53:33", "throughput": 2319.42, "total_tokens": 22915088} {"current_steps": 39740, "total_steps": 67140, "loss": 0.6883, "lr": 2.1358056893913047e-05, "epoch": 5.91897527554364, "percentage": 59.19, "elapsed_time": "2:44:40", "remaining_time": "1:53:32", "throughput": 2319.45, "total_tokens": 22918064} {"current_steps": 39745, "total_steps": 67140, "loss": 0.5724, "lr": 2.1351627503146547e-05, "epoch": 5.9197199880846, "percentage": 59.2, "elapsed_time": "2:44:41", "remaining_time": "1:53:31", "throughput": 2319.46, "total_tokens": 22920688} {"current_steps": 39750, "total_steps": 67140, "loss": 0.7314, "lr": 2.134519835892223e-05, "epoch": 5.920464700625558, "percentage": 59.2, "elapsed_time": "2:44:43", "remaining_time": "1:53:30", "throughput": 2319.5, "total_tokens": 22923760} {"current_steps": 39755, "total_steps": 67140, "loss": 0.3921, "lr": 2.133876946167455e-05, "epoch": 5.921209413166518, "percentage": 59.21, "elapsed_time": "2:44:44", "remaining_time": "1:53:28", "throughput": 2319.52, "total_tokens": 22926704} {"current_steps": 39760, "total_steps": 67140, "loss": 0.4816, "lr": 2.1332340811837944e-05, "epoch": 5.921954125707477, "percentage": 59.22, "elapsed_time": "2:44:45", "remaining_time": "1:53:27", "throughput": 2319.54, "total_tokens": 22929520} {"current_steps": 39765, "total_steps": 67140, "loss": 0.7864, "lr": 2.1325912409846834e-05, "epoch": 5.9226988382484365, "percentage": 59.23, "elapsed_time": "2:44:46", "remaining_time": "1:53:26", "throughput": 2319.58, "total_tokens": 22932496} {"current_steps": 39770, "total_steps": 67140, "loss": 0.7187, "lr": 2.131948425613563e-05, "epoch": 5.923443550789395, "percentage": 59.23, "elapsed_time": "2:44:47", "remaining_time": "1:53:24", "throughput": 2319.59, "total_tokens": 22935216} {"current_steps": 39775, "total_steps": 67140, "loss": 0.6835, "lr": 2.1313056351138715e-05, "epoch": 5.924188263330355, "percentage": 59.24, "elapsed_time": "2:44:48", "remaining_time": "1:53:23", "throughput": 2319.63, "total_tokens": 22938224} {"current_steps": 39780, "total_steps": 67140, "loss": 0.7488, "lr": 2.1306628695290458e-05, "epoch": 5.924932975871314, "percentage": 59.25, "elapsed_time": "2:44:49", "remaining_time": "1:53:22", "throughput": 2319.65, "total_tokens": 22941040} {"current_steps": 39785, "total_steps": 67140, "loss": 0.6443, "lr": 2.1300201289025215e-05, "epoch": 5.925677688412273, "percentage": 59.26, "elapsed_time": "2:44:50", "remaining_time": "1:53:20", "throughput": 2319.65, "total_tokens": 22943504} {"current_steps": 39790, "total_steps": 67140, "loss": 0.8716, "lr": 2.1293774132777332e-05, "epoch": 5.926422400953232, "percentage": 59.26, "elapsed_time": "2:44:52", "remaining_time": "1:53:19", "throughput": 2319.66, "total_tokens": 22946160} {"current_steps": 39795, "total_steps": 67140, "loss": 0.5924, "lr": 2.128734722698112e-05, "epoch": 5.927167113494191, "percentage": 59.27, "elapsed_time": "2:44:53", "remaining_time": "1:53:18", "throughput": 2319.7, "total_tokens": 22949296} {"current_steps": 39800, "total_steps": 67140, "loss": 0.5427, "lr": 2.128092057207089e-05, "epoch": 5.92791182603515, "percentage": 59.28, "elapsed_time": "2:44:54", "remaining_time": "1:53:16", "throughput": 2319.72, "total_tokens": 22952176} {"current_steps": 39805, "total_steps": 67140, "loss": 0.551, "lr": 2.127449416848093e-05, "epoch": 5.92865653857611, "percentage": 59.29, "elapsed_time": "2:44:55", "remaining_time": "1:53:15", "throughput": 2319.73, "total_tokens": 22954864} {"current_steps": 39810, "total_steps": 67140, "loss": 0.7086, "lr": 2.1268068016645505e-05, "epoch": 5.929401251117069, "percentage": 59.29, "elapsed_time": "2:44:56", "remaining_time": "1:53:14", "throughput": 2319.75, "total_tokens": 22957680} {"current_steps": 39815, "total_steps": 67140, "loss": 0.537, "lr": 2.1261642116998877e-05, "epoch": 5.930145963658028, "percentage": 59.3, "elapsed_time": "2:44:57", "remaining_time": "1:53:12", "throughput": 2319.77, "total_tokens": 22960432} {"current_steps": 39820, "total_steps": 67140, "loss": 0.6967, "lr": 2.1255216469975265e-05, "epoch": 5.930890676198987, "percentage": 59.31, "elapsed_time": "2:44:58", "remaining_time": "1:53:11", "throughput": 2319.78, "total_tokens": 22963120} {"current_steps": 39825, "total_steps": 67140, "loss": 0.4979, "lr": 2.1248791076008906e-05, "epoch": 5.931635388739946, "percentage": 59.32, "elapsed_time": "2:44:59", "remaining_time": "1:53:10", "throughput": 2319.8, "total_tokens": 22965872} {"current_steps": 39830, "total_steps": 67140, "loss": 0.5478, "lr": 2.1242365935533988e-05, "epoch": 5.932380101280906, "percentage": 59.32, "elapsed_time": "2:45:01", "remaining_time": "1:53:08", "throughput": 2319.81, "total_tokens": 22968528} {"current_steps": 39835, "total_steps": 67140, "loss": 0.7893, "lr": 2.123594104898471e-05, "epoch": 5.933124813821864, "percentage": 59.33, "elapsed_time": "2:45:02", "remaining_time": "1:53:07", "throughput": 2319.83, "total_tokens": 22971440} {"current_steps": 39840, "total_steps": 67140, "loss": 0.5231, "lr": 2.1229516416795224e-05, "epoch": 5.933869526362824, "percentage": 59.34, "elapsed_time": "2:45:03", "remaining_time": "1:53:06", "throughput": 2319.86, "total_tokens": 22974320} {"current_steps": 39845, "total_steps": 67140, "loss": 0.5573, "lr": 2.1223092039399695e-05, "epoch": 5.934614238903783, "percentage": 59.35, "elapsed_time": "2:45:04", "remaining_time": "1:53:04", "throughput": 2319.9, "total_tokens": 22977616} {"current_steps": 39850, "total_steps": 67140, "loss": 0.743, "lr": 2.121666791723225e-05, "epoch": 5.9353589514447425, "percentage": 59.35, "elapsed_time": "2:45:05", "remaining_time": "1:53:03", "throughput": 2319.93, "total_tokens": 22980432} {"current_steps": 39855, "total_steps": 67140, "loss": 0.4142, "lr": 2.1210244050727014e-05, "epoch": 5.936103663985701, "percentage": 59.36, "elapsed_time": "2:45:06", "remaining_time": "1:53:02", "throughput": 2319.95, "total_tokens": 22983216} {"current_steps": 39860, "total_steps": 67140, "loss": 0.6625, "lr": 2.1203820440318063e-05, "epoch": 5.936848376526661, "percentage": 59.37, "elapsed_time": "2:45:07", "remaining_time": "1:53:00", "throughput": 2319.96, "total_tokens": 22985936} {"current_steps": 39865, "total_steps": 67140, "loss": 0.6314, "lr": 2.1197397086439495e-05, "epoch": 5.93759308906762, "percentage": 59.38, "elapsed_time": "2:45:08", "remaining_time": "1:52:59", "throughput": 2319.96, "total_tokens": 22988528} {"current_steps": 39870, "total_steps": 67140, "loss": 0.5761, "lr": 2.1190973989525377e-05, "epoch": 5.938337801608579, "percentage": 59.38, "elapsed_time": "2:45:10", "remaining_time": "1:52:58", "throughput": 2319.98, "total_tokens": 22991344} {"current_steps": 39875, "total_steps": 67140, "loss": 0.759, "lr": 2.118455115000974e-05, "epoch": 5.939082514149538, "percentage": 59.39, "elapsed_time": "2:45:11", "remaining_time": "1:52:56", "throughput": 2320.0, "total_tokens": 22994096} {"current_steps": 39880, "total_steps": 67140, "loss": 0.5044, "lr": 2.117812856832663e-05, "epoch": 5.939827226690498, "percentage": 59.4, "elapsed_time": "2:45:12", "remaining_time": "1:52:55", "throughput": 2320.03, "total_tokens": 22997040} {"current_steps": 39885, "total_steps": 67140, "loss": 0.4879, "lr": 2.1171706244910055e-05, "epoch": 5.940571939231456, "percentage": 59.41, "elapsed_time": "2:45:13", "remaining_time": "1:52:54", "throughput": 2320.05, "total_tokens": 22999824} {"current_steps": 39890, "total_steps": 67140, "loss": 0.7076, "lr": 2.1165284180194003e-05, "epoch": 5.941316651772416, "percentage": 59.41, "elapsed_time": "2:45:14", "remaining_time": "1:52:52", "throughput": 2320.09, "total_tokens": 23002896} {"current_steps": 39895, "total_steps": 67140, "loss": 0.551, "lr": 2.1158862374612465e-05, "epoch": 5.942061364313375, "percentage": 59.42, "elapsed_time": "2:45:15", "remaining_time": "1:52:51", "throughput": 2320.1, "total_tokens": 23005616} {"current_steps": 39900, "total_steps": 67140, "loss": 0.4851, "lr": 2.1152440828599383e-05, "epoch": 5.9428060768543345, "percentage": 59.43, "elapsed_time": "2:45:16", "remaining_time": "1:52:50", "throughput": 2320.13, "total_tokens": 23008656} {"current_steps": 39905, "total_steps": 67140, "loss": 0.4803, "lr": 2.114601954258871e-05, "epoch": 5.943550789395293, "percentage": 59.44, "elapsed_time": "2:45:18", "remaining_time": "1:52:49", "throughput": 2320.18, "total_tokens": 23011952} {"current_steps": 39910, "total_steps": 67140, "loss": 0.7274, "lr": 2.113959851701436e-05, "epoch": 5.944295501936253, "percentage": 59.44, "elapsed_time": "2:45:19", "remaining_time": "1:52:47", "throughput": 2320.24, "total_tokens": 23015280} {"current_steps": 39915, "total_steps": 67140, "loss": 0.6276, "lr": 2.1133177752310252e-05, "epoch": 5.945040214477212, "percentage": 59.45, "elapsed_time": "2:45:20", "remaining_time": "1:52:46", "throughput": 2320.28, "total_tokens": 23018480} {"current_steps": 39920, "total_steps": 67140, "loss": 0.7346, "lr": 2.112675724891027e-05, "epoch": 5.945784927018171, "percentage": 59.46, "elapsed_time": "2:45:21", "remaining_time": "1:52:45", "throughput": 2320.3, "total_tokens": 23021168} {"current_steps": 39925, "total_steps": 67140, "loss": 0.5359, "lr": 2.1120337007248284e-05, "epoch": 5.94652963955913, "percentage": 59.47, "elapsed_time": "2:45:22", "remaining_time": "1:52:43", "throughput": 2320.32, "total_tokens": 23023952} {"current_steps": 39930, "total_steps": 67140, "loss": 0.5851, "lr": 2.1113917027758145e-05, "epoch": 5.94727435210009, "percentage": 59.47, "elapsed_time": "2:45:23", "remaining_time": "1:52:42", "throughput": 2320.34, "total_tokens": 23026800} {"current_steps": 39935, "total_steps": 67140, "loss": 0.5615, "lr": 2.1107497310873708e-05, "epoch": 5.9480190646410485, "percentage": 59.48, "elapsed_time": "2:45:25", "remaining_time": "1:52:41", "throughput": 2320.36, "total_tokens": 23029552} {"current_steps": 39940, "total_steps": 67140, "loss": 0.6827, "lr": 2.1101077857028774e-05, "epoch": 5.948763777182008, "percentage": 59.49, "elapsed_time": "2:45:26", "remaining_time": "1:52:39", "throughput": 2320.37, "total_tokens": 23032336} {"current_steps": 39945, "total_steps": 67140, "loss": 0.5346, "lr": 2.1094658666657137e-05, "epoch": 5.949508489722967, "percentage": 59.5, "elapsed_time": "2:45:27", "remaining_time": "1:52:38", "throughput": 2320.4, "total_tokens": 23035248} {"current_steps": 39950, "total_steps": 67140, "loss": 0.5423, "lr": 2.1088239740192588e-05, "epoch": 5.9502532022639265, "percentage": 59.5, "elapsed_time": "2:45:28", "remaining_time": "1:52:37", "throughput": 2320.41, "total_tokens": 23037904} {"current_steps": 39955, "total_steps": 67140, "loss": 0.8647, "lr": 2.1081821078068902e-05, "epoch": 5.950997914804885, "percentage": 59.51, "elapsed_time": "2:45:29", "remaining_time": "1:52:35", "throughput": 2320.43, "total_tokens": 23040688} {"current_steps": 39960, "total_steps": 67140, "loss": 0.7906, "lr": 2.1075402680719814e-05, "epoch": 5.951742627345844, "percentage": 59.52, "elapsed_time": "2:45:30", "remaining_time": "1:52:34", "throughput": 2320.46, "total_tokens": 23043632} {"current_steps": 39965, "total_steps": 67140, "loss": 0.5991, "lr": 2.1068984548579053e-05, "epoch": 5.952487339886804, "percentage": 59.52, "elapsed_time": "2:45:31", "remaining_time": "1:52:33", "throughput": 2320.46, "total_tokens": 23046160} {"current_steps": 39970, "total_steps": 67140, "loss": 0.8961, "lr": 2.106256668208034e-05, "epoch": 5.953232052427763, "percentage": 59.53, "elapsed_time": "2:45:32", "remaining_time": "1:52:31", "throughput": 2320.48, "total_tokens": 23049008} {"current_steps": 39975, "total_steps": 67140, "loss": 0.6448, "lr": 2.1056149081657368e-05, "epoch": 5.953976764968722, "percentage": 59.54, "elapsed_time": "2:45:33", "remaining_time": "1:52:30", "throughput": 2320.5, "total_tokens": 23051792} {"current_steps": 39980, "total_steps": 67140, "loss": 0.5646, "lr": 2.1049731747743793e-05, "epoch": 5.954721477509681, "percentage": 59.55, "elapsed_time": "2:45:35", "remaining_time": "1:52:29", "throughput": 2320.53, "total_tokens": 23054768} {"current_steps": 39985, "total_steps": 67140, "loss": 0.7149, "lr": 2.104331468077329e-05, "epoch": 5.9554661900506405, "percentage": 59.55, "elapsed_time": "2:45:36", "remaining_time": "1:52:28", "throughput": 2320.55, "total_tokens": 23057680} {"current_steps": 39990, "total_steps": 67140, "loss": 0.814, "lr": 2.10368978811795e-05, "epoch": 5.9562109025916, "percentage": 59.56, "elapsed_time": "2:45:37", "remaining_time": "1:52:26", "throughput": 2320.6, "total_tokens": 23060944} {"current_steps": 39995, "total_steps": 67140, "loss": 0.5656, "lr": 2.1030481349396028e-05, "epoch": 5.956955615132559, "percentage": 59.57, "elapsed_time": "2:45:38", "remaining_time": "1:52:25", "throughput": 2320.63, "total_tokens": 23063792} {"current_steps": 40000, "total_steps": 67140, "loss": 0.6237, "lr": 2.1024065085856498e-05, "epoch": 5.957700327673518, "percentage": 59.58, "elapsed_time": "2:45:39", "remaining_time": "1:52:24", "throughput": 2320.67, "total_tokens": 23066896} {"current_steps": 40005, "total_steps": 67140, "loss": 0.7391, "lr": 2.1017649090994477e-05, "epoch": 5.958445040214477, "percentage": 59.58, "elapsed_time": "2:45:40", "remaining_time": "1:52:22", "throughput": 2320.69, "total_tokens": 23069712} {"current_steps": 40010, "total_steps": 67140, "loss": 0.5687, "lr": 2.1011233365243538e-05, "epoch": 5.959189752755436, "percentage": 59.59, "elapsed_time": "2:45:42", "remaining_time": "1:52:21", "throughput": 2320.71, "total_tokens": 23072624} {"current_steps": 40015, "total_steps": 67140, "loss": 0.6217, "lr": 2.1004817909037245e-05, "epoch": 5.959934465296396, "percentage": 59.6, "elapsed_time": "2:45:43", "remaining_time": "1:52:20", "throughput": 2320.74, "total_tokens": 23075504} {"current_steps": 40020, "total_steps": 67140, "loss": 0.3785, "lr": 2.0998402722809105e-05, "epoch": 5.9606791778373545, "percentage": 59.61, "elapsed_time": "2:45:44", "remaining_time": "1:52:18", "throughput": 2320.76, "total_tokens": 23078352} {"current_steps": 40025, "total_steps": 67140, "loss": 0.6192, "lr": 2.0991987806992635e-05, "epoch": 5.961423890378314, "percentage": 59.61, "elapsed_time": "2:45:45", "remaining_time": "1:52:17", "throughput": 2320.78, "total_tokens": 23081200} {"current_steps": 40030, "total_steps": 67140, "loss": 0.6256, "lr": 2.0985573162021337e-05, "epoch": 5.962168602919273, "percentage": 59.62, "elapsed_time": "2:45:46", "remaining_time": "1:52:16", "throughput": 2320.79, "total_tokens": 23083824} {"current_steps": 40035, "total_steps": 67140, "loss": 0.5609, "lr": 2.0979158788328684e-05, "epoch": 5.9629133154602325, "percentage": 59.63, "elapsed_time": "2:45:47", "remaining_time": "1:52:14", "throughput": 2320.83, "total_tokens": 23086928} {"current_steps": 40040, "total_steps": 67140, "loss": 0.6563, "lr": 2.097274468634813e-05, "epoch": 5.963658028001191, "percentage": 59.64, "elapsed_time": "2:45:48", "remaining_time": "1:52:13", "throughput": 2320.84, "total_tokens": 23089648} {"current_steps": 40045, "total_steps": 67140, "loss": 0.5402, "lr": 2.0966330856513118e-05, "epoch": 5.964402740542151, "percentage": 59.64, "elapsed_time": "2:45:50", "remaining_time": "1:52:12", "throughput": 2320.87, "total_tokens": 23092688} {"current_steps": 40050, "total_steps": 67140, "loss": 0.7958, "lr": 2.095991729925707e-05, "epoch": 5.96514745308311, "percentage": 59.65, "elapsed_time": "2:45:51", "remaining_time": "1:52:11", "throughput": 2320.91, "total_tokens": 23095824} {"current_steps": 40055, "total_steps": 67140, "loss": 0.6565, "lr": 2.095350401501339e-05, "epoch": 5.965892165624069, "percentage": 59.66, "elapsed_time": "2:45:52", "remaining_time": "1:52:09", "throughput": 2320.94, "total_tokens": 23098768} {"current_steps": 40060, "total_steps": 67140, "loss": 0.5789, "lr": 2.094709100421545e-05, "epoch": 5.966636878165028, "percentage": 59.67, "elapsed_time": "2:45:53", "remaining_time": "1:52:08", "throughput": 2320.96, "total_tokens": 23101488} {"current_steps": 40065, "total_steps": 67140, "loss": 0.7242, "lr": 2.094067826729662e-05, "epoch": 5.967381590705988, "percentage": 59.67, "elapsed_time": "2:45:54", "remaining_time": "1:52:07", "throughput": 2320.99, "total_tokens": 23104528} {"current_steps": 40070, "total_steps": 67140, "loss": 0.5435, "lr": 2.093426580469025e-05, "epoch": 5.9681263032469465, "percentage": 59.68, "elapsed_time": "2:45:55", "remaining_time": "1:52:05", "throughput": 2321.02, "total_tokens": 23107408} {"current_steps": 40075, "total_steps": 67140, "loss": 0.5333, "lr": 2.0927853616829668e-05, "epoch": 5.968871015787906, "percentage": 59.69, "elapsed_time": "2:45:56", "remaining_time": "1:52:04", "throughput": 2321.02, "total_tokens": 23109904} {"current_steps": 40080, "total_steps": 67140, "loss": 0.6541, "lr": 2.0921441704148177e-05, "epoch": 5.969615728328865, "percentage": 59.7, "elapsed_time": "2:45:57", "remaining_time": "1:52:03", "throughput": 2321.04, "total_tokens": 23112688} {"current_steps": 40085, "total_steps": 67140, "loss": 0.5291, "lr": 2.0915030067079084e-05, "epoch": 5.9703604408698245, "percentage": 59.7, "elapsed_time": "2:45:59", "remaining_time": "1:52:01", "throughput": 2321.07, "total_tokens": 23115568} {"current_steps": 40090, "total_steps": 67140, "loss": 0.5926, "lr": 2.090861870605564e-05, "epoch": 5.971105153410783, "percentage": 59.71, "elapsed_time": "2:46:00", "remaining_time": "1:52:00", "throughput": 2321.08, "total_tokens": 23118256} {"current_steps": 40095, "total_steps": 67140, "loss": 0.6622, "lr": 2.0902207621511123e-05, "epoch": 5.971849865951743, "percentage": 59.72, "elapsed_time": "2:46:01", "remaining_time": "1:51:59", "throughput": 2321.12, "total_tokens": 23121360} {"current_steps": 40100, "total_steps": 67140, "loss": 0.7008, "lr": 2.0895796813878743e-05, "epoch": 5.972594578492702, "percentage": 59.73, "elapsed_time": "2:46:02", "remaining_time": "1:51:57", "throughput": 2321.15, "total_tokens": 23124272} {"current_steps": 40105, "total_steps": 67140, "loss": 0.7866, "lr": 2.0889386283591732e-05, "epoch": 5.973339291033661, "percentage": 59.73, "elapsed_time": "2:46:03", "remaining_time": "1:51:56", "throughput": 2321.17, "total_tokens": 23127120} {"current_steps": 40110, "total_steps": 67140, "loss": 0.5054, "lr": 2.088297603108328e-05, "epoch": 5.97408400357462, "percentage": 59.74, "elapsed_time": "2:46:04", "remaining_time": "1:51:55", "throughput": 2321.19, "total_tokens": 23129968} {"current_steps": 40115, "total_steps": 67140, "loss": 0.4786, "lr": 2.0876566056786572e-05, "epoch": 5.97482871611558, "percentage": 59.75, "elapsed_time": "2:46:05", "remaining_time": "1:51:53", "throughput": 2321.21, "total_tokens": 23132784} {"current_steps": 40120, "total_steps": 67140, "loss": 0.7877, "lr": 2.087015636113477e-05, "epoch": 5.9755734286565385, "percentage": 59.76, "elapsed_time": "2:46:06", "remaining_time": "1:51:52", "throughput": 2321.24, "total_tokens": 23135792} {"current_steps": 40125, "total_steps": 67140, "loss": 0.5725, "lr": 2.0863746944561e-05, "epoch": 5.976318141197497, "percentage": 59.76, "elapsed_time": "2:46:08", "remaining_time": "1:51:51", "throughput": 2321.26, "total_tokens": 23138608} {"current_steps": 40130, "total_steps": 67140, "loss": 0.5794, "lr": 2.0857337807498398e-05, "epoch": 5.977062853738457, "percentage": 59.77, "elapsed_time": "2:46:09", "remaining_time": "1:51:49", "throughput": 2321.28, "total_tokens": 23141424} {"current_steps": 40135, "total_steps": 67140, "loss": 0.763, "lr": 2.085092895038007e-05, "epoch": 5.977807566279417, "percentage": 59.78, "elapsed_time": "2:46:10", "remaining_time": "1:51:48", "throughput": 2321.3, "total_tokens": 23144240} {"current_steps": 40140, "total_steps": 67140, "loss": 0.7251, "lr": 2.08445203736391e-05, "epoch": 5.978552278820375, "percentage": 59.79, "elapsed_time": "2:46:11", "remaining_time": "1:51:47", "throughput": 2321.33, "total_tokens": 23147216} {"current_steps": 40145, "total_steps": 67140, "loss": 0.6279, "lr": 2.0838112077708533e-05, "epoch": 5.979296991361334, "percentage": 59.79, "elapsed_time": "2:46:12", "remaining_time": "1:51:45", "throughput": 2321.36, "total_tokens": 23150160} {"current_steps": 40150, "total_steps": 67140, "loss": 0.7744, "lr": 2.0831704063021433e-05, "epoch": 5.980041703902294, "percentage": 59.8, "elapsed_time": "2:46:13", "remaining_time": "1:51:44", "throughput": 2321.39, "total_tokens": 23153104} {"current_steps": 40155, "total_steps": 67140, "loss": 0.6207, "lr": 2.0825296330010834e-05, "epoch": 5.980786416443253, "percentage": 59.81, "elapsed_time": "2:46:14", "remaining_time": "1:51:43", "throughput": 2321.41, "total_tokens": 23155984} {"current_steps": 40160, "total_steps": 67140, "loss": 0.6957, "lr": 2.0818888879109728e-05, "epoch": 5.981531128984212, "percentage": 59.82, "elapsed_time": "2:46:16", "remaining_time": "1:51:42", "throughput": 2321.44, "total_tokens": 23158896} {"current_steps": 40165, "total_steps": 67140, "loss": 0.5999, "lr": 2.0812481710751115e-05, "epoch": 5.982275841525171, "percentage": 59.82, "elapsed_time": "2:46:17", "remaining_time": "1:51:40", "throughput": 2321.47, "total_tokens": 23161904} {"current_steps": 40170, "total_steps": 67140, "loss": 0.7865, "lr": 2.0806074825367965e-05, "epoch": 5.9830205540661305, "percentage": 59.83, "elapsed_time": "2:46:18", "remaining_time": "1:51:39", "throughput": 2321.49, "total_tokens": 23164752} {"current_steps": 40175, "total_steps": 67140, "loss": 0.7334, "lr": 2.079966822339322e-05, "epoch": 5.983765266607089, "percentage": 59.84, "elapsed_time": "2:46:19", "remaining_time": "1:51:38", "throughput": 2321.51, "total_tokens": 23167600} {"current_steps": 40180, "total_steps": 67140, "loss": 0.5083, "lr": 2.079326190525983e-05, "epoch": 5.984509979148049, "percentage": 59.85, "elapsed_time": "2:46:20", "remaining_time": "1:51:36", "throughput": 2321.56, "total_tokens": 23170896} {"current_steps": 40185, "total_steps": 67140, "loss": 0.7102, "lr": 2.0786855871400695e-05, "epoch": 5.985254691689008, "percentage": 59.85, "elapsed_time": "2:46:21", "remaining_time": "1:51:35", "throughput": 2321.58, "total_tokens": 23173712} {"current_steps": 40190, "total_steps": 67140, "loss": 0.6259, "lr": 2.0780450122248706e-05, "epoch": 5.985999404229967, "percentage": 59.86, "elapsed_time": "2:46:22", "remaining_time": "1:51:34", "throughput": 2321.6, "total_tokens": 23176528} {"current_steps": 40195, "total_steps": 67140, "loss": 0.5033, "lr": 2.0774044658236742e-05, "epoch": 5.986744116770926, "percentage": 59.87, "elapsed_time": "2:46:24", "remaining_time": "1:51:32", "throughput": 2321.62, "total_tokens": 23179312} {"current_steps": 40200, "total_steps": 67140, "loss": 0.5842, "lr": 2.0767639479797663e-05, "epoch": 5.987488829311886, "percentage": 59.87, "elapsed_time": "2:46:25", "remaining_time": "1:51:31", "throughput": 2321.65, "total_tokens": 23182352} {"current_steps": 40205, "total_steps": 67140, "loss": 0.5614, "lr": 2.0761234587364294e-05, "epoch": 5.9882335418528445, "percentage": 59.88, "elapsed_time": "2:46:26", "remaining_time": "1:51:30", "throughput": 2321.69, "total_tokens": 23185424} {"current_steps": 40210, "total_steps": 67140, "loss": 0.7661, "lr": 2.0754829981369458e-05, "epoch": 5.988978254393804, "percentage": 59.89, "elapsed_time": "2:46:27", "remaining_time": "1:51:29", "throughput": 2321.72, "total_tokens": 23188368} {"current_steps": 40215, "total_steps": 67140, "loss": 0.6994, "lr": 2.074842566224596e-05, "epoch": 5.989722966934763, "percentage": 59.9, "elapsed_time": "2:46:28", "remaining_time": "1:51:27", "throughput": 2321.74, "total_tokens": 23191312} {"current_steps": 40220, "total_steps": 67140, "loss": 0.6774, "lr": 2.074202163042657e-05, "epoch": 5.990467679475723, "percentage": 59.9, "elapsed_time": "2:46:29", "remaining_time": "1:51:26", "throughput": 2321.79, "total_tokens": 23194448} {"current_steps": 40225, "total_steps": 67140, "loss": 0.621, "lr": 2.0735617886344043e-05, "epoch": 5.991212392016681, "percentage": 59.91, "elapsed_time": "2:46:31", "remaining_time": "1:51:25", "throughput": 2321.8, "total_tokens": 23197104} {"current_steps": 40230, "total_steps": 67140, "loss": 0.5841, "lr": 2.0729214430431118e-05, "epoch": 5.991957104557641, "percentage": 59.92, "elapsed_time": "2:46:32", "remaining_time": "1:51:23", "throughput": 2321.81, "total_tokens": 23199792} {"current_steps": 40235, "total_steps": 67140, "loss": 0.6784, "lr": 2.0722811263120523e-05, "epoch": 5.9927018170986, "percentage": 59.93, "elapsed_time": "2:46:33", "remaining_time": "1:51:22", "throughput": 2321.83, "total_tokens": 23202736} {"current_steps": 40240, "total_steps": 67140, "loss": 0.654, "lr": 2.071640838484495e-05, "epoch": 5.993446529639559, "percentage": 59.93, "elapsed_time": "2:46:34", "remaining_time": "1:51:21", "throughput": 2321.88, "total_tokens": 23206032} {"current_steps": 40245, "total_steps": 67140, "loss": 0.5425, "lr": 2.0710005796037078e-05, "epoch": 5.994191242180518, "percentage": 59.94, "elapsed_time": "2:46:35", "remaining_time": "1:51:19", "throughput": 2321.93, "total_tokens": 23209168} {"current_steps": 40250, "total_steps": 67140, "loss": 0.7345, "lr": 2.0703603497129584e-05, "epoch": 5.994935954721478, "percentage": 59.95, "elapsed_time": "2:46:36", "remaining_time": "1:51:18", "throughput": 2321.95, "total_tokens": 23211952} {"current_steps": 40255, "total_steps": 67140, "loss": 0.7222, "lr": 2.0697201488555087e-05, "epoch": 5.9956806672624365, "percentage": 59.96, "elapsed_time": "2:46:37", "remaining_time": "1:51:17", "throughput": 2321.97, "total_tokens": 23214832} {"current_steps": 40260, "total_steps": 67140, "loss": 0.7685, "lr": 2.0690799770746232e-05, "epoch": 5.996425379803396, "percentage": 59.96, "elapsed_time": "2:46:39", "remaining_time": "1:51:15", "throughput": 2322.0, "total_tokens": 23217776} {"current_steps": 40265, "total_steps": 67140, "loss": 0.3607, "lr": 2.06843983441356e-05, "epoch": 5.997170092344355, "percentage": 59.97, "elapsed_time": "2:46:40", "remaining_time": "1:51:14", "throughput": 2322.01, "total_tokens": 23220560} {"current_steps": 40270, "total_steps": 67140, "loss": 0.5077, "lr": 2.0677997209155785e-05, "epoch": 5.997914804885315, "percentage": 59.98, "elapsed_time": "2:46:41", "remaining_time": "1:51:13", "throughput": 2322.01, "total_tokens": 23223056} {"current_steps": 40275, "total_steps": 67140, "loss": 0.5968, "lr": 2.0671596366239343e-05, "epoch": 5.998659517426273, "percentage": 59.99, "elapsed_time": "2:46:42", "remaining_time": "1:51:11", "throughput": 2322.04, "total_tokens": 23225872} {"current_steps": 40280, "total_steps": 67140, "loss": 0.6494, "lr": 2.066519581581882e-05, "epoch": 5.999404229967233, "percentage": 59.99, "elapsed_time": "2:46:43", "remaining_time": "1:51:10", "throughput": 2322.06, "total_tokens": 23228752} {"current_steps": 40284, "total_steps": 67140, "eval_loss": 0.6619589328765869, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "2:47:58", "remaining_time": "1:51:59", "throughput": 2304.93, "total_tokens": 23230504} {"current_steps": 40285, "total_steps": 67140, "loss": 0.5724, "lr": 2.0658795558326743e-05, "epoch": 6.000148942508192, "percentage": 60.0, "elapsed_time": "2:48:00", "remaining_time": "1:52:00", "throughput": 2304.52, "total_tokens": 23231080} {"current_steps": 40290, "total_steps": 67140, "loss": 0.618, "lr": 2.065239559419561e-05, "epoch": 6.000893655049151, "percentage": 60.01, "elapsed_time": "2:48:01", "remaining_time": "1:51:58", "throughput": 2304.53, "total_tokens": 23233672} {"current_steps": 40295, "total_steps": 67140, "loss": 0.5271, "lr": 2.0645995923857902e-05, "epoch": 6.00163836759011, "percentage": 60.02, "elapsed_time": "2:48:02", "remaining_time": "1:51:57", "throughput": 2304.55, "total_tokens": 23236488} {"current_steps": 40300, "total_steps": 67140, "loss": 0.6336, "lr": 2.0639596547746104e-05, "epoch": 6.00238308013107, "percentage": 60.02, "elapsed_time": "2:48:04", "remaining_time": "1:51:56", "throughput": 2304.6, "total_tokens": 23239656} {"current_steps": 40305, "total_steps": 67140, "loss": 0.6084, "lr": 2.0633197466292633e-05, "epoch": 6.003127792672029, "percentage": 60.03, "elapsed_time": "2:48:05", "remaining_time": "1:51:54", "throughput": 2304.65, "total_tokens": 23242824} {"current_steps": 40310, "total_steps": 67140, "loss": 0.5745, "lr": 2.062679867992992e-05, "epoch": 6.003872505212988, "percentage": 60.04, "elapsed_time": "2:48:06", "remaining_time": "1:51:53", "throughput": 2304.67, "total_tokens": 23245704} {"current_steps": 40315, "total_steps": 67140, "loss": 0.5962, "lr": 2.062040018909037e-05, "epoch": 6.004617217753947, "percentage": 60.05, "elapsed_time": "2:48:07", "remaining_time": "1:51:52", "throughput": 2304.7, "total_tokens": 23248648} {"current_steps": 40320, "total_steps": 67140, "loss": 0.7518, "lr": 2.0614001994206378e-05, "epoch": 6.005361930294906, "percentage": 60.05, "elapsed_time": "2:48:08", "remaining_time": "1:51:50", "throughput": 2304.72, "total_tokens": 23251432} {"current_steps": 40325, "total_steps": 67140, "loss": 0.6322, "lr": 2.060760409571029e-05, "epoch": 6.006106642835865, "percentage": 60.06, "elapsed_time": "2:48:09", "remaining_time": "1:51:49", "throughput": 2304.74, "total_tokens": 23254312} {"current_steps": 40330, "total_steps": 67140, "loss": 0.5416, "lr": 2.0601206494034465e-05, "epoch": 6.006851355376824, "percentage": 60.07, "elapsed_time": "2:48:10", "remaining_time": "1:51:48", "throughput": 2304.78, "total_tokens": 23257352} {"current_steps": 40335, "total_steps": 67140, "loss": 0.7079, "lr": 2.0594809189611218e-05, "epoch": 6.007596067917784, "percentage": 60.08, "elapsed_time": "2:48:12", "remaining_time": "1:51:46", "throughput": 2304.81, "total_tokens": 23260264} {"current_steps": 40340, "total_steps": 67140, "loss": 0.6887, "lr": 2.058841218287287e-05, "epoch": 6.0083407804587425, "percentage": 60.08, "elapsed_time": "2:48:13", "remaining_time": "1:51:45", "throughput": 2304.82, "total_tokens": 23262920} {"current_steps": 40345, "total_steps": 67140, "loss": 0.5988, "lr": 2.0582015474251672e-05, "epoch": 6.009085492999702, "percentage": 60.09, "elapsed_time": "2:48:14", "remaining_time": "1:51:44", "throughput": 2304.83, "total_tokens": 23265640} {"current_steps": 40350, "total_steps": 67140, "loss": 0.5812, "lr": 2.0575619064179912e-05, "epoch": 6.009830205540661, "percentage": 60.1, "elapsed_time": "2:48:15", "remaining_time": "1:51:42", "throughput": 2304.85, "total_tokens": 23268424} {"current_steps": 40355, "total_steps": 67140, "loss": 0.557, "lr": 2.0569222953089827e-05, "epoch": 6.010574918081621, "percentage": 60.11, "elapsed_time": "2:48:16", "remaining_time": "1:51:41", "throughput": 2304.86, "total_tokens": 23271112} {"current_steps": 40360, "total_steps": 67140, "loss": 0.6664, "lr": 2.0562827141413637e-05, "epoch": 6.011319630622579, "percentage": 60.11, "elapsed_time": "2:48:17", "remaining_time": "1:51:40", "throughput": 2304.9, "total_tokens": 23274088} {"current_steps": 40365, "total_steps": 67140, "loss": 0.4929, "lr": 2.0556431629583557e-05, "epoch": 6.012064343163539, "percentage": 60.12, "elapsed_time": "2:48:18", "remaining_time": "1:51:38", "throughput": 2304.93, "total_tokens": 23277000} {"current_steps": 40370, "total_steps": 67140, "loss": 0.6692, "lr": 2.0550036418031752e-05, "epoch": 6.012809055704498, "percentage": 60.13, "elapsed_time": "2:48:19", "remaining_time": "1:51:37", "throughput": 2304.94, "total_tokens": 23279752} {"current_steps": 40375, "total_steps": 67140, "loss": 0.543, "lr": 2.0543641507190396e-05, "epoch": 6.013553768245457, "percentage": 60.14, "elapsed_time": "2:48:21", "remaining_time": "1:51:36", "throughput": 2304.99, "total_tokens": 23282888} {"current_steps": 40380, "total_steps": 67140, "loss": 0.6249, "lr": 2.0537246897491638e-05, "epoch": 6.014298480786416, "percentage": 60.14, "elapsed_time": "2:48:22", "remaining_time": "1:51:34", "throughput": 2305.02, "total_tokens": 23285832} {"current_steps": 40385, "total_steps": 67140, "loss": 0.6662, "lr": 2.0530852589367587e-05, "epoch": 6.015043193327376, "percentage": 60.15, "elapsed_time": "2:48:23", "remaining_time": "1:51:33", "throughput": 2305.04, "total_tokens": 23288776} {"current_steps": 40390, "total_steps": 67140, "loss": 0.5428, "lr": 2.052445858325034e-05, "epoch": 6.015787905868335, "percentage": 60.16, "elapsed_time": "2:48:24", "remaining_time": "1:51:32", "throughput": 2305.08, "total_tokens": 23291816} {"current_steps": 40395, "total_steps": 67140, "loss": 0.5584, "lr": 2.051806487957199e-05, "epoch": 6.016532618409294, "percentage": 60.17, "elapsed_time": "2:48:25", "remaining_time": "1:51:30", "throughput": 2305.12, "total_tokens": 23294824} {"current_steps": 40400, "total_steps": 67140, "loss": 0.5159, "lr": 2.0511671478764593e-05, "epoch": 6.017277330950253, "percentage": 60.17, "elapsed_time": "2:48:26", "remaining_time": "1:51:29", "throughput": 2305.15, "total_tokens": 23297768} {"current_steps": 40405, "total_steps": 67140, "loss": 0.6344, "lr": 2.0505278381260187e-05, "epoch": 6.018022043491213, "percentage": 60.18, "elapsed_time": "2:48:27", "remaining_time": "1:51:28", "throughput": 2305.18, "total_tokens": 23300648} {"current_steps": 40410, "total_steps": 67140, "loss": 0.5549, "lr": 2.0498885587490794e-05, "epoch": 6.018766756032171, "percentage": 60.19, "elapsed_time": "2:48:29", "remaining_time": "1:51:26", "throughput": 2305.22, "total_tokens": 23303720} {"current_steps": 40415, "total_steps": 67140, "loss": 0.6336, "lr": 2.0492493097888414e-05, "epoch": 6.019511468573131, "percentage": 60.2, "elapsed_time": "2:48:30", "remaining_time": "1:51:25", "throughput": 2305.23, "total_tokens": 23306536} {"current_steps": 40420, "total_steps": 67140, "loss": 0.7776, "lr": 2.0486100912885036e-05, "epoch": 6.02025618111409, "percentage": 60.2, "elapsed_time": "2:48:31", "remaining_time": "1:51:24", "throughput": 2305.26, "total_tokens": 23309384} {"current_steps": 40425, "total_steps": 67140, "loss": 0.7986, "lr": 2.047970903291259e-05, "epoch": 6.021000893655049, "percentage": 60.21, "elapsed_time": "2:48:32", "remaining_time": "1:51:22", "throughput": 2305.27, "total_tokens": 23312008} {"current_steps": 40430, "total_steps": 67140, "loss": 0.558, "lr": 2.0473317458403036e-05, "epoch": 6.021745606196008, "percentage": 60.22, "elapsed_time": "2:48:33", "remaining_time": "1:51:21", "throughput": 2305.29, "total_tokens": 23314792} {"current_steps": 40435, "total_steps": 67140, "loss": 0.6891, "lr": 2.0466926189788286e-05, "epoch": 6.022490318736968, "percentage": 60.22, "elapsed_time": "2:48:34", "remaining_time": "1:51:20", "throughput": 2305.3, "total_tokens": 23317352} {"current_steps": 40440, "total_steps": 67140, "loss": 0.6006, "lr": 2.0460535227500226e-05, "epoch": 6.023235031277927, "percentage": 60.23, "elapsed_time": "2:48:35", "remaining_time": "1:51:18", "throughput": 2305.32, "total_tokens": 23320136} {"current_steps": 40445, "total_steps": 67140, "loss": 0.5777, "lr": 2.045414457197074e-05, "epoch": 6.023979743818886, "percentage": 60.24, "elapsed_time": "2:48:36", "remaining_time": "1:51:17", "throughput": 2305.33, "total_tokens": 23322856} {"current_steps": 40450, "total_steps": 67140, "loss": 0.6875, "lr": 2.044775422363169e-05, "epoch": 6.024724456359845, "percentage": 60.25, "elapsed_time": "2:48:38", "remaining_time": "1:51:16", "throughput": 2305.36, "total_tokens": 23325736} {"current_steps": 40455, "total_steps": 67140, "loss": 0.5541, "lr": 2.0441364182914893e-05, "epoch": 6.025469168900805, "percentage": 60.25, "elapsed_time": "2:48:39", "remaining_time": "1:51:14", "throughput": 2305.4, "total_tokens": 23328840} {"current_steps": 40460, "total_steps": 67140, "loss": 0.5856, "lr": 2.0434974450252183e-05, "epoch": 6.026213881441763, "percentage": 60.26, "elapsed_time": "2:48:40", "remaining_time": "1:51:13", "throughput": 2305.43, "total_tokens": 23331816} {"current_steps": 40465, "total_steps": 67140, "loss": 0.4056, "lr": 2.042858502607533e-05, "epoch": 6.026958593982723, "percentage": 60.27, "elapsed_time": "2:48:41", "remaining_time": "1:51:12", "throughput": 2305.44, "total_tokens": 23334504} {"current_steps": 40470, "total_steps": 67140, "loss": 0.5394, "lr": 2.0422195910816116e-05, "epoch": 6.027703306523682, "percentage": 60.28, "elapsed_time": "2:48:42", "remaining_time": "1:51:10", "throughput": 2305.46, "total_tokens": 23337192} {"current_steps": 40475, "total_steps": 67140, "loss": 0.7492, "lr": 2.041580710490629e-05, "epoch": 6.0284480190646414, "percentage": 60.28, "elapsed_time": "2:48:43", "remaining_time": "1:51:09", "throughput": 2305.49, "total_tokens": 23340104} {"current_steps": 40480, "total_steps": 67140, "loss": 0.5629, "lr": 2.040941860877758e-05, "epoch": 6.0291927316056, "percentage": 60.29, "elapsed_time": "2:48:44", "remaining_time": "1:51:08", "throughput": 2305.51, "total_tokens": 23342888} {"current_steps": 40485, "total_steps": 67140, "loss": 0.5262, "lr": 2.04030304228617e-05, "epoch": 6.02993744414656, "percentage": 60.3, "elapsed_time": "2:48:46", "remaining_time": "1:51:06", "throughput": 2305.55, "total_tokens": 23346024} {"current_steps": 40490, "total_steps": 67140, "loss": 0.426, "lr": 2.039664254759033e-05, "epoch": 6.030682156687519, "percentage": 60.31, "elapsed_time": "2:48:47", "remaining_time": "1:51:05", "throughput": 2305.56, "total_tokens": 23348744} {"current_steps": 40495, "total_steps": 67140, "loss": 0.7222, "lr": 2.0390254983395146e-05, "epoch": 6.031426869228477, "percentage": 60.31, "elapsed_time": "2:48:48", "remaining_time": "1:51:04", "throughput": 2305.59, "total_tokens": 23351720} {"current_steps": 40500, "total_steps": 67140, "loss": 0.6985, "lr": 2.038386773070779e-05, "epoch": 6.032171581769437, "percentage": 60.32, "elapsed_time": "2:48:49", "remaining_time": "1:51:02", "throughput": 2305.62, "total_tokens": 23354728} {"current_steps": 40505, "total_steps": 67140, "loss": 0.565, "lr": 2.0377480789959882e-05, "epoch": 6.032916294310396, "percentage": 60.33, "elapsed_time": "2:48:50", "remaining_time": "1:51:01", "throughput": 2305.67, "total_tokens": 23357928} {"current_steps": 40510, "total_steps": 67140, "loss": 0.5642, "lr": 2.0371094161583026e-05, "epoch": 6.033661006851355, "percentage": 60.34, "elapsed_time": "2:48:51", "remaining_time": "1:51:00", "throughput": 2305.68, "total_tokens": 23360488} {"current_steps": 40515, "total_steps": 67140, "loss": 0.5919, "lr": 2.036470784600881e-05, "epoch": 6.034405719392314, "percentage": 60.34, "elapsed_time": "2:48:52", "remaining_time": "1:50:58", "throughput": 2305.69, "total_tokens": 23363240} {"current_steps": 40520, "total_steps": 67140, "loss": 0.5835, "lr": 2.035832184366879e-05, "epoch": 6.035150431933274, "percentage": 60.35, "elapsed_time": "2:48:54", "remaining_time": "1:50:57", "throughput": 2305.73, "total_tokens": 23366344} {"current_steps": 40525, "total_steps": 67140, "loss": 0.7463, "lr": 2.0351936154994503e-05, "epoch": 6.035895144474233, "percentage": 60.36, "elapsed_time": "2:48:55", "remaining_time": "1:50:56", "throughput": 2305.77, "total_tokens": 23369416} {"current_steps": 40530, "total_steps": 67140, "loss": 0.4929, "lr": 2.034555078041748e-05, "epoch": 6.036639857015192, "percentage": 60.37, "elapsed_time": "2:48:56", "remaining_time": "1:50:55", "throughput": 2305.78, "total_tokens": 23372168} {"current_steps": 40535, "total_steps": 67140, "loss": 0.6541, "lr": 2.0339165720369207e-05, "epoch": 6.037384569556151, "percentage": 60.37, "elapsed_time": "2:48:57", "remaining_time": "1:50:53", "throughput": 2305.83, "total_tokens": 23375336} {"current_steps": 40540, "total_steps": 67140, "loss": 0.2941, "lr": 2.0332780975281177e-05, "epoch": 6.038129282097111, "percentage": 60.38, "elapsed_time": "2:48:58", "remaining_time": "1:50:52", "throughput": 2305.83, "total_tokens": 23377864} {"current_steps": 40545, "total_steps": 67140, "loss": 0.6494, "lr": 2.0326396545584822e-05, "epoch": 6.038873994638069, "percentage": 60.39, "elapsed_time": "2:48:59", "remaining_time": "1:50:51", "throughput": 2305.86, "total_tokens": 23380840} {"current_steps": 40550, "total_steps": 67140, "loss": 0.6451, "lr": 2.032001243171159e-05, "epoch": 6.039618707179029, "percentage": 60.4, "elapsed_time": "2:49:00", "remaining_time": "1:50:49", "throughput": 2305.89, "total_tokens": 23383656} {"current_steps": 40555, "total_steps": 67140, "loss": 0.696, "lr": 2.0313628634092887e-05, "epoch": 6.040363419719988, "percentage": 60.4, "elapsed_time": "2:49:02", "remaining_time": "1:50:48", "throughput": 2305.93, "total_tokens": 23386792} {"current_steps": 40560, "total_steps": 67140, "loss": 0.5289, "lr": 2.030724515316011e-05, "epoch": 6.0411081322609474, "percentage": 60.41, "elapsed_time": "2:49:03", "remaining_time": "1:50:47", "throughput": 2305.94, "total_tokens": 23389480} {"current_steps": 40565, "total_steps": 67140, "loss": 0.4241, "lr": 2.0300861989344627e-05, "epoch": 6.041852844801906, "percentage": 60.42, "elapsed_time": "2:49:04", "remaining_time": "1:50:45", "throughput": 2305.97, "total_tokens": 23392424} {"current_steps": 40570, "total_steps": 67140, "loss": 0.6008, "lr": 2.0294479143077783e-05, "epoch": 6.042597557342866, "percentage": 60.43, "elapsed_time": "2:49:05", "remaining_time": "1:50:44", "throughput": 2306.0, "total_tokens": 23395336} {"current_steps": 40575, "total_steps": 67140, "loss": 0.6247, "lr": 2.0288096614790905e-05, "epoch": 6.043342269883825, "percentage": 60.43, "elapsed_time": "2:49:06", "remaining_time": "1:50:43", "throughput": 2306.02, "total_tokens": 23398152} {"current_steps": 40580, "total_steps": 67140, "loss": 0.3768, "lr": 2.0281714404915313e-05, "epoch": 6.044086982424784, "percentage": 60.44, "elapsed_time": "2:49:07", "remaining_time": "1:50:41", "throughput": 2306.05, "total_tokens": 23401064} {"current_steps": 40585, "total_steps": 67140, "loss": 0.6083, "lr": 2.027533251388227e-05, "epoch": 6.044831694965743, "percentage": 60.45, "elapsed_time": "2:49:08", "remaining_time": "1:50:40", "throughput": 2306.08, "total_tokens": 23404008} {"current_steps": 40590, "total_steps": 67140, "loss": 0.5169, "lr": 2.0268950942123046e-05, "epoch": 6.045576407506703, "percentage": 60.46, "elapsed_time": "2:49:10", "remaining_time": "1:50:39", "throughput": 2306.12, "total_tokens": 23407144} {"current_steps": 40595, "total_steps": 67140, "loss": 0.7292, "lr": 2.0262569690068882e-05, "epoch": 6.046321120047661, "percentage": 60.46, "elapsed_time": "2:49:11", "remaining_time": "1:50:37", "throughput": 2306.13, "total_tokens": 23409832} {"current_steps": 40600, "total_steps": 67140, "loss": 0.387, "lr": 2.0256188758151e-05, "epoch": 6.047065832588621, "percentage": 60.47, "elapsed_time": "2:49:12", "remaining_time": "1:50:36", "throughput": 2306.15, "total_tokens": 23412616} {"current_steps": 40605, "total_steps": 67140, "loss": 0.4972, "lr": 2.024980814680059e-05, "epoch": 6.04781054512958, "percentage": 60.48, "elapsed_time": "2:49:13", "remaining_time": "1:50:35", "throughput": 2306.16, "total_tokens": 23415272} {"current_steps": 40610, "total_steps": 67140, "loss": 0.5792, "lr": 2.0243427856448834e-05, "epoch": 6.0485552576705395, "percentage": 60.49, "elapsed_time": "2:49:14", "remaining_time": "1:50:33", "throughput": 2306.2, "total_tokens": 23418280} {"current_steps": 40615, "total_steps": 67140, "loss": 0.8554, "lr": 2.0237047887526887e-05, "epoch": 6.049299970211498, "percentage": 60.49, "elapsed_time": "2:49:15", "remaining_time": "1:50:32", "throughput": 2306.23, "total_tokens": 23421192} {"current_steps": 40620, "total_steps": 67140, "loss": 0.6489, "lr": 2.0230668240465886e-05, "epoch": 6.050044682752458, "percentage": 60.5, "elapsed_time": "2:49:16", "remaining_time": "1:50:31", "throughput": 2306.25, "total_tokens": 23424072} {"current_steps": 40625, "total_steps": 67140, "loss": 0.7566, "lr": 2.0224288915696924e-05, "epoch": 6.050789395293417, "percentage": 60.51, "elapsed_time": "2:49:17", "remaining_time": "1:50:29", "throughput": 2306.29, "total_tokens": 23427080} {"current_steps": 40630, "total_steps": 67140, "loss": 0.5814, "lr": 2.0217909913651102e-05, "epoch": 6.051534107834376, "percentage": 60.52, "elapsed_time": "2:49:19", "remaining_time": "1:50:28", "throughput": 2306.31, "total_tokens": 23429928} {"current_steps": 40635, "total_steps": 67140, "loss": 0.5632, "lr": 2.0211531234759487e-05, "epoch": 6.052278820375335, "percentage": 60.52, "elapsed_time": "2:49:20", "remaining_time": "1:50:27", "throughput": 2306.31, "total_tokens": 23432456} {"current_steps": 40640, "total_steps": 67140, "loss": 0.5436, "lr": 2.020515287945312e-05, "epoch": 6.053023532916295, "percentage": 60.53, "elapsed_time": "2:49:21", "remaining_time": "1:50:25", "throughput": 2306.34, "total_tokens": 23435432} {"current_steps": 40645, "total_steps": 67140, "loss": 0.5899, "lr": 2.0198774848163027e-05, "epoch": 6.0537682454572534, "percentage": 60.54, "elapsed_time": "2:49:22", "remaining_time": "1:50:24", "throughput": 2306.36, "total_tokens": 23438216} {"current_steps": 40650, "total_steps": 67140, "loss": 0.5469, "lr": 2.0192397141320212e-05, "epoch": 6.054512957998213, "percentage": 60.55, "elapsed_time": "2:49:23", "remaining_time": "1:50:23", "throughput": 2306.39, "total_tokens": 23441192} {"current_steps": 40655, "total_steps": 67140, "loss": 0.6279, "lr": 2.018601975935565e-05, "epoch": 6.055257670539172, "percentage": 60.55, "elapsed_time": "2:49:24", "remaining_time": "1:50:21", "throughput": 2306.42, "total_tokens": 23444040} {"current_steps": 40660, "total_steps": 67140, "loss": 0.5026, "lr": 2.017964270270031e-05, "epoch": 6.0560023830801315, "percentage": 60.56, "elapsed_time": "2:49:25", "remaining_time": "1:50:20", "throughput": 2306.42, "total_tokens": 23446568} {"current_steps": 40665, "total_steps": 67140, "loss": 0.6005, "lr": 2.0173265971785108e-05, "epoch": 6.05674709562109, "percentage": 60.57, "elapsed_time": "2:49:26", "remaining_time": "1:50:19", "throughput": 2306.44, "total_tokens": 23449384} {"current_steps": 40670, "total_steps": 67140, "loss": 0.7546, "lr": 2.0166889567040973e-05, "epoch": 6.057491808162049, "percentage": 60.57, "elapsed_time": "2:49:28", "remaining_time": "1:50:17", "throughput": 2306.46, "total_tokens": 23452232} {"current_steps": 40675, "total_steps": 67140, "loss": 0.5355, "lr": 2.0160513488898784e-05, "epoch": 6.058236520703009, "percentage": 60.58, "elapsed_time": "2:49:29", "remaining_time": "1:50:16", "throughput": 2306.49, "total_tokens": 23455080} {"current_steps": 40680, "total_steps": 67140, "loss": 0.3746, "lr": 2.0154137737789426e-05, "epoch": 6.058981233243967, "percentage": 60.59, "elapsed_time": "2:49:30", "remaining_time": "1:50:15", "throughput": 2306.52, "total_tokens": 23457992} {"current_steps": 40685, "total_steps": 67140, "loss": 0.5846, "lr": 2.0147762314143727e-05, "epoch": 6.059725945784927, "percentage": 60.6, "elapsed_time": "2:49:31", "remaining_time": "1:50:13", "throughput": 2306.53, "total_tokens": 23460616} {"current_steps": 40690, "total_steps": 67140, "loss": 0.6169, "lr": 2.0141387218392525e-05, "epoch": 6.060470658325886, "percentage": 60.6, "elapsed_time": "2:49:32", "remaining_time": "1:50:12", "throughput": 2306.56, "total_tokens": 23463528} {"current_steps": 40695, "total_steps": 67140, "loss": 0.6815, "lr": 2.0135012450966632e-05, "epoch": 6.0612153708668455, "percentage": 60.61, "elapsed_time": "2:49:33", "remaining_time": "1:50:11", "throughput": 2306.59, "total_tokens": 23466664} {"current_steps": 40700, "total_steps": 67140, "loss": 0.3843, "lr": 2.0128638012296817e-05, "epoch": 6.061960083407804, "percentage": 60.62, "elapsed_time": "2:49:34", "remaining_time": "1:50:09", "throughput": 2306.61, "total_tokens": 23469416} {"current_steps": 40705, "total_steps": 67140, "loss": 0.5734, "lr": 2.0122263902813832e-05, "epoch": 6.062704795948764, "percentage": 60.63, "elapsed_time": "2:49:36", "remaining_time": "1:50:08", "throughput": 2306.66, "total_tokens": 23472680} {"current_steps": 40710, "total_steps": 67140, "loss": 0.5306, "lr": 2.011589012294842e-05, "epoch": 6.063449508489723, "percentage": 60.63, "elapsed_time": "2:49:37", "remaining_time": "1:50:07", "throughput": 2306.69, "total_tokens": 23475688} {"current_steps": 40715, "total_steps": 67140, "loss": 0.564, "lr": 2.01095166731313e-05, "epoch": 6.064194221030682, "percentage": 60.64, "elapsed_time": "2:49:38", "remaining_time": "1:50:06", "throughput": 2306.74, "total_tokens": 23478920} {"current_steps": 40720, "total_steps": 67140, "loss": 0.6007, "lr": 2.0103143553793158e-05, "epoch": 6.064938933571641, "percentage": 60.65, "elapsed_time": "2:49:39", "remaining_time": "1:50:04", "throughput": 2306.77, "total_tokens": 23481832} {"current_steps": 40725, "total_steps": 67140, "loss": 0.5997, "lr": 2.0096770765364665e-05, "epoch": 6.065683646112601, "percentage": 60.66, "elapsed_time": "2:49:40", "remaining_time": "1:50:03", "throughput": 2306.79, "total_tokens": 23484680} {"current_steps": 40730, "total_steps": 67140, "loss": 0.7244, "lr": 2.009039830827647e-05, "epoch": 6.0664283586535594, "percentage": 60.66, "elapsed_time": "2:49:41", "remaining_time": "1:50:02", "throughput": 2306.82, "total_tokens": 23487688} {"current_steps": 40735, "total_steps": 67140, "loss": 0.6317, "lr": 2.0084026182959195e-05, "epoch": 6.067173071194519, "percentage": 60.67, "elapsed_time": "2:49:42", "remaining_time": "1:50:00", "throughput": 2306.84, "total_tokens": 23490472} {"current_steps": 40740, "total_steps": 67140, "loss": 0.5555, "lr": 2.0077654389843455e-05, "epoch": 6.067917783735478, "percentage": 60.68, "elapsed_time": "2:49:44", "remaining_time": "1:49:59", "throughput": 2306.86, "total_tokens": 23493256} {"current_steps": 40745, "total_steps": 67140, "loss": 0.5083, "lr": 2.0071282929359802e-05, "epoch": 6.0686624962764375, "percentage": 60.69, "elapsed_time": "2:49:45", "remaining_time": "1:49:58", "throughput": 2306.88, "total_tokens": 23496072} {"current_steps": 40750, "total_steps": 67140, "loss": 0.5066, "lr": 2.0064911801938822e-05, "epoch": 6.069407208817396, "percentage": 60.69, "elapsed_time": "2:49:46", "remaining_time": "1:49:56", "throughput": 2306.91, "total_tokens": 23499048} {"current_steps": 40755, "total_steps": 67140, "loss": 0.7797, "lr": 2.0058541008011028e-05, "epoch": 6.070151921358356, "percentage": 60.7, "elapsed_time": "2:49:47", "remaining_time": "1:49:55", "throughput": 2306.93, "total_tokens": 23501736} {"current_steps": 40760, "total_steps": 67140, "loss": 0.6252, "lr": 2.0052170548006944e-05, "epoch": 6.070896633899315, "percentage": 60.71, "elapsed_time": "2:49:48", "remaining_time": "1:49:54", "throughput": 2306.95, "total_tokens": 23504584} {"current_steps": 40765, "total_steps": 67140, "loss": 0.5202, "lr": 2.0045800422357066e-05, "epoch": 6.071641346440274, "percentage": 60.72, "elapsed_time": "2:49:49", "remaining_time": "1:49:52", "throughput": 2306.96, "total_tokens": 23507272} {"current_steps": 40770, "total_steps": 67140, "loss": 0.565, "lr": 2.003943063149184e-05, "epoch": 6.072386058981233, "percentage": 60.72, "elapsed_time": "2:49:50", "remaining_time": "1:49:51", "throughput": 2307.0, "total_tokens": 23510408} {"current_steps": 40775, "total_steps": 67140, "loss": 0.6543, "lr": 2.003306117584173e-05, "epoch": 6.073130771522193, "percentage": 60.73, "elapsed_time": "2:49:51", "remaining_time": "1:49:50", "throughput": 2307.02, "total_tokens": 23513192} {"current_steps": 40780, "total_steps": 67140, "loss": 0.5203, "lr": 2.0026692055837155e-05, "epoch": 6.0738754840631515, "percentage": 60.74, "elapsed_time": "2:49:53", "remaining_time": "1:49:48", "throughput": 2307.06, "total_tokens": 23516200} {"current_steps": 40785, "total_steps": 67140, "loss": 0.5696, "lr": 2.0020323271908518e-05, "epoch": 6.074620196604111, "percentage": 60.75, "elapsed_time": "2:49:54", "remaining_time": "1:49:47", "throughput": 2307.08, "total_tokens": 23519080} {"current_steps": 40790, "total_steps": 67140, "loss": 0.5242, "lr": 2.0013954824486176e-05, "epoch": 6.07536490914507, "percentage": 60.75, "elapsed_time": "2:49:55", "remaining_time": "1:49:46", "throughput": 2307.1, "total_tokens": 23521768} {"current_steps": 40795, "total_steps": 67140, "loss": 0.5715, "lr": 2.0007586714000497e-05, "epoch": 6.0761096216860295, "percentage": 60.76, "elapsed_time": "2:49:56", "remaining_time": "1:49:44", "throughput": 2307.12, "total_tokens": 23524712} {"current_steps": 40800, "total_steps": 67140, "loss": 0.4494, "lr": 2.000121894088181e-05, "epoch": 6.076854334226988, "percentage": 60.77, "elapsed_time": "2:49:57", "remaining_time": "1:49:43", "throughput": 2307.16, "total_tokens": 23527816} {"current_steps": 40805, "total_steps": 67140, "loss": 0.5204, "lr": 1.9994851505560424e-05, "epoch": 6.077599046767948, "percentage": 60.78, "elapsed_time": "2:49:58", "remaining_time": "1:49:42", "throughput": 2307.19, "total_tokens": 23530760} {"current_steps": 40810, "total_steps": 67140, "loss": 0.566, "lr": 1.9988484408466622e-05, "epoch": 6.078343759308907, "percentage": 60.78, "elapsed_time": "2:49:59", "remaining_time": "1:49:40", "throughput": 2307.21, "total_tokens": 23533576} {"current_steps": 40815, "total_steps": 67140, "loss": 0.6186, "lr": 1.9982117650030674e-05, "epoch": 6.079088471849866, "percentage": 60.79, "elapsed_time": "2:50:01", "remaining_time": "1:49:39", "throughput": 2307.25, "total_tokens": 23536712} {"current_steps": 40820, "total_steps": 67140, "loss": 0.6413, "lr": 1.9975751230682808e-05, "epoch": 6.079833184390825, "percentage": 60.8, "elapsed_time": "2:50:02", "remaining_time": "1:49:38", "throughput": 2307.28, "total_tokens": 23539592} {"current_steps": 40825, "total_steps": 67140, "loss": 0.7, "lr": 1.996938515085326e-05, "epoch": 6.080577896931785, "percentage": 60.81, "elapsed_time": "2:50:03", "remaining_time": "1:49:36", "throughput": 2307.31, "total_tokens": 23542536} {"current_steps": 40830, "total_steps": 67140, "loss": 0.7742, "lr": 1.9963019410972194e-05, "epoch": 6.0813226094727435, "percentage": 60.81, "elapsed_time": "2:50:04", "remaining_time": "1:49:35", "throughput": 2307.33, "total_tokens": 23545320} {"current_steps": 40835, "total_steps": 67140, "loss": 0.5693, "lr": 1.9956654011469808e-05, "epoch": 6.082067322013703, "percentage": 60.82, "elapsed_time": "2:50:05", "remaining_time": "1:49:34", "throughput": 2307.34, "total_tokens": 23548008} {"current_steps": 40840, "total_steps": 67140, "loss": 0.5588, "lr": 1.995028895277623e-05, "epoch": 6.082812034554662, "percentage": 60.83, "elapsed_time": "2:50:06", "remaining_time": "1:49:32", "throughput": 2307.36, "total_tokens": 23550728} {"current_steps": 40845, "total_steps": 67140, "loss": 0.7163, "lr": 1.9943924235321605e-05, "epoch": 6.083556747095621, "percentage": 60.84, "elapsed_time": "2:50:07", "remaining_time": "1:49:31", "throughput": 2307.39, "total_tokens": 23553768} {"current_steps": 40850, "total_steps": 67140, "loss": 0.7456, "lr": 1.9937559859536016e-05, "epoch": 6.08430145963658, "percentage": 60.84, "elapsed_time": "2:50:09", "remaining_time": "1:49:30", "throughput": 2307.4, "total_tokens": 23556488} {"current_steps": 40855, "total_steps": 67140, "loss": 0.7107, "lr": 1.9931195825849544e-05, "epoch": 6.085046172177539, "percentage": 60.85, "elapsed_time": "2:50:10", "remaining_time": "1:49:28", "throughput": 2307.4, "total_tokens": 23559048} {"current_steps": 40860, "total_steps": 67140, "loss": 0.6105, "lr": 1.9924832134692262e-05, "epoch": 6.085790884718499, "percentage": 60.86, "elapsed_time": "2:50:11", "remaining_time": "1:49:27", "throughput": 2307.42, "total_tokens": 23561768} {"current_steps": 40865, "total_steps": 67140, "loss": 0.5639, "lr": 1.991846878649419e-05, "epoch": 6.0865355972594575, "percentage": 60.87, "elapsed_time": "2:50:12", "remaining_time": "1:49:26", "throughput": 2307.45, "total_tokens": 23564680} {"current_steps": 40870, "total_steps": 67140, "loss": 0.7965, "lr": 1.991210578168533e-05, "epoch": 6.087280309800417, "percentage": 60.87, "elapsed_time": "2:50:13", "remaining_time": "1:49:24", "throughput": 2307.48, "total_tokens": 23567656} {"current_steps": 40875, "total_steps": 67140, "loss": 0.624, "lr": 1.9905743120695675e-05, "epoch": 6.088025022341376, "percentage": 60.88, "elapsed_time": "2:50:14", "remaining_time": "1:49:23", "throughput": 2307.53, "total_tokens": 23570888} {"current_steps": 40880, "total_steps": 67140, "loss": 0.3843, "lr": 1.9899380803955193e-05, "epoch": 6.0887697348823355, "percentage": 60.89, "elapsed_time": "2:50:15", "remaining_time": "1:49:22", "throughput": 2307.55, "total_tokens": 23573736} {"current_steps": 40885, "total_steps": 67140, "loss": 0.5119, "lr": 1.9893018831893816e-05, "epoch": 6.089514447423294, "percentage": 60.9, "elapsed_time": "2:50:17", "remaining_time": "1:49:21", "throughput": 2307.56, "total_tokens": 23576392} {"current_steps": 40890, "total_steps": 67140, "loss": 0.513, "lr": 1.9886657204941458e-05, "epoch": 6.090259159964254, "percentage": 60.9, "elapsed_time": "2:50:18", "remaining_time": "1:49:19", "throughput": 2307.58, "total_tokens": 23579176} {"current_steps": 40895, "total_steps": 67140, "loss": 0.54, "lr": 1.9880295923528025e-05, "epoch": 6.091003872505213, "percentage": 60.91, "elapsed_time": "2:50:19", "remaining_time": "1:49:18", "throughput": 2307.6, "total_tokens": 23582024} {"current_steps": 40900, "total_steps": 67140, "loss": 0.7043, "lr": 1.9873934988083373e-05, "epoch": 6.091748585046172, "percentage": 60.92, "elapsed_time": "2:50:20", "remaining_time": "1:49:17", "throughput": 2307.63, "total_tokens": 23584968} {"current_steps": 40905, "total_steps": 67140, "loss": 0.5861, "lr": 1.9867574399037365e-05, "epoch": 6.092493297587131, "percentage": 60.92, "elapsed_time": "2:50:21", "remaining_time": "1:49:15", "throughput": 2307.66, "total_tokens": 23587976} {"current_steps": 40910, "total_steps": 67140, "loss": 0.7356, "lr": 1.98612141568198e-05, "epoch": 6.093238010128091, "percentage": 60.93, "elapsed_time": "2:50:22", "remaining_time": "1:49:14", "throughput": 2307.7, "total_tokens": 23590952} {"current_steps": 40915, "total_steps": 67140, "loss": 0.5542, "lr": 1.9854854261860496e-05, "epoch": 6.0939827226690495, "percentage": 60.94, "elapsed_time": "2:50:23", "remaining_time": "1:49:13", "throughput": 2307.72, "total_tokens": 23593736} {"current_steps": 40920, "total_steps": 67140, "loss": 0.5857, "lr": 1.9848494714589214e-05, "epoch": 6.094727435210009, "percentage": 60.95, "elapsed_time": "2:50:24", "remaining_time": "1:49:11", "throughput": 2307.74, "total_tokens": 23596584} {"current_steps": 40925, "total_steps": 67140, "loss": 0.7014, "lr": 1.9842135515435717e-05, "epoch": 6.095472147750968, "percentage": 60.95, "elapsed_time": "2:50:26", "remaining_time": "1:49:10", "throughput": 2307.76, "total_tokens": 23599464} {"current_steps": 40930, "total_steps": 67140, "loss": 0.6452, "lr": 1.9835776664829735e-05, "epoch": 6.0962168602919276, "percentage": 60.96, "elapsed_time": "2:50:27", "remaining_time": "1:49:09", "throughput": 2307.8, "total_tokens": 23602408} {"current_steps": 40935, "total_steps": 67140, "loss": 0.5895, "lr": 1.9829418163200968e-05, "epoch": 6.096961572832886, "percentage": 60.97, "elapsed_time": "2:50:28", "remaining_time": "1:49:07", "throughput": 2307.82, "total_tokens": 23605224} {"current_steps": 40940, "total_steps": 67140, "loss": 0.564, "lr": 1.9823060010979096e-05, "epoch": 6.097706285373846, "percentage": 60.98, "elapsed_time": "2:50:29", "remaining_time": "1:49:06", "throughput": 2307.84, "total_tokens": 23608040} {"current_steps": 40945, "total_steps": 67140, "loss": 0.628, "lr": 1.9816702208593795e-05, "epoch": 6.098450997914805, "percentage": 60.98, "elapsed_time": "2:50:30", "remaining_time": "1:49:05", "throughput": 2307.87, "total_tokens": 23611048} {"current_steps": 40950, "total_steps": 67140, "loss": 0.5597, "lr": 1.9810344756474676e-05, "epoch": 6.099195710455764, "percentage": 60.99, "elapsed_time": "2:50:31", "remaining_time": "1:49:03", "throughput": 2307.88, "total_tokens": 23613736} {"current_steps": 40955, "total_steps": 67140, "loss": 0.643, "lr": 1.9803987655051354e-05, "epoch": 6.099940422996723, "percentage": 61.0, "elapsed_time": "2:50:32", "remaining_time": "1:49:02", "throughput": 2307.91, "total_tokens": 23616648} {"current_steps": 40960, "total_steps": 67140, "loss": 0.7114, "lr": 1.979763090475342e-05, "epoch": 6.100685135537683, "percentage": 61.01, "elapsed_time": "2:50:34", "remaining_time": "1:49:01", "throughput": 2307.93, "total_tokens": 23619432} {"current_steps": 40965, "total_steps": 67140, "loss": 0.4881, "lr": 1.979127450601045e-05, "epoch": 6.1014298480786415, "percentage": 61.01, "elapsed_time": "2:50:35", "remaining_time": "1:48:59", "throughput": 2307.95, "total_tokens": 23622280} {"current_steps": 40970, "total_steps": 67140, "loss": 0.6102, "lr": 1.978491845925196e-05, "epoch": 6.102174560619601, "percentage": 61.02, "elapsed_time": "2:50:36", "remaining_time": "1:48:58", "throughput": 2307.99, "total_tokens": 23625384} {"current_steps": 40975, "total_steps": 67140, "loss": 0.6843, "lr": 1.9778562764907475e-05, "epoch": 6.10291927316056, "percentage": 61.03, "elapsed_time": "2:50:37", "remaining_time": "1:48:57", "throughput": 2308.03, "total_tokens": 23628488} {"current_steps": 40980, "total_steps": 67140, "loss": 0.4945, "lr": 1.97722074234065e-05, "epoch": 6.10366398570152, "percentage": 61.04, "elapsed_time": "2:50:38", "remaining_time": "1:48:55", "throughput": 2308.07, "total_tokens": 23631560} {"current_steps": 40985, "total_steps": 67140, "loss": 0.5485, "lr": 1.97658524351785e-05, "epoch": 6.104408698242478, "percentage": 61.04, "elapsed_time": "2:50:39", "remaining_time": "1:48:54", "throughput": 2308.1, "total_tokens": 23634568} {"current_steps": 40990, "total_steps": 67140, "loss": 0.5859, "lr": 1.9759497800652897e-05, "epoch": 6.105153410783438, "percentage": 61.05, "elapsed_time": "2:50:40", "remaining_time": "1:48:53", "throughput": 2308.13, "total_tokens": 23637416} {"current_steps": 40995, "total_steps": 67140, "loss": 0.6359, "lr": 1.975314352025913e-05, "epoch": 6.105898123324397, "percentage": 61.06, "elapsed_time": "2:50:42", "remaining_time": "1:48:52", "throughput": 2308.16, "total_tokens": 23640488} {"current_steps": 41000, "total_steps": 67140, "loss": 0.5393, "lr": 1.9746789594426593e-05, "epoch": 6.106642835865356, "percentage": 61.07, "elapsed_time": "2:50:43", "remaining_time": "1:48:50", "throughput": 2308.22, "total_tokens": 23643848} {"current_steps": 41005, "total_steps": 67140, "loss": 0.6739, "lr": 1.9740436023584653e-05, "epoch": 6.107387548406315, "percentage": 61.07, "elapsed_time": "2:50:44", "remaining_time": "1:48:49", "throughput": 2308.22, "total_tokens": 23646440} {"current_steps": 41010, "total_steps": 67140, "loss": 0.5173, "lr": 1.973408280816267e-05, "epoch": 6.108132260947274, "percentage": 61.08, "elapsed_time": "2:50:45", "remaining_time": "1:48:48", "throughput": 2308.24, "total_tokens": 23649224} {"current_steps": 41015, "total_steps": 67140, "loss": 0.6476, "lr": 1.9727729948589955e-05, "epoch": 6.1088769734882336, "percentage": 61.09, "elapsed_time": "2:50:46", "remaining_time": "1:48:46", "throughput": 2308.27, "total_tokens": 23652072} {"current_steps": 41020, "total_steps": 67140, "loss": 0.6922, "lr": 1.9721377445295813e-05, "epoch": 6.109621686029192, "percentage": 61.1, "elapsed_time": "2:50:47", "remaining_time": "1:48:45", "throughput": 2308.28, "total_tokens": 23654760} {"current_steps": 41025, "total_steps": 67140, "loss": 0.6501, "lr": 1.9715025298709532e-05, "epoch": 6.110366398570152, "percentage": 61.1, "elapsed_time": "2:50:48", "remaining_time": "1:48:44", "throughput": 2308.31, "total_tokens": 23657672} {"current_steps": 41030, "total_steps": 67140, "loss": 0.639, "lr": 1.970867350926035e-05, "epoch": 6.111111111111111, "percentage": 61.11, "elapsed_time": "2:50:50", "remaining_time": "1:48:42", "throughput": 2308.33, "total_tokens": 23660456} {"current_steps": 41035, "total_steps": 67140, "loss": 0.8587, "lr": 1.9702322077377493e-05, "epoch": 6.11185582365207, "percentage": 61.12, "elapsed_time": "2:50:51", "remaining_time": "1:48:41", "throughput": 2308.33, "total_tokens": 23662888} {"current_steps": 41040, "total_steps": 67140, "loss": 0.5225, "lr": 1.9695971003490175e-05, "epoch": 6.112600536193029, "percentage": 61.13, "elapsed_time": "2:50:52", "remaining_time": "1:48:40", "throughput": 2308.35, "total_tokens": 23665800} {"current_steps": 41045, "total_steps": 67140, "loss": 0.4842, "lr": 1.9689620288027574e-05, "epoch": 6.113345248733989, "percentage": 61.13, "elapsed_time": "2:50:53", "remaining_time": "1:48:38", "throughput": 2308.37, "total_tokens": 23668616} {"current_steps": 41050, "total_steps": 67140, "loss": 0.6495, "lr": 1.9683269931418842e-05, "epoch": 6.1140899612749475, "percentage": 61.14, "elapsed_time": "2:50:54", "remaining_time": "1:48:37", "throughput": 2308.4, "total_tokens": 23671496} {"current_steps": 41055, "total_steps": 67140, "loss": 0.615, "lr": 1.9676919934093108e-05, "epoch": 6.114834673815907, "percentage": 61.15, "elapsed_time": "2:50:55", "remaining_time": "1:48:36", "throughput": 2308.42, "total_tokens": 23674408} {"current_steps": 41060, "total_steps": 67140, "loss": 0.5503, "lr": 1.9670570296479488e-05, "epoch": 6.115579386356866, "percentage": 61.16, "elapsed_time": "2:50:56", "remaining_time": "1:48:34", "throughput": 2308.45, "total_tokens": 23677384} {"current_steps": 41065, "total_steps": 67140, "loss": 0.5786, "lr": 1.9664221019007065e-05, "epoch": 6.116324098897826, "percentage": 61.16, "elapsed_time": "2:50:57", "remaining_time": "1:48:33", "throughput": 2308.49, "total_tokens": 23680392} {"current_steps": 41070, "total_steps": 67140, "loss": 0.5613, "lr": 1.9657872102104882e-05, "epoch": 6.117068811438784, "percentage": 61.17, "elapsed_time": "2:50:59", "remaining_time": "1:48:32", "throughput": 2308.49, "total_tokens": 23682888} {"current_steps": 41075, "total_steps": 67140, "loss": 0.5061, "lr": 1.9651523546201982e-05, "epoch": 6.117813523979744, "percentage": 61.18, "elapsed_time": "2:51:00", "remaining_time": "1:48:30", "throughput": 2308.51, "total_tokens": 23685736} {"current_steps": 41080, "total_steps": 67140, "loss": 0.5478, "lr": 1.9645175351727383e-05, "epoch": 6.118558236520703, "percentage": 61.19, "elapsed_time": "2:51:01", "remaining_time": "1:48:29", "throughput": 2308.55, "total_tokens": 23688872} {"current_steps": 41085, "total_steps": 67140, "loss": 0.7478, "lr": 1.9638827519110057e-05, "epoch": 6.119302949061662, "percentage": 61.19, "elapsed_time": "2:51:02", "remaining_time": "1:48:28", "throughput": 2308.59, "total_tokens": 23691912} {"current_steps": 41090, "total_steps": 67140, "loss": 0.694, "lr": 1.9632480048778968e-05, "epoch": 6.120047661602621, "percentage": 61.2, "elapsed_time": "2:51:03", "remaining_time": "1:48:26", "throughput": 2308.6, "total_tokens": 23694600} {"current_steps": 41095, "total_steps": 67140, "loss": 0.5382, "lr": 1.962613294116306e-05, "epoch": 6.120792374143581, "percentage": 61.21, "elapsed_time": "2:51:04", "remaining_time": "1:48:25", "throughput": 2308.64, "total_tokens": 23697768} {"current_steps": 41100, "total_steps": 67140, "loss": 0.6571, "lr": 1.9619786196691238e-05, "epoch": 6.1215370866845396, "percentage": 61.22, "elapsed_time": "2:51:05", "remaining_time": "1:48:24", "throughput": 2308.65, "total_tokens": 23700424} {"current_steps": 41105, "total_steps": 67140, "loss": 0.4823, "lr": 1.9613439815792394e-05, "epoch": 6.122281799225499, "percentage": 61.22, "elapsed_time": "2:51:07", "remaining_time": "1:48:22", "throughput": 2308.69, "total_tokens": 23703528} {"current_steps": 41110, "total_steps": 67140, "loss": 0.5358, "lr": 1.9607093798895382e-05, "epoch": 6.123026511766458, "percentage": 61.23, "elapsed_time": "2:51:08", "remaining_time": "1:48:21", "throughput": 2308.72, "total_tokens": 23706440} {"current_steps": 41115, "total_steps": 67140, "loss": 0.5265, "lr": 1.960074814642905e-05, "epoch": 6.123771224307418, "percentage": 61.24, "elapsed_time": "2:51:09", "remaining_time": "1:48:20", "throughput": 2308.74, "total_tokens": 23709224} {"current_steps": 41120, "total_steps": 67140, "loss": 0.5727, "lr": 1.95944028588222e-05, "epoch": 6.124515936848376, "percentage": 61.25, "elapsed_time": "2:51:10", "remaining_time": "1:48:18", "throughput": 2308.75, "total_tokens": 23711848} {"current_steps": 41125, "total_steps": 67140, "loss": 0.5447, "lr": 1.9588057936503627e-05, "epoch": 6.125260649389336, "percentage": 61.25, "elapsed_time": "2:51:11", "remaining_time": "1:48:17", "throughput": 2308.78, "total_tokens": 23714888} {"current_steps": 41130, "total_steps": 67140, "loss": 0.5898, "lr": 1.95817133799021e-05, "epoch": 6.126005361930295, "percentage": 61.26, "elapsed_time": "2:51:12", "remaining_time": "1:48:16", "throughput": 2308.8, "total_tokens": 23717576} {"current_steps": 41135, "total_steps": 67140, "loss": 0.5306, "lr": 1.957536918944635e-05, "epoch": 6.126750074471254, "percentage": 61.27, "elapsed_time": "2:51:13", "remaining_time": "1:48:15", "throughput": 2308.83, "total_tokens": 23720680} {"current_steps": 41140, "total_steps": 67140, "loss": 0.6328, "lr": 1.9569025365565095e-05, "epoch": 6.127494787012213, "percentage": 61.27, "elapsed_time": "2:51:15", "remaining_time": "1:48:13", "throughput": 2308.86, "total_tokens": 23723624} {"current_steps": 41145, "total_steps": 67140, "loss": 0.5453, "lr": 1.9562681908687035e-05, "epoch": 6.128239499553173, "percentage": 61.28, "elapsed_time": "2:51:16", "remaining_time": "1:48:12", "throughput": 2308.88, "total_tokens": 23726408} {"current_steps": 41150, "total_steps": 67140, "loss": 0.5483, "lr": 1.955633881924082e-05, "epoch": 6.128984212094132, "percentage": 61.29, "elapsed_time": "2:51:17", "remaining_time": "1:48:11", "throughput": 2308.89, "total_tokens": 23729064} {"current_steps": 41155, "total_steps": 67140, "loss": 0.5026, "lr": 1.954999609765509e-05, "epoch": 6.129728924635091, "percentage": 61.3, "elapsed_time": "2:51:18", "remaining_time": "1:48:09", "throughput": 2308.93, "total_tokens": 23732008} {"current_steps": 41160, "total_steps": 67140, "loss": 0.6131, "lr": 1.9543653744358465e-05, "epoch": 6.13047363717605, "percentage": 61.3, "elapsed_time": "2:51:19", "remaining_time": "1:48:08", "throughput": 2308.95, "total_tokens": 23734920} {"current_steps": 41165, "total_steps": 67140, "loss": 0.7448, "lr": 1.953731175977954e-05, "epoch": 6.13121834971701, "percentage": 61.31, "elapsed_time": "2:51:20", "remaining_time": "1:48:07", "throughput": 2308.98, "total_tokens": 23737896} {"current_steps": 41170, "total_steps": 67140, "loss": 0.606, "lr": 1.9530970144346874e-05, "epoch": 6.131963062257968, "percentage": 61.32, "elapsed_time": "2:51:21", "remaining_time": "1:48:05", "throughput": 2309.01, "total_tokens": 23740712} {"current_steps": 41175, "total_steps": 67140, "loss": 0.7289, "lr": 1.9524628898489016e-05, "epoch": 6.132707774798928, "percentage": 61.33, "elapsed_time": "2:51:23", "remaining_time": "1:48:04", "throughput": 2309.07, "total_tokens": 23744200} {"current_steps": 41180, "total_steps": 67140, "loss": 0.5151, "lr": 1.9518288022634468e-05, "epoch": 6.133452487339887, "percentage": 61.33, "elapsed_time": "2:51:24", "remaining_time": "1:48:03", "throughput": 2309.09, "total_tokens": 23746984} {"current_steps": 41185, "total_steps": 67140, "loss": 0.5116, "lr": 1.9511947517211742e-05, "epoch": 6.134197199880846, "percentage": 61.34, "elapsed_time": "2:51:25", "remaining_time": "1:48:01", "throughput": 2309.12, "total_tokens": 23750024} {"current_steps": 41190, "total_steps": 67140, "loss": 0.587, "lr": 1.9505607382649276e-05, "epoch": 6.134941912421805, "percentage": 61.35, "elapsed_time": "2:51:26", "remaining_time": "1:48:00", "throughput": 2309.17, "total_tokens": 23753160} {"current_steps": 41195, "total_steps": 67140, "loss": 0.652, "lr": 1.9499267619375534e-05, "epoch": 6.135686624962764, "percentage": 61.36, "elapsed_time": "2:51:27", "remaining_time": "1:47:59", "throughput": 2309.19, "total_tokens": 23755976} {"current_steps": 41200, "total_steps": 67140, "loss": 0.546, "lr": 1.9492928227818914e-05, "epoch": 6.136431337503724, "percentage": 61.36, "elapsed_time": "2:51:28", "remaining_time": "1:47:57", "throughput": 2309.22, "total_tokens": 23758888} {"current_steps": 41205, "total_steps": 67140, "loss": 0.4308, "lr": 1.9486589208407812e-05, "epoch": 6.137176050044682, "percentage": 61.37, "elapsed_time": "2:51:29", "remaining_time": "1:47:56", "throughput": 2309.23, "total_tokens": 23761544} {"current_steps": 41210, "total_steps": 67140, "loss": 0.5732, "lr": 1.9480250561570603e-05, "epoch": 6.137920762585642, "percentage": 61.38, "elapsed_time": "2:51:30", "remaining_time": "1:47:55", "throughput": 2309.25, "total_tokens": 23764488} {"current_steps": 41215, "total_steps": 67140, "loss": 0.714, "lr": 1.9473912287735614e-05, "epoch": 6.138665475126601, "percentage": 61.39, "elapsed_time": "2:51:32", "remaining_time": "1:47:53", "throughput": 2309.27, "total_tokens": 23767304} {"current_steps": 41220, "total_steps": 67140, "loss": 0.6507, "lr": 1.9467574387331167e-05, "epoch": 6.13941018766756, "percentage": 61.39, "elapsed_time": "2:51:33", "remaining_time": "1:47:52", "throughput": 2309.27, "total_tokens": 23769800} {"current_steps": 41225, "total_steps": 67140, "loss": 0.6256, "lr": 1.9461236860785558e-05, "epoch": 6.140154900208519, "percentage": 61.4, "elapsed_time": "2:51:34", "remaining_time": "1:47:51", "throughput": 2309.29, "total_tokens": 23772680} {"current_steps": 41230, "total_steps": 67140, "loss": 0.4797, "lr": 1.9454899708527038e-05, "epoch": 6.140899612749479, "percentage": 61.41, "elapsed_time": "2:51:35", "remaining_time": "1:47:49", "throughput": 2309.31, "total_tokens": 23775400} {"current_steps": 41235, "total_steps": 67140, "loss": 0.5976, "lr": 1.9448562930983848e-05, "epoch": 6.141644325290438, "percentage": 61.42, "elapsed_time": "2:51:36", "remaining_time": "1:47:48", "throughput": 2309.33, "total_tokens": 23778216} {"current_steps": 41240, "total_steps": 67140, "loss": 0.485, "lr": 1.94422265285842e-05, "epoch": 6.142389037831397, "percentage": 61.42, "elapsed_time": "2:51:37", "remaining_time": "1:47:47", "throughput": 2309.36, "total_tokens": 23781256} {"current_steps": 41245, "total_steps": 67140, "loss": 0.5919, "lr": 1.9435890501756294e-05, "epoch": 6.143133750372356, "percentage": 61.43, "elapsed_time": "2:51:38", "remaining_time": "1:47:45", "throughput": 2309.37, "total_tokens": 23783848} {"current_steps": 41250, "total_steps": 67140, "loss": 0.5796, "lr": 1.9429554850928284e-05, "epoch": 6.143878462913316, "percentage": 61.44, "elapsed_time": "2:51:39", "remaining_time": "1:47:44", "throughput": 2309.4, "total_tokens": 23786792} {"current_steps": 41255, "total_steps": 67140, "loss": 0.36, "lr": 1.9423219576528306e-05, "epoch": 6.144623175454274, "percentage": 61.45, "elapsed_time": "2:51:41", "remaining_time": "1:47:43", "throughput": 2309.44, "total_tokens": 23789832} {"current_steps": 41260, "total_steps": 67140, "loss": 0.509, "lr": 1.941688467898448e-05, "epoch": 6.145367887995234, "percentage": 61.45, "elapsed_time": "2:51:42", "remaining_time": "1:47:42", "throughput": 2309.46, "total_tokens": 23792680} {"current_steps": 41265, "total_steps": 67140, "loss": 0.7558, "lr": 1.9410550158724898e-05, "epoch": 6.146112600536193, "percentage": 61.46, "elapsed_time": "2:51:43", "remaining_time": "1:47:40", "throughput": 2309.49, "total_tokens": 23795624} {"current_steps": 41270, "total_steps": 67140, "loss": 0.4866, "lr": 1.9404216016177594e-05, "epoch": 6.146857313077152, "percentage": 61.47, "elapsed_time": "2:51:44", "remaining_time": "1:47:39", "throughput": 2309.51, "total_tokens": 23798472} {"current_steps": 41275, "total_steps": 67140, "loss": 0.6415, "lr": 1.9397882251770627e-05, "epoch": 6.147602025618111, "percentage": 61.48, "elapsed_time": "2:51:45", "remaining_time": "1:47:38", "throughput": 2309.57, "total_tokens": 23801864} {"current_steps": 41280, "total_steps": 67140, "loss": 0.5831, "lr": 1.9391548865932e-05, "epoch": 6.148346738159071, "percentage": 61.48, "elapsed_time": "2:51:46", "remaining_time": "1:47:36", "throughput": 2309.58, "total_tokens": 23804616} {"current_steps": 41285, "total_steps": 67140, "loss": 0.6788, "lr": 1.9385215859089702e-05, "epoch": 6.14909145070003, "percentage": 61.49, "elapsed_time": "2:51:48", "remaining_time": "1:47:35", "throughput": 2309.59, "total_tokens": 23807304} {"current_steps": 41290, "total_steps": 67140, "loss": 0.5187, "lr": 1.937888323167168e-05, "epoch": 6.149836163240989, "percentage": 61.5, "elapsed_time": "2:51:49", "remaining_time": "1:47:34", "throughput": 2309.62, "total_tokens": 23810216} {"current_steps": 41295, "total_steps": 67140, "loss": 0.5557, "lr": 1.9372550984105885e-05, "epoch": 6.150580875781948, "percentage": 61.51, "elapsed_time": "2:51:50", "remaining_time": "1:47:32", "throughput": 2309.64, "total_tokens": 23813032} {"current_steps": 41300, "total_steps": 67140, "loss": 0.659, "lr": 1.9366219116820205e-05, "epoch": 6.151325588322908, "percentage": 61.51, "elapsed_time": "2:51:51", "remaining_time": "1:47:31", "throughput": 2309.65, "total_tokens": 23815752} {"current_steps": 41305, "total_steps": 67140, "loss": 0.4805, "lr": 1.9359887630242547e-05, "epoch": 6.152070300863866, "percentage": 61.52, "elapsed_time": "2:51:52", "remaining_time": "1:47:30", "throughput": 2309.68, "total_tokens": 23818664} {"current_steps": 41310, "total_steps": 67140, "loss": 0.6625, "lr": 1.9353556524800743e-05, "epoch": 6.152815013404826, "percentage": 61.53, "elapsed_time": "2:51:53", "remaining_time": "1:47:28", "throughput": 2309.7, "total_tokens": 23821576} {"current_steps": 41315, "total_steps": 67140, "loss": 0.691, "lr": 1.934722580092263e-05, "epoch": 6.153559725945785, "percentage": 61.54, "elapsed_time": "2:51:54", "remaining_time": "1:47:27", "throughput": 2309.73, "total_tokens": 23824584} {"current_steps": 41320, "total_steps": 67140, "loss": 0.6417, "lr": 1.9340895459036014e-05, "epoch": 6.1543044384867445, "percentage": 61.54, "elapsed_time": "2:51:55", "remaining_time": "1:47:26", "throughput": 2309.75, "total_tokens": 23827336} {"current_steps": 41325, "total_steps": 67140, "loss": 0.6713, "lr": 1.9334565499568676e-05, "epoch": 6.155049151027703, "percentage": 61.55, "elapsed_time": "2:51:57", "remaining_time": "1:47:24", "throughput": 2309.76, "total_tokens": 23830056} {"current_steps": 41330, "total_steps": 67140, "loss": 0.4706, "lr": 1.9328235922948375e-05, "epoch": 6.155793863568663, "percentage": 61.56, "elapsed_time": "2:51:58", "remaining_time": "1:47:23", "throughput": 2309.78, "total_tokens": 23832712} {"current_steps": 41335, "total_steps": 67140, "loss": 0.5631, "lr": 1.932190672960282e-05, "epoch": 6.156538576109622, "percentage": 61.57, "elapsed_time": "2:51:59", "remaining_time": "1:47:22", "throughput": 2309.81, "total_tokens": 23835720} {"current_steps": 41340, "total_steps": 67140, "loss": 0.7873, "lr": 1.931557791995973e-05, "epoch": 6.157283288650581, "percentage": 61.57, "elapsed_time": "2:52:00", "remaining_time": "1:47:20", "throughput": 2309.82, "total_tokens": 23838472} {"current_steps": 41345, "total_steps": 67140, "loss": 0.5803, "lr": 1.930924949444677e-05, "epoch": 6.15802800119154, "percentage": 61.58, "elapsed_time": "2:52:01", "remaining_time": "1:47:19", "throughput": 2309.84, "total_tokens": 23841192} {"current_steps": 41350, "total_steps": 67140, "loss": 0.8778, "lr": 1.9302921453491596e-05, "epoch": 6.1587727137325, "percentage": 61.59, "elapsed_time": "2:52:02", "remaining_time": "1:47:18", "throughput": 2309.86, "total_tokens": 23844072} {"current_steps": 41355, "total_steps": 67140, "loss": 0.6435, "lr": 1.9296593797521823e-05, "epoch": 6.159517426273458, "percentage": 61.6, "elapsed_time": "2:52:03", "remaining_time": "1:47:16", "throughput": 2309.89, "total_tokens": 23846952} {"current_steps": 41360, "total_steps": 67140, "loss": 0.5368, "lr": 1.9290266526965056e-05, "epoch": 6.160262138814417, "percentage": 61.6, "elapsed_time": "2:52:05", "remaining_time": "1:47:15", "throughput": 2309.92, "total_tokens": 23849928} {"current_steps": 41365, "total_steps": 67140, "loss": 0.6637, "lr": 1.9283939642248858e-05, "epoch": 6.161006851355377, "percentage": 61.61, "elapsed_time": "2:52:06", "remaining_time": "1:47:14", "throughput": 2309.94, "total_tokens": 23852776} {"current_steps": 41370, "total_steps": 67140, "loss": 0.7381, "lr": 1.927761314380078e-05, "epoch": 6.161751563896336, "percentage": 61.62, "elapsed_time": "2:52:07", "remaining_time": "1:47:13", "throughput": 2309.99, "total_tokens": 23856008} {"current_steps": 41375, "total_steps": 67140, "loss": 0.5443, "lr": 1.9271287032048343e-05, "epoch": 6.162496276437295, "percentage": 61.62, "elapsed_time": "2:52:08", "remaining_time": "1:47:11", "throughput": 2310.0, "total_tokens": 23858632} {"current_steps": 41380, "total_steps": 67140, "loss": 0.539, "lr": 1.9264961307419037e-05, "epoch": 6.163240988978254, "percentage": 61.63, "elapsed_time": "2:52:09", "remaining_time": "1:47:10", "throughput": 2310.03, "total_tokens": 23861512} {"current_steps": 41385, "total_steps": 67140, "loss": 0.651, "lr": 1.9258635970340326e-05, "epoch": 6.163985701519214, "percentage": 61.64, "elapsed_time": "2:52:10", "remaining_time": "1:47:09", "throughput": 2310.05, "total_tokens": 23864328} {"current_steps": 41390, "total_steps": 67140, "loss": 0.6068, "lr": 1.925231102123966e-05, "epoch": 6.164730414060172, "percentage": 61.65, "elapsed_time": "2:52:11", "remaining_time": "1:47:07", "throughput": 2310.08, "total_tokens": 23867368} {"current_steps": 41395, "total_steps": 67140, "loss": 0.7837, "lr": 1.9245986460544448e-05, "epoch": 6.165475126601132, "percentage": 61.65, "elapsed_time": "2:52:12", "remaining_time": "1:47:06", "throughput": 2310.11, "total_tokens": 23870248} {"current_steps": 41400, "total_steps": 67140, "loss": 0.7565, "lr": 1.9239662288682067e-05, "epoch": 6.166219839142091, "percentage": 61.66, "elapsed_time": "2:52:14", "remaining_time": "1:47:05", "throughput": 2310.11, "total_tokens": 23872872} {"current_steps": 41405, "total_steps": 67140, "loss": 0.7321, "lr": 1.923333850607989e-05, "epoch": 6.1669645516830505, "percentage": 61.67, "elapsed_time": "2:52:15", "remaining_time": "1:47:03", "throughput": 2310.14, "total_tokens": 23875784} {"current_steps": 41410, "total_steps": 67140, "loss": 0.5404, "lr": 1.922701511316526e-05, "epoch": 6.167709264224009, "percentage": 61.68, "elapsed_time": "2:52:16", "remaining_time": "1:47:02", "throughput": 2310.16, "total_tokens": 23878632} {"current_steps": 41415, "total_steps": 67140, "loss": 0.5034, "lr": 1.9220692110365468e-05, "epoch": 6.168453976764969, "percentage": 61.68, "elapsed_time": "2:52:17", "remaining_time": "1:47:01", "throughput": 2310.21, "total_tokens": 23881832} {"current_steps": 41420, "total_steps": 67140, "loss": 0.6961, "lr": 1.9214369498107806e-05, "epoch": 6.169198689305928, "percentage": 61.69, "elapsed_time": "2:52:18", "remaining_time": "1:46:59", "throughput": 2310.27, "total_tokens": 23885224} {"current_steps": 41425, "total_steps": 67140, "loss": 0.567, "lr": 1.9208047276819537e-05, "epoch": 6.169943401846887, "percentage": 61.7, "elapsed_time": "2:52:19", "remaining_time": "1:46:58", "throughput": 2310.29, "total_tokens": 23888136} {"current_steps": 41430, "total_steps": 67140, "loss": 0.6181, "lr": 1.920172544692789e-05, "epoch": 6.170688114387846, "percentage": 61.71, "elapsed_time": "2:52:21", "remaining_time": "1:46:57", "throughput": 2310.32, "total_tokens": 23891112} {"current_steps": 41435, "total_steps": 67140, "loss": 0.5844, "lr": 1.9195404008860053e-05, "epoch": 6.171432826928806, "percentage": 61.71, "elapsed_time": "2:52:22", "remaining_time": "1:46:55", "throughput": 2310.34, "total_tokens": 23893896} {"current_steps": 41440, "total_steps": 67140, "loss": 0.599, "lr": 1.9189082963043213e-05, "epoch": 6.172177539469764, "percentage": 61.72, "elapsed_time": "2:52:23", "remaining_time": "1:46:54", "throughput": 2310.35, "total_tokens": 23896648} {"current_steps": 41445, "total_steps": 67140, "loss": 0.7797, "lr": 1.918276230990453e-05, "epoch": 6.172922252010724, "percentage": 61.73, "elapsed_time": "2:52:24", "remaining_time": "1:46:53", "throughput": 2310.38, "total_tokens": 23899624} {"current_steps": 41450, "total_steps": 67140, "loss": 0.6511, "lr": 1.9176442049871108e-05, "epoch": 6.173666964551683, "percentage": 61.74, "elapsed_time": "2:52:25", "remaining_time": "1:46:52", "throughput": 2310.41, "total_tokens": 23902504} {"current_steps": 41455, "total_steps": 67140, "loss": 0.517, "lr": 1.9170122183370058e-05, "epoch": 6.1744116770926425, "percentage": 61.74, "elapsed_time": "2:52:26", "remaining_time": "1:46:50", "throughput": 2310.44, "total_tokens": 23905352} {"current_steps": 41460, "total_steps": 67140, "loss": 0.5533, "lr": 1.9163802710828453e-05, "epoch": 6.175156389633601, "percentage": 61.75, "elapsed_time": "2:52:27", "remaining_time": "1:46:49", "throughput": 2310.48, "total_tokens": 23908552} {"current_steps": 41465, "total_steps": 67140, "loss": 0.789, "lr": 1.9157483632673328e-05, "epoch": 6.175901102174561, "percentage": 61.76, "elapsed_time": "2:52:29", "remaining_time": "1:46:48", "throughput": 2310.51, "total_tokens": 23911432} {"current_steps": 41470, "total_steps": 67140, "loss": 0.5911, "lr": 1.9151164949331714e-05, "epoch": 6.17664581471552, "percentage": 61.77, "elapsed_time": "2:52:30", "remaining_time": "1:46:46", "throughput": 2310.51, "total_tokens": 23913992} {"current_steps": 41475, "total_steps": 67140, "loss": 0.6561, "lr": 1.914484666123058e-05, "epoch": 6.177390527256479, "percentage": 61.77, "elapsed_time": "2:52:31", "remaining_time": "1:46:45", "throughput": 2310.56, "total_tokens": 23917224} {"current_steps": 41480, "total_steps": 67140, "loss": 0.5628, "lr": 1.9138528768796915e-05, "epoch": 6.178135239797438, "percentage": 61.78, "elapsed_time": "2:52:32", "remaining_time": "1:46:44", "throughput": 2310.57, "total_tokens": 23919880} {"current_steps": 41485, "total_steps": 67140, "loss": 0.5716, "lr": 1.9132211272457634e-05, "epoch": 6.178879952338398, "percentage": 61.79, "elapsed_time": "2:52:33", "remaining_time": "1:46:42", "throughput": 2310.59, "total_tokens": 23922664} {"current_steps": 41490, "total_steps": 67140, "loss": 0.4917, "lr": 1.9125894172639663e-05, "epoch": 6.1796246648793565, "percentage": 61.8, "elapsed_time": "2:52:34", "remaining_time": "1:46:41", "throughput": 2310.61, "total_tokens": 23925576} {"current_steps": 41495, "total_steps": 67140, "loss": 0.5454, "lr": 1.9119577469769883e-05, "epoch": 6.180369377420316, "percentage": 61.8, "elapsed_time": "2:52:35", "remaining_time": "1:46:40", "throughput": 2310.64, "total_tokens": 23928456} {"current_steps": 41500, "total_steps": 67140, "loss": 0.5424, "lr": 1.9113261164275147e-05, "epoch": 6.181114089961275, "percentage": 61.81, "elapsed_time": "2:52:36", "remaining_time": "1:46:38", "throughput": 2310.67, "total_tokens": 23931432} {"current_steps": 41505, "total_steps": 67140, "loss": 0.6359, "lr": 1.9106945256582293e-05, "epoch": 6.1818588025022345, "percentage": 61.82, "elapsed_time": "2:52:38", "remaining_time": "1:46:37", "throughput": 2310.69, "total_tokens": 23934184} {"current_steps": 41510, "total_steps": 67140, "loss": 0.4562, "lr": 1.9100629747118117e-05, "epoch": 6.182603515043193, "percentage": 61.83, "elapsed_time": "2:52:39", "remaining_time": "1:46:36", "throughput": 2310.71, "total_tokens": 23937128} {"current_steps": 41515, "total_steps": 67140, "loss": 0.5148, "lr": 1.90943146363094e-05, "epoch": 6.183348227584153, "percentage": 61.83, "elapsed_time": "2:52:40", "remaining_time": "1:46:34", "throughput": 2310.72, "total_tokens": 23939816} {"current_steps": 41520, "total_steps": 67140, "loss": 0.614, "lr": 1.9087999924582884e-05, "epoch": 6.184092940125112, "percentage": 61.84, "elapsed_time": "2:52:41", "remaining_time": "1:46:33", "throughput": 2310.76, "total_tokens": 23942888} {"current_steps": 41525, "total_steps": 67140, "loss": 0.7767, "lr": 1.9081685612365298e-05, "epoch": 6.18483765266607, "percentage": 61.85, "elapsed_time": "2:52:42", "remaining_time": "1:46:32", "throughput": 2310.79, "total_tokens": 23945896} {"current_steps": 41530, "total_steps": 67140, "loss": 0.5963, "lr": 1.9075371700083333e-05, "epoch": 6.18558236520703, "percentage": 61.86, "elapsed_time": "2:52:43", "remaining_time": "1:46:30", "throughput": 2310.82, "total_tokens": 23948712} {"current_steps": 41535, "total_steps": 67140, "loss": 0.5778, "lr": 1.906905818816366e-05, "epoch": 6.18632707774799, "percentage": 61.86, "elapsed_time": "2:52:44", "remaining_time": "1:46:29", "throughput": 2310.85, "total_tokens": 23951688} {"current_steps": 41540, "total_steps": 67140, "loss": 0.6565, "lr": 1.906274507703293e-05, "epoch": 6.1870717902889485, "percentage": 61.87, "elapsed_time": "2:52:46", "remaining_time": "1:46:28", "throughput": 2310.88, "total_tokens": 23954728} {"current_steps": 41545, "total_steps": 67140, "loss": 0.4568, "lr": 1.9056432367117744e-05, "epoch": 6.187816502829907, "percentage": 61.88, "elapsed_time": "2:52:47", "remaining_time": "1:46:26", "throughput": 2310.9, "total_tokens": 23957448} {"current_steps": 41550, "total_steps": 67140, "loss": 0.8642, "lr": 1.90501200588447e-05, "epoch": 6.188561215370867, "percentage": 61.89, "elapsed_time": "2:52:48", "remaining_time": "1:46:25", "throughput": 2310.92, "total_tokens": 23960328} {"current_steps": 41555, "total_steps": 67140, "loss": 0.568, "lr": 1.9043808152640342e-05, "epoch": 6.189305927911826, "percentage": 61.89, "elapsed_time": "2:52:49", "remaining_time": "1:46:24", "throughput": 2310.95, "total_tokens": 23963240} {"current_steps": 41560, "total_steps": 67140, "loss": 0.6068, "lr": 1.903749664893122e-05, "epoch": 6.190050640452785, "percentage": 61.9, "elapsed_time": "2:52:50", "remaining_time": "1:46:23", "throughput": 2310.99, "total_tokens": 23966344} {"current_steps": 41565, "total_steps": 67140, "loss": 0.5061, "lr": 1.9031185548143827e-05, "epoch": 6.190795352993744, "percentage": 61.91, "elapsed_time": "2:52:51", "remaining_time": "1:46:21", "throughput": 2310.99, "total_tokens": 23968904} {"current_steps": 41570, "total_steps": 67140, "loss": 0.7013, "lr": 1.9024874850704646e-05, "epoch": 6.191540065534704, "percentage": 61.92, "elapsed_time": "2:52:52", "remaining_time": "1:46:20", "throughput": 2311.04, "total_tokens": 23972200} {"current_steps": 41575, "total_steps": 67140, "loss": 0.4544, "lr": 1.9018564557040135e-05, "epoch": 6.1922847780756625, "percentage": 61.92, "elapsed_time": "2:52:53", "remaining_time": "1:46:19", "throughput": 2311.04, "total_tokens": 23974760} {"current_steps": 41580, "total_steps": 67140, "loss": 0.5753, "lr": 1.9012254667576707e-05, "epoch": 6.193029490616622, "percentage": 61.93, "elapsed_time": "2:52:55", "remaining_time": "1:46:17", "throughput": 2311.08, "total_tokens": 23977896} {"current_steps": 41585, "total_steps": 67140, "loss": 0.6232, "lr": 1.9005945182740765e-05, "epoch": 6.193774203157581, "percentage": 61.94, "elapsed_time": "2:52:56", "remaining_time": "1:46:16", "throughput": 2311.11, "total_tokens": 23980872} {"current_steps": 41590, "total_steps": 67140, "loss": 0.5434, "lr": 1.899963610295869e-05, "epoch": 6.1945189156985405, "percentage": 61.95, "elapsed_time": "2:52:57", "remaining_time": "1:46:15", "throughput": 2311.13, "total_tokens": 23983592} {"current_steps": 41595, "total_steps": 67140, "loss": 0.498, "lr": 1.8993327428656805e-05, "epoch": 6.195263628239499, "percentage": 61.95, "elapsed_time": "2:52:58", "remaining_time": "1:46:13", "throughput": 2311.14, "total_tokens": 23986184} {"current_steps": 41600, "total_steps": 67140, "loss": 0.5633, "lr": 1.898701916026142e-05, "epoch": 6.196008340780459, "percentage": 61.96, "elapsed_time": "2:52:59", "remaining_time": "1:46:12", "throughput": 2311.16, "total_tokens": 23989032} {"current_steps": 41605, "total_steps": 67140, "loss": 0.5172, "lr": 1.8980711298198843e-05, "epoch": 6.196753053321418, "percentage": 61.97, "elapsed_time": "2:53:00", "remaining_time": "1:46:11", "throughput": 2311.21, "total_tokens": 23992328} {"current_steps": 41610, "total_steps": 67140, "loss": 0.4727, "lr": 1.897440384289532e-05, "epoch": 6.197497765862377, "percentage": 61.97, "elapsed_time": "2:53:02", "remaining_time": "1:46:09", "throughput": 2311.24, "total_tokens": 23995368} {"current_steps": 41615, "total_steps": 67140, "loss": 0.6101, "lr": 1.8968096794777087e-05, "epoch": 6.198242478403336, "percentage": 61.98, "elapsed_time": "2:53:03", "remaining_time": "1:46:08", "throughput": 2311.26, "total_tokens": 23998120} {"current_steps": 41620, "total_steps": 67140, "loss": 0.5714, "lr": 1.896179015427035e-05, "epoch": 6.198987190944296, "percentage": 61.99, "elapsed_time": "2:53:04", "remaining_time": "1:46:07", "throughput": 2311.27, "total_tokens": 24000840} {"current_steps": 41625, "total_steps": 67140, "loss": 0.8524, "lr": 1.8955483921801286e-05, "epoch": 6.1997319034852545, "percentage": 62.0, "elapsed_time": "2:53:05", "remaining_time": "1:46:05", "throughput": 2311.29, "total_tokens": 24003592} {"current_steps": 41630, "total_steps": 67140, "loss": 0.4961, "lr": 1.894917809779605e-05, "epoch": 6.200476616026214, "percentage": 62.0, "elapsed_time": "2:53:06", "remaining_time": "1:46:04", "throughput": 2311.31, "total_tokens": 24006408} {"current_steps": 41635, "total_steps": 67140, "loss": 0.5499, "lr": 1.8942872682680747e-05, "epoch": 6.201221328567173, "percentage": 62.01, "elapsed_time": "2:53:07", "remaining_time": "1:46:03", "throughput": 2311.32, "total_tokens": 24009160} {"current_steps": 41640, "total_steps": 67140, "loss": 0.567, "lr": 1.893656767688148e-05, "epoch": 6.2019660411081325, "percentage": 62.02, "elapsed_time": "2:53:08", "remaining_time": "1:46:01", "throughput": 2311.34, "total_tokens": 24011912} {"current_steps": 41645, "total_steps": 67140, "loss": 0.4701, "lr": 1.8930263080824327e-05, "epoch": 6.202710753649091, "percentage": 62.03, "elapsed_time": "2:53:09", "remaining_time": "1:46:00", "throughput": 2311.39, "total_tokens": 24015144} {"current_steps": 41650, "total_steps": 67140, "loss": 0.5629, "lr": 1.892395889493531e-05, "epoch": 6.203455466190051, "percentage": 62.03, "elapsed_time": "2:53:11", "remaining_time": "1:45:59", "throughput": 2311.42, "total_tokens": 24018184} {"current_steps": 41655, "total_steps": 67140, "loss": 0.9012, "lr": 1.8917655119640446e-05, "epoch": 6.20420017873101, "percentage": 62.04, "elapsed_time": "2:53:12", "remaining_time": "1:45:58", "throughput": 2311.43, "total_tokens": 24020872} {"current_steps": 41660, "total_steps": 67140, "loss": 0.5658, "lr": 1.8911351755365726e-05, "epoch": 6.204944891271969, "percentage": 62.05, "elapsed_time": "2:53:13", "remaining_time": "1:45:56", "throughput": 2311.48, "total_tokens": 24024136} {"current_steps": 41665, "total_steps": 67140, "loss": 0.7164, "lr": 1.890504880253709e-05, "epoch": 6.205689603812928, "percentage": 62.06, "elapsed_time": "2:53:14", "remaining_time": "1:45:55", "throughput": 2311.51, "total_tokens": 24027240} {"current_steps": 41670, "total_steps": 67140, "loss": 0.5595, "lr": 1.8898746261580493e-05, "epoch": 6.206434316353888, "percentage": 62.06, "elapsed_time": "2:53:15", "remaining_time": "1:45:54", "throughput": 2311.52, "total_tokens": 24029928} {"current_steps": 41675, "total_steps": 67140, "loss": 0.486, "lr": 1.8892444132921803e-05, "epoch": 6.2071790288948465, "percentage": 62.07, "elapsed_time": "2:53:16", "remaining_time": "1:45:52", "throughput": 2311.56, "total_tokens": 24032936} {"current_steps": 41680, "total_steps": 67140, "loss": 0.4879, "lr": 1.8886142416986917e-05, "epoch": 6.207923741435806, "percentage": 62.08, "elapsed_time": "2:53:17", "remaining_time": "1:45:51", "throughput": 2311.59, "total_tokens": 24035880} {"current_steps": 41685, "total_steps": 67140, "loss": 0.5618, "lr": 1.887984111420166e-05, "epoch": 6.208668453976765, "percentage": 62.09, "elapsed_time": "2:53:19", "remaining_time": "1:45:50", "throughput": 2311.62, "total_tokens": 24038888} {"current_steps": 41690, "total_steps": 67140, "loss": 0.4305, "lr": 1.8873540224991864e-05, "epoch": 6.209413166517725, "percentage": 62.09, "elapsed_time": "2:53:20", "remaining_time": "1:45:48", "throughput": 2311.64, "total_tokens": 24041608} {"current_steps": 41695, "total_steps": 67140, "loss": 0.7637, "lr": 1.8867239749783307e-05, "epoch": 6.210157879058683, "percentage": 62.1, "elapsed_time": "2:53:21", "remaining_time": "1:45:47", "throughput": 2311.66, "total_tokens": 24044456} {"current_steps": 41700, "total_steps": 67140, "loss": 0.6706, "lr": 1.8860939689001754e-05, "epoch": 6.210902591599643, "percentage": 62.11, "elapsed_time": "2:53:22", "remaining_time": "1:45:46", "throughput": 2311.67, "total_tokens": 24047176} {"current_steps": 41705, "total_steps": 67140, "loss": 0.6327, "lr": 1.885464004307294e-05, "epoch": 6.211647304140602, "percentage": 62.12, "elapsed_time": "2:53:23", "remaining_time": "1:45:44", "throughput": 2311.71, "total_tokens": 24050184} {"current_steps": 41710, "total_steps": 67140, "loss": 0.6634, "lr": 1.8848340812422574e-05, "epoch": 6.2123920166815605, "percentage": 62.12, "elapsed_time": "2:53:24", "remaining_time": "1:45:43", "throughput": 2311.73, "total_tokens": 24053000} {"current_steps": 41715, "total_steps": 67140, "loss": 0.4495, "lr": 1.884204199747631e-05, "epoch": 6.21313672922252, "percentage": 62.13, "elapsed_time": "2:53:25", "remaining_time": "1:45:42", "throughput": 2311.75, "total_tokens": 24055976} {"current_steps": 41720, "total_steps": 67140, "loss": 0.7687, "lr": 1.8835743598659815e-05, "epoch": 6.213881441763479, "percentage": 62.14, "elapsed_time": "2:53:27", "remaining_time": "1:45:41", "throughput": 2311.77, "total_tokens": 24058696} {"current_steps": 41725, "total_steps": 67140, "loss": 0.5648, "lr": 1.8829445616398713e-05, "epoch": 6.2146261543044385, "percentage": 62.15, "elapsed_time": "2:53:28", "remaining_time": "1:45:39", "throughput": 2311.8, "total_tokens": 24061736} {"current_steps": 41730, "total_steps": 67140, "loss": 0.7123, "lr": 1.8823148051118585e-05, "epoch": 6.215370866845397, "percentage": 62.15, "elapsed_time": "2:53:29", "remaining_time": "1:45:38", "throughput": 2311.84, "total_tokens": 24064808} {"current_steps": 41735, "total_steps": 67140, "loss": 0.6474, "lr": 1.8816850903244994e-05, "epoch": 6.216115579386357, "percentage": 62.16, "elapsed_time": "2:53:30", "remaining_time": "1:45:37", "throughput": 2311.87, "total_tokens": 24067752} {"current_steps": 41740, "total_steps": 67140, "loss": 0.6029, "lr": 1.8810554173203486e-05, "epoch": 6.216860291927316, "percentage": 62.17, "elapsed_time": "2:53:31", "remaining_time": "1:45:35", "throughput": 2311.88, "total_tokens": 24070408} {"current_steps": 41745, "total_steps": 67140, "loss": 0.6927, "lr": 1.8804257861419556e-05, "epoch": 6.217605004468275, "percentage": 62.18, "elapsed_time": "2:53:32", "remaining_time": "1:45:34", "throughput": 2311.9, "total_tokens": 24073256} {"current_steps": 41750, "total_steps": 67140, "loss": 0.4418, "lr": 1.87979619683187e-05, "epoch": 6.218349717009234, "percentage": 62.18, "elapsed_time": "2:53:33", "remaining_time": "1:45:33", "throughput": 2311.94, "total_tokens": 24076424} {"current_steps": 41755, "total_steps": 67140, "loss": 0.5181, "lr": 1.8791666494326353e-05, "epoch": 6.219094429550194, "percentage": 62.19, "elapsed_time": "2:53:35", "remaining_time": "1:45:31", "throughput": 2311.97, "total_tokens": 24079400} {"current_steps": 41760, "total_steps": 67140, "loss": 0.6467, "lr": 1.8785371439867945e-05, "epoch": 6.2198391420911525, "percentage": 62.2, "elapsed_time": "2:53:36", "remaining_time": "1:45:30", "throughput": 2311.97, "total_tokens": 24081960} {"current_steps": 41765, "total_steps": 67140, "loss": 0.6951, "lr": 1.8779076805368862e-05, "epoch": 6.220583854632112, "percentage": 62.21, "elapsed_time": "2:53:37", "remaining_time": "1:45:29", "throughput": 2312.01, "total_tokens": 24085000} {"current_steps": 41770, "total_steps": 67140, "loss": 0.545, "lr": 1.8772782591254474e-05, "epoch": 6.221328567173071, "percentage": 62.21, "elapsed_time": "2:53:38", "remaining_time": "1:45:27", "throughput": 2312.03, "total_tokens": 24087848} {"current_steps": 41775, "total_steps": 67140, "loss": 0.4709, "lr": 1.876648879795013e-05, "epoch": 6.222073279714031, "percentage": 62.22, "elapsed_time": "2:53:39", "remaining_time": "1:45:26", "throughput": 2312.05, "total_tokens": 24090792} {"current_steps": 41780, "total_steps": 67140, "loss": 0.6649, "lr": 1.8760195425881122e-05, "epoch": 6.222817992254989, "percentage": 62.23, "elapsed_time": "2:53:40", "remaining_time": "1:45:25", "throughput": 2312.07, "total_tokens": 24093640} {"current_steps": 41785, "total_steps": 67140, "loss": 0.6241, "lr": 1.8753902475472738e-05, "epoch": 6.223562704795949, "percentage": 62.24, "elapsed_time": "2:53:41", "remaining_time": "1:45:24", "throughput": 2312.12, "total_tokens": 24096776} {"current_steps": 41790, "total_steps": 67140, "loss": 0.6407, "lr": 1.874760994715024e-05, "epoch": 6.224307417336908, "percentage": 62.24, "elapsed_time": "2:53:43", "remaining_time": "1:45:22", "throughput": 2312.14, "total_tokens": 24099624} {"current_steps": 41795, "total_steps": 67140, "loss": 0.5211, "lr": 1.874131784133884e-05, "epoch": 6.225052129877867, "percentage": 62.25, "elapsed_time": "2:53:44", "remaining_time": "1:45:21", "throughput": 2312.17, "total_tokens": 24102600} {"current_steps": 41800, "total_steps": 67140, "loss": 0.5794, "lr": 1.8735026158463724e-05, "epoch": 6.225796842418826, "percentage": 62.26, "elapsed_time": "2:53:45", "remaining_time": "1:45:20", "throughput": 2312.2, "total_tokens": 24105512} {"current_steps": 41805, "total_steps": 67140, "loss": 0.6844, "lr": 1.8728734898950072e-05, "epoch": 6.226541554959786, "percentage": 62.27, "elapsed_time": "2:53:46", "remaining_time": "1:45:18", "throughput": 2312.2, "total_tokens": 24108264} {"current_steps": 41810, "total_steps": 67140, "loss": 0.552, "lr": 1.8722444063223023e-05, "epoch": 6.2272862675007445, "percentage": 62.27, "elapsed_time": "2:53:47", "remaining_time": "1:45:17", "throughput": 2312.21, "total_tokens": 24111016} {"current_steps": 41815, "total_steps": 67140, "loss": 0.7191, "lr": 1.871615365170768e-05, "epoch": 6.228030980041704, "percentage": 62.28, "elapsed_time": "2:53:48", "remaining_time": "1:45:16", "throughput": 2312.23, "total_tokens": 24113832} {"current_steps": 41820, "total_steps": 67140, "loss": 0.7685, "lr": 1.870986366482912e-05, "epoch": 6.228775692582663, "percentage": 62.29, "elapsed_time": "2:53:50", "remaining_time": "1:45:14", "throughput": 2312.27, "total_tokens": 24117032} {"current_steps": 41825, "total_steps": 67140, "loss": 0.4698, "lr": 1.8703574103012407e-05, "epoch": 6.229520405123623, "percentage": 62.3, "elapsed_time": "2:53:51", "remaining_time": "1:45:13", "throughput": 2312.29, "total_tokens": 24119784} {"current_steps": 41830, "total_steps": 67140, "loss": 0.5265, "lr": 1.869728496668256e-05, "epoch": 6.230265117664581, "percentage": 62.3, "elapsed_time": "2:53:52", "remaining_time": "1:45:12", "throughput": 2312.36, "total_tokens": 24123464} {"current_steps": 41835, "total_steps": 67140, "loss": 0.4547, "lr": 1.869099625626456e-05, "epoch": 6.231009830205541, "percentage": 62.31, "elapsed_time": "2:53:53", "remaining_time": "1:45:10", "throughput": 2312.36, "total_tokens": 24126056} {"current_steps": 41840, "total_steps": 67140, "loss": 0.6074, "lr": 1.8684707972183383e-05, "epoch": 6.2317545427465, "percentage": 62.32, "elapsed_time": "2:53:54", "remaining_time": "1:45:09", "throughput": 2312.4, "total_tokens": 24129096} {"current_steps": 41845, "total_steps": 67140, "loss": 0.3585, "lr": 1.867842011486397e-05, "epoch": 6.232499255287459, "percentage": 62.32, "elapsed_time": "2:53:55", "remaining_time": "1:45:08", "throughput": 2312.42, "total_tokens": 24131848} {"current_steps": 41850, "total_steps": 67140, "loss": 0.6458, "lr": 1.867213268473122e-05, "epoch": 6.233243967828418, "percentage": 62.33, "elapsed_time": "2:53:56", "remaining_time": "1:45:07", "throughput": 2312.45, "total_tokens": 24134920} {"current_steps": 41855, "total_steps": 67140, "loss": 0.4996, "lr": 1.866584568221002e-05, "epoch": 6.233988680369378, "percentage": 62.34, "elapsed_time": "2:53:58", "remaining_time": "1:45:05", "throughput": 2312.48, "total_tokens": 24137832} {"current_steps": 41860, "total_steps": 67140, "loss": 0.5606, "lr": 1.865955910772521e-05, "epoch": 6.234733392910337, "percentage": 62.35, "elapsed_time": "2:53:59", "remaining_time": "1:45:04", "throughput": 2312.51, "total_tokens": 24140776} {"current_steps": 41865, "total_steps": 67140, "loss": 0.5834, "lr": 1.8653272961701618e-05, "epoch": 6.235478105451296, "percentage": 62.35, "elapsed_time": "2:54:00", "remaining_time": "1:45:03", "throughput": 2312.53, "total_tokens": 24143560} {"current_steps": 41870, "total_steps": 67140, "loss": 0.6363, "lr": 1.8646987244564047e-05, "epoch": 6.236222817992255, "percentage": 62.36, "elapsed_time": "2:54:01", "remaining_time": "1:45:01", "throughput": 2312.56, "total_tokens": 24146568} {"current_steps": 41875, "total_steps": 67140, "loss": 0.5549, "lr": 1.8640701956737238e-05, "epoch": 6.236967530533214, "percentage": 62.37, "elapsed_time": "2:54:02", "remaining_time": "1:45:00", "throughput": 2312.58, "total_tokens": 24149384} {"current_steps": 41880, "total_steps": 67140, "loss": 0.5963, "lr": 1.8634417098645937e-05, "epoch": 6.237712243074173, "percentage": 62.38, "elapsed_time": "2:54:03", "remaining_time": "1:44:59", "throughput": 2312.61, "total_tokens": 24152360} {"current_steps": 41885, "total_steps": 67140, "loss": 0.6701, "lr": 1.8628132670714846e-05, "epoch": 6.238456955615132, "percentage": 62.38, "elapsed_time": "2:54:04", "remaining_time": "1:44:57", "throughput": 2312.63, "total_tokens": 24155336} {"current_steps": 41890, "total_steps": 67140, "loss": 0.6685, "lr": 1.8621848673368648e-05, "epoch": 6.239201668156092, "percentage": 62.39, "elapsed_time": "2:54:06", "remaining_time": "1:44:56", "throughput": 2312.67, "total_tokens": 24158408} {"current_steps": 41895, "total_steps": 67140, "loss": 0.6864, "lr": 1.861556510703198e-05, "epoch": 6.2399463806970505, "percentage": 62.4, "elapsed_time": "2:54:07", "remaining_time": "1:44:55", "throughput": 2312.72, "total_tokens": 24161640} {"current_steps": 41900, "total_steps": 67140, "loss": 0.5112, "lr": 1.8609281972129464e-05, "epoch": 6.24069109323801, "percentage": 62.41, "elapsed_time": "2:54:08", "remaining_time": "1:44:54", "throughput": 2312.75, "total_tokens": 24164712} {"current_steps": 41905, "total_steps": 67140, "loss": 0.6192, "lr": 1.8602999269085693e-05, "epoch": 6.241435805778969, "percentage": 62.41, "elapsed_time": "2:54:09", "remaining_time": "1:44:52", "throughput": 2312.76, "total_tokens": 24167368} {"current_steps": 41910, "total_steps": 67140, "loss": 0.597, "lr": 1.859671699832523e-05, "epoch": 6.242180518319929, "percentage": 62.42, "elapsed_time": "2:54:10", "remaining_time": "1:44:51", "throughput": 2312.79, "total_tokens": 24170312} {"current_steps": 41915, "total_steps": 67140, "loss": 0.6386, "lr": 1.859043516027259e-05, "epoch": 6.242925230860887, "percentage": 62.43, "elapsed_time": "2:54:11", "remaining_time": "1:44:50", "throughput": 2312.82, "total_tokens": 24173224} {"current_steps": 41920, "total_steps": 67140, "loss": 0.6453, "lr": 1.8584153755352282e-05, "epoch": 6.243669943401847, "percentage": 62.44, "elapsed_time": "2:54:12", "remaining_time": "1:44:48", "throughput": 2312.83, "total_tokens": 24175848} {"current_steps": 41925, "total_steps": 67140, "loss": 0.4892, "lr": 1.857787278398878e-05, "epoch": 6.244414655942806, "percentage": 62.44, "elapsed_time": "2:54:14", "remaining_time": "1:44:47", "throughput": 2312.89, "total_tokens": 24179336} {"current_steps": 41930, "total_steps": 67140, "loss": 0.712, "lr": 1.8571592246606522e-05, "epoch": 6.245159368483765, "percentage": 62.45, "elapsed_time": "2:54:15", "remaining_time": "1:44:46", "throughput": 2312.91, "total_tokens": 24182152} {"current_steps": 41935, "total_steps": 67140, "loss": 0.4646, "lr": 1.8565312143629926e-05, "epoch": 6.245904081024724, "percentage": 62.46, "elapsed_time": "2:54:16", "remaining_time": "1:44:44", "throughput": 2312.94, "total_tokens": 24185128} {"current_steps": 41940, "total_steps": 67140, "loss": 0.714, "lr": 1.855903247548338e-05, "epoch": 6.246648793565684, "percentage": 62.47, "elapsed_time": "2:54:17", "remaining_time": "1:44:43", "throughput": 2312.98, "total_tokens": 24188168} {"current_steps": 41945, "total_steps": 67140, "loss": 0.6667, "lr": 1.855275324259122e-05, "epoch": 6.247393506106643, "percentage": 62.47, "elapsed_time": "2:54:18", "remaining_time": "1:44:42", "throughput": 2313.0, "total_tokens": 24190984} {"current_steps": 41950, "total_steps": 67140, "loss": 0.4221, "lr": 1.8546474445377786e-05, "epoch": 6.248138218647602, "percentage": 62.48, "elapsed_time": "2:54:19", "remaining_time": "1:44:40", "throughput": 2313.03, "total_tokens": 24193960} {"current_steps": 41955, "total_steps": 67140, "loss": 0.4858, "lr": 1.8540196084267386e-05, "epoch": 6.248882931188561, "percentage": 62.49, "elapsed_time": "2:54:20", "remaining_time": "1:44:39", "throughput": 2313.04, "total_tokens": 24196616} {"current_steps": 41960, "total_steps": 67140, "loss": 0.6968, "lr": 1.8533918159684262e-05, "epoch": 6.249627643729521, "percentage": 62.5, "elapsed_time": "2:54:22", "remaining_time": "1:44:38", "throughput": 2313.06, "total_tokens": 24199368} {"current_steps": 41965, "total_steps": 67140, "loss": 1.0358, "lr": 1.8527640672052655e-05, "epoch": 6.250372356270479, "percentage": 62.5, "elapsed_time": "2:54:23", "remaining_time": "1:44:36", "throughput": 2313.09, "total_tokens": 24202440} {"current_steps": 41970, "total_steps": 67140, "loss": 0.6652, "lr": 1.8521363621796774e-05, "epoch": 6.251117068811439, "percentage": 62.51, "elapsed_time": "2:54:24", "remaining_time": "1:44:35", "throughput": 2313.11, "total_tokens": 24205288} {"current_steps": 41975, "total_steps": 67140, "loss": 0.685, "lr": 1.8515087009340808e-05, "epoch": 6.251861781352398, "percentage": 62.52, "elapsed_time": "2:54:25", "remaining_time": "1:44:34", "throughput": 2313.16, "total_tokens": 24208424} {"current_steps": 41980, "total_steps": 67140, "loss": 0.6684, "lr": 1.850881083510889e-05, "epoch": 6.252606493893357, "percentage": 62.53, "elapsed_time": "2:54:26", "remaining_time": "1:44:33", "throughput": 2313.19, "total_tokens": 24211400} {"current_steps": 41985, "total_steps": 67140, "loss": 0.6862, "lr": 1.850253509952514e-05, "epoch": 6.253351206434316, "percentage": 62.53, "elapsed_time": "2:54:27", "remaining_time": "1:44:31", "throughput": 2313.22, "total_tokens": 24214376} {"current_steps": 41990, "total_steps": 67140, "loss": 0.5113, "lr": 1.8496259803013667e-05, "epoch": 6.254095918975276, "percentage": 62.54, "elapsed_time": "2:54:28", "remaining_time": "1:44:30", "throughput": 2313.24, "total_tokens": 24217224} {"current_steps": 41995, "total_steps": 67140, "loss": 0.6262, "lr": 1.8489984945998512e-05, "epoch": 6.254840631516235, "percentage": 62.55, "elapsed_time": "2:54:30", "remaining_time": "1:44:29", "throughput": 2313.3, "total_tokens": 24220712} {"current_steps": 42000, "total_steps": 67140, "loss": 0.5853, "lr": 1.8483710528903698e-05, "epoch": 6.255585344057194, "percentage": 62.56, "elapsed_time": "2:54:31", "remaining_time": "1:44:27", "throughput": 2313.33, "total_tokens": 24223752} {"current_steps": 42005, "total_steps": 67140, "loss": 0.718, "lr": 1.847743655215323e-05, "epoch": 6.256330056598153, "percentage": 62.56, "elapsed_time": "2:54:32", "remaining_time": "1:44:26", "throughput": 2313.38, "total_tokens": 24226984} {"current_steps": 42010, "total_steps": 67140, "loss": 0.4991, "lr": 1.8471163016171088e-05, "epoch": 6.257074769139113, "percentage": 62.57, "elapsed_time": "2:54:33", "remaining_time": "1:44:25", "throughput": 2313.41, "total_tokens": 24229960} {"current_steps": 42015, "total_steps": 67140, "loss": 0.5189, "lr": 1.84648899213812e-05, "epoch": 6.257819481680071, "percentage": 62.58, "elapsed_time": "2:54:34", "remaining_time": "1:44:23", "throughput": 2313.43, "total_tokens": 24232904} {"current_steps": 42020, "total_steps": 67140, "loss": 0.5862, "lr": 1.845861726820749e-05, "epoch": 6.258564194221031, "percentage": 62.59, "elapsed_time": "2:54:35", "remaining_time": "1:44:22", "throughput": 2313.43, "total_tokens": 24235400} {"current_steps": 42025, "total_steps": 67140, "loss": 0.5605, "lr": 1.845234505707382e-05, "epoch": 6.25930890676199, "percentage": 62.59, "elapsed_time": "2:54:37", "remaining_time": "1:44:21", "throughput": 2313.46, "total_tokens": 24238280} {"current_steps": 42030, "total_steps": 67140, "loss": 0.4922, "lr": 1.844607328840405e-05, "epoch": 6.2600536193029495, "percentage": 62.6, "elapsed_time": "2:54:38", "remaining_time": "1:44:19", "throughput": 2313.48, "total_tokens": 24241064} {"current_steps": 42035, "total_steps": 67140, "loss": 0.696, "lr": 1.8439801962622016e-05, "epoch": 6.260798331843908, "percentage": 62.61, "elapsed_time": "2:54:39", "remaining_time": "1:44:18", "throughput": 2313.51, "total_tokens": 24244104} {"current_steps": 42040, "total_steps": 67140, "loss": 0.5501, "lr": 1.8433531080151482e-05, "epoch": 6.261543044384867, "percentage": 62.62, "elapsed_time": "2:54:40", "remaining_time": "1:44:17", "throughput": 2313.53, "total_tokens": 24246920} {"current_steps": 42045, "total_steps": 67140, "loss": 0.6278, "lr": 1.842726064141622e-05, "epoch": 6.262287756925827, "percentage": 62.62, "elapsed_time": "2:54:41", "remaining_time": "1:44:16", "throughput": 2313.54, "total_tokens": 24249640} {"current_steps": 42050, "total_steps": 67140, "loss": 0.5449, "lr": 1.8420990646839957e-05, "epoch": 6.263032469466786, "percentage": 62.63, "elapsed_time": "2:54:42", "remaining_time": "1:44:14", "throughput": 2313.57, "total_tokens": 24252584} {"current_steps": 42055, "total_steps": 67140, "loss": 0.5572, "lr": 1.841472109684641e-05, "epoch": 6.263777182007745, "percentage": 62.64, "elapsed_time": "2:54:43", "remaining_time": "1:44:13", "throughput": 2313.63, "total_tokens": 24256072} {"current_steps": 42060, "total_steps": 67140, "loss": 0.5365, "lr": 1.8408451991859228e-05, "epoch": 6.264521894548704, "percentage": 62.65, "elapsed_time": "2:54:45", "remaining_time": "1:44:12", "throughput": 2313.64, "total_tokens": 24258760} {"current_steps": 42065, "total_steps": 67140, "loss": 0.6258, "lr": 1.840218333230206e-05, "epoch": 6.265266607089663, "percentage": 62.65, "elapsed_time": "2:54:46", "remaining_time": "1:44:10", "throughput": 2313.66, "total_tokens": 24261480} {"current_steps": 42070, "total_steps": 67140, "loss": 0.7049, "lr": 1.8395915118598523e-05, "epoch": 6.266011319630622, "percentage": 62.66, "elapsed_time": "2:54:47", "remaining_time": "1:44:09", "throughput": 2313.67, "total_tokens": 24264136} {"current_steps": 42075, "total_steps": 67140, "loss": 0.621, "lr": 1.83896473511722e-05, "epoch": 6.266756032171582, "percentage": 62.67, "elapsed_time": "2:54:48", "remaining_time": "1:44:08", "throughput": 2313.67, "total_tokens": 24266696} {"current_steps": 42080, "total_steps": 67140, "loss": 0.8419, "lr": 1.838338003044662e-05, "epoch": 6.267500744712541, "percentage": 62.68, "elapsed_time": "2:54:49", "remaining_time": "1:44:06", "throughput": 2313.7, "total_tokens": 24269608} {"current_steps": 42085, "total_steps": 67140, "loss": 0.5359, "lr": 1.8377113156845317e-05, "epoch": 6.2682454572535, "percentage": 62.68, "elapsed_time": "2:54:50", "remaining_time": "1:44:05", "throughput": 2313.72, "total_tokens": 24272328} {"current_steps": 42090, "total_steps": 67140, "loss": 0.6802, "lr": 1.8370846730791786e-05, "epoch": 6.268990169794459, "percentage": 62.69, "elapsed_time": "2:54:51", "remaining_time": "1:44:04", "throughput": 2313.74, "total_tokens": 24275336} {"current_steps": 42095, "total_steps": 67140, "loss": 0.627, "lr": 1.8364580752709475e-05, "epoch": 6.269734882335419, "percentage": 62.7, "elapsed_time": "2:54:52", "remaining_time": "1:44:02", "throughput": 2313.79, "total_tokens": 24278536} {"current_steps": 42100, "total_steps": 67140, "loss": 0.5774, "lr": 1.8358315223021814e-05, "epoch": 6.270479594876377, "percentage": 62.7, "elapsed_time": "2:54:54", "remaining_time": "1:44:01", "throughput": 2313.8, "total_tokens": 24281224} {"current_steps": 42105, "total_steps": 67140, "loss": 0.3776, "lr": 1.835205014215222e-05, "epoch": 6.271224307417337, "percentage": 62.71, "elapsed_time": "2:54:55", "remaining_time": "1:44:00", "throughput": 2313.83, "total_tokens": 24284104} {"current_steps": 42110, "total_steps": 67140, "loss": 0.6347, "lr": 1.8345785510524042e-05, "epoch": 6.271969019958296, "percentage": 62.72, "elapsed_time": "2:54:56", "remaining_time": "1:43:58", "throughput": 2313.84, "total_tokens": 24286856} {"current_steps": 42115, "total_steps": 67140, "loss": 0.5996, "lr": 1.833952132856063e-05, "epoch": 6.2727137324992555, "percentage": 62.73, "elapsed_time": "2:54:57", "remaining_time": "1:43:57", "throughput": 2313.87, "total_tokens": 24289864} {"current_steps": 42120, "total_steps": 67140, "loss": 0.8873, "lr": 1.8333257596685284e-05, "epoch": 6.273458445040214, "percentage": 62.73, "elapsed_time": "2:54:58", "remaining_time": "1:43:56", "throughput": 2313.89, "total_tokens": 24292584} {"current_steps": 42125, "total_steps": 67140, "loss": 0.6405, "lr": 1.832699431532129e-05, "epoch": 6.274203157581174, "percentage": 62.74, "elapsed_time": "2:54:59", "remaining_time": "1:43:55", "throughput": 2313.93, "total_tokens": 24295816} {"current_steps": 42130, "total_steps": 67140, "loss": 0.6415, "lr": 1.832073148489188e-05, "epoch": 6.274947870122133, "percentage": 62.75, "elapsed_time": "2:55:00", "remaining_time": "1:43:53", "throughput": 2313.96, "total_tokens": 24298792} {"current_steps": 42135, "total_steps": 67140, "loss": 0.6389, "lr": 1.831446910582028e-05, "epoch": 6.275692582663092, "percentage": 62.76, "elapsed_time": "2:55:02", "remaining_time": "1:43:52", "throughput": 2313.99, "total_tokens": 24301672} {"current_steps": 42140, "total_steps": 67140, "loss": 0.6519, "lr": 1.8308207178529684e-05, "epoch": 6.276437295204051, "percentage": 62.76, "elapsed_time": "2:55:03", "remaining_time": "1:43:51", "throughput": 2314.0, "total_tokens": 24304424} {"current_steps": 42145, "total_steps": 67140, "loss": 0.7543, "lr": 1.8301945703443236e-05, "epoch": 6.277182007745011, "percentage": 62.77, "elapsed_time": "2:55:04", "remaining_time": "1:43:49", "throughput": 2314.01, "total_tokens": 24307144} {"current_steps": 42150, "total_steps": 67140, "loss": 0.7591, "lr": 1.8295684680984062e-05, "epoch": 6.277926720285969, "percentage": 62.78, "elapsed_time": "2:55:05", "remaining_time": "1:43:48", "throughput": 2314.03, "total_tokens": 24309832} {"current_steps": 42155, "total_steps": 67140, "loss": 0.6734, "lr": 1.828942411157527e-05, "epoch": 6.278671432826929, "percentage": 62.79, "elapsed_time": "2:55:06", "remaining_time": "1:43:47", "throughput": 2314.06, "total_tokens": 24312808} {"current_steps": 42160, "total_steps": 67140, "loss": 0.5738, "lr": 1.828316399563991e-05, "epoch": 6.279416145367888, "percentage": 62.79, "elapsed_time": "2:55:07", "remaining_time": "1:43:45", "throughput": 2314.1, "total_tokens": 24315880} {"current_steps": 42165, "total_steps": 67140, "loss": 0.6318, "lr": 1.8276904333601015e-05, "epoch": 6.2801608579088475, "percentage": 62.8, "elapsed_time": "2:55:08", "remaining_time": "1:43:44", "throughput": 2314.12, "total_tokens": 24318728} {"current_steps": 42170, "total_steps": 67140, "loss": 0.5801, "lr": 1.8270645125881585e-05, "epoch": 6.280905570449806, "percentage": 62.81, "elapsed_time": "2:55:09", "remaining_time": "1:43:43", "throughput": 2314.12, "total_tokens": 24321320} {"current_steps": 42175, "total_steps": 67140, "loss": 0.6964, "lr": 1.8264386372904608e-05, "epoch": 6.281650282990766, "percentage": 62.82, "elapsed_time": "2:55:11", "remaining_time": "1:43:41", "throughput": 2314.14, "total_tokens": 24324072} {"current_steps": 42180, "total_steps": 67140, "loss": 0.634, "lr": 1.825812807509301e-05, "epoch": 6.282394995531725, "percentage": 62.82, "elapsed_time": "2:55:12", "remaining_time": "1:43:40", "throughput": 2314.16, "total_tokens": 24326984} {"current_steps": 42185, "total_steps": 67140, "loss": 0.717, "lr": 1.825187023286971e-05, "epoch": 6.283139708072684, "percentage": 62.83, "elapsed_time": "2:55:13", "remaining_time": "1:43:39", "throughput": 2314.2, "total_tokens": 24330120} {"current_steps": 42190, "total_steps": 67140, "loss": 0.7345, "lr": 1.824561284665758e-05, "epoch": 6.283884420613643, "percentage": 62.84, "elapsed_time": "2:55:14", "remaining_time": "1:43:38", "throughput": 2314.23, "total_tokens": 24333032} {"current_steps": 42195, "total_steps": 67140, "loss": 0.5533, "lr": 1.823935591687948e-05, "epoch": 6.284629133154603, "percentage": 62.85, "elapsed_time": "2:55:15", "remaining_time": "1:43:36", "throughput": 2314.26, "total_tokens": 24336072} {"current_steps": 42200, "total_steps": 67140, "loss": 0.5639, "lr": 1.8233099443958212e-05, "epoch": 6.2853738456955615, "percentage": 62.85, "elapsed_time": "2:55:16", "remaining_time": "1:43:35", "throughput": 2314.28, "total_tokens": 24338952} {"current_steps": 42205, "total_steps": 67140, "loss": 0.7063, "lr": 1.8226843428316576e-05, "epoch": 6.286118558236521, "percentage": 62.86, "elapsed_time": "2:55:17", "remaining_time": "1:43:34", "throughput": 2314.31, "total_tokens": 24341864} {"current_steps": 42210, "total_steps": 67140, "loss": 0.7105, "lr": 1.8220587870377315e-05, "epoch": 6.28686327077748, "percentage": 62.87, "elapsed_time": "2:55:19", "remaining_time": "1:43:32", "throughput": 2314.34, "total_tokens": 24344840} {"current_steps": 42215, "total_steps": 67140, "loss": 0.4717, "lr": 1.8214332770563165e-05, "epoch": 6.2876079833184395, "percentage": 62.88, "elapsed_time": "2:55:20", "remaining_time": "1:43:31", "throughput": 2314.38, "total_tokens": 24347976} {"current_steps": 42220, "total_steps": 67140, "loss": 0.7291, "lr": 1.8208078129296827e-05, "epoch": 6.288352695859398, "percentage": 62.88, "elapsed_time": "2:55:21", "remaining_time": "1:43:30", "throughput": 2314.41, "total_tokens": 24350952} {"current_steps": 42225, "total_steps": 67140, "loss": 0.4841, "lr": 1.8201823947000947e-05, "epoch": 6.289097408400357, "percentage": 62.89, "elapsed_time": "2:55:22", "remaining_time": "1:43:28", "throughput": 2314.43, "total_tokens": 24353768} {"current_steps": 42230, "total_steps": 67140, "loss": 0.6089, "lr": 1.8195570224098162e-05, "epoch": 6.289842120941317, "percentage": 62.9, "elapsed_time": "2:55:23", "remaining_time": "1:43:27", "throughput": 2314.46, "total_tokens": 24356680} {"current_steps": 42235, "total_steps": 67140, "loss": 0.6113, "lr": 1.8189316961011092e-05, "epoch": 6.290586833482275, "percentage": 62.91, "elapsed_time": "2:55:24", "remaining_time": "1:43:26", "throughput": 2314.47, "total_tokens": 24359336} {"current_steps": 42240, "total_steps": 67140, "loss": 0.4109, "lr": 1.818306415816228e-05, "epoch": 6.291331546023235, "percentage": 62.91, "elapsed_time": "2:55:25", "remaining_time": "1:43:24", "throughput": 2314.48, "total_tokens": 24362056} {"current_steps": 42245, "total_steps": 67140, "loss": 0.6495, "lr": 1.817681181597428e-05, "epoch": 6.292076258564194, "percentage": 62.92, "elapsed_time": "2:55:27", "remaining_time": "1:43:23", "throughput": 2314.5, "total_tokens": 24364968} {"current_steps": 42250, "total_steps": 67140, "loss": 0.4468, "lr": 1.817055993486959e-05, "epoch": 6.2928209711051535, "percentage": 62.93, "elapsed_time": "2:55:28", "remaining_time": "1:43:22", "throughput": 2314.53, "total_tokens": 24367912} {"current_steps": 42255, "total_steps": 67140, "loss": 0.6004, "lr": 1.81643085152707e-05, "epoch": 6.293565683646112, "percentage": 62.94, "elapsed_time": "2:55:29", "remaining_time": "1:43:20", "throughput": 2314.55, "total_tokens": 24370728} {"current_steps": 42260, "total_steps": 67140, "loss": 0.5734, "lr": 1.8158057557600045e-05, "epoch": 6.294310396187072, "percentage": 62.94, "elapsed_time": "2:55:30", "remaining_time": "1:43:19", "throughput": 2314.57, "total_tokens": 24373544} {"current_steps": 42265, "total_steps": 67140, "loss": 0.562, "lr": 1.815180706228004e-05, "epoch": 6.295055108728031, "percentage": 62.95, "elapsed_time": "2:55:31", "remaining_time": "1:43:18", "throughput": 2314.61, "total_tokens": 24376680} {"current_steps": 42270, "total_steps": 67140, "loss": 0.6554, "lr": 1.814555702973308e-05, "epoch": 6.29579982126899, "percentage": 62.96, "elapsed_time": "2:55:32", "remaining_time": "1:43:17", "throughput": 2314.63, "total_tokens": 24379496} {"current_steps": 42275, "total_steps": 67140, "loss": 0.7411, "lr": 1.813930746038151e-05, "epoch": 6.296544533809949, "percentage": 62.97, "elapsed_time": "2:55:33", "remaining_time": "1:43:15", "throughput": 2314.67, "total_tokens": 24382664} {"current_steps": 42280, "total_steps": 67140, "loss": 0.633, "lr": 1.813305835464764e-05, "epoch": 6.297289246350909, "percentage": 62.97, "elapsed_time": "2:55:35", "remaining_time": "1:43:14", "throughput": 2314.69, "total_tokens": 24385448} {"current_steps": 42285, "total_steps": 67140, "loss": 0.653, "lr": 1.8126809712953766e-05, "epoch": 6.2980339588918675, "percentage": 62.98, "elapsed_time": "2:55:36", "remaining_time": "1:43:13", "throughput": 2314.71, "total_tokens": 24388232} {"current_steps": 42290, "total_steps": 67140, "loss": 0.6766, "lr": 1.8120561535722153e-05, "epoch": 6.298778671432827, "percentage": 62.99, "elapsed_time": "2:55:37", "remaining_time": "1:43:11", "throughput": 2314.73, "total_tokens": 24391048} {"current_steps": 42295, "total_steps": 67140, "loss": 0.5829, "lr": 1.8114313823375015e-05, "epoch": 6.299523383973786, "percentage": 63.0, "elapsed_time": "2:55:38", "remaining_time": "1:43:10", "throughput": 2314.75, "total_tokens": 24393896} {"current_steps": 42300, "total_steps": 67140, "loss": 0.7098, "lr": 1.8108066576334554e-05, "epoch": 6.3002680965147455, "percentage": 63.0, "elapsed_time": "2:55:39", "remaining_time": "1:43:09", "throughput": 2314.77, "total_tokens": 24396712} {"current_steps": 42305, "total_steps": 67140, "loss": 0.5343, "lr": 1.810181979502294e-05, "epoch": 6.301012809055704, "percentage": 63.01, "elapsed_time": "2:55:40", "remaining_time": "1:43:07", "throughput": 2314.81, "total_tokens": 24399816} {"current_steps": 42310, "total_steps": 67140, "loss": 0.5665, "lr": 1.8095573479862294e-05, "epoch": 6.301757521596664, "percentage": 63.02, "elapsed_time": "2:55:41", "remaining_time": "1:43:06", "throughput": 2314.83, "total_tokens": 24402600} {"current_steps": 42315, "total_steps": 67140, "loss": 0.633, "lr": 1.8089327631274726e-05, "epoch": 6.302502234137623, "percentage": 63.03, "elapsed_time": "2:55:43", "remaining_time": "1:43:05", "throughput": 2314.85, "total_tokens": 24405448} {"current_steps": 42320, "total_steps": 67140, "loss": 0.5207, "lr": 1.8083082249682294e-05, "epoch": 6.303246946678582, "percentage": 63.03, "elapsed_time": "2:55:44", "remaining_time": "1:43:03", "throughput": 2314.87, "total_tokens": 24408392} {"current_steps": 42325, "total_steps": 67140, "loss": 0.5817, "lr": 1.8076837335507047e-05, "epoch": 6.303991659219541, "percentage": 63.04, "elapsed_time": "2:55:45", "remaining_time": "1:43:02", "throughput": 2314.91, "total_tokens": 24411400} {"current_steps": 42330, "total_steps": 67140, "loss": 0.6795, "lr": 1.8070592889170977e-05, "epoch": 6.304736371760501, "percentage": 63.05, "elapsed_time": "2:55:46", "remaining_time": "1:43:01", "throughput": 2314.94, "total_tokens": 24414408} {"current_steps": 42335, "total_steps": 67140, "loss": 0.5969, "lr": 1.806434891109607e-05, "epoch": 6.3054810843014595, "percentage": 63.05, "elapsed_time": "2:55:47", "remaining_time": "1:43:00", "throughput": 2314.96, "total_tokens": 24417256} {"current_steps": 42340, "total_steps": 67140, "loss": 0.6074, "lr": 1.8058105401704267e-05, "epoch": 6.306225796842419, "percentage": 63.06, "elapsed_time": "2:55:48", "remaining_time": "1:42:58", "throughput": 2315.0, "total_tokens": 24420424} {"current_steps": 42345, "total_steps": 67140, "loss": 0.693, "lr": 1.8051862361417478e-05, "epoch": 6.306970509383378, "percentage": 63.07, "elapsed_time": "2:55:49", "remaining_time": "1:42:57", "throughput": 2315.02, "total_tokens": 24423240} {"current_steps": 42350, "total_steps": 67140, "loss": 0.614, "lr": 1.804561979065758e-05, "epoch": 6.3077152219243375, "percentage": 63.08, "elapsed_time": "2:55:51", "remaining_time": "1:42:56", "throughput": 2315.04, "total_tokens": 24426088} {"current_steps": 42355, "total_steps": 67140, "loss": 0.5414, "lr": 1.8039377689846427e-05, "epoch": 6.308459934465296, "percentage": 63.08, "elapsed_time": "2:55:52", "remaining_time": "1:42:54", "throughput": 2315.08, "total_tokens": 24429224} {"current_steps": 42360, "total_steps": 67140, "loss": 0.6232, "lr": 1.8033136059405826e-05, "epoch": 6.309204647006256, "percentage": 63.09, "elapsed_time": "2:55:53", "remaining_time": "1:42:53", "throughput": 2315.12, "total_tokens": 24432296} {"current_steps": 42365, "total_steps": 67140, "loss": 0.508, "lr": 1.8026894899757562e-05, "epoch": 6.309949359547215, "percentage": 63.1, "elapsed_time": "2:55:54", "remaining_time": "1:42:52", "throughput": 2315.15, "total_tokens": 24435240} {"current_steps": 42370, "total_steps": 67140, "loss": 0.6747, "lr": 1.8020654211323396e-05, "epoch": 6.310694072088174, "percentage": 63.11, "elapsed_time": "2:55:55", "remaining_time": "1:42:50", "throughput": 2315.16, "total_tokens": 24437992} {"current_steps": 42375, "total_steps": 67140, "loss": 0.5784, "lr": 1.8014413994525036e-05, "epoch": 6.311438784629133, "percentage": 63.11, "elapsed_time": "2:55:56", "remaining_time": "1:42:49", "throughput": 2315.18, "total_tokens": 24440712} {"current_steps": 42380, "total_steps": 67140, "loss": 0.4788, "lr": 1.8008174249784175e-05, "epoch": 6.312183497170093, "percentage": 63.12, "elapsed_time": "2:55:57", "remaining_time": "1:42:48", "throughput": 2315.2, "total_tokens": 24443496} {"current_steps": 42385, "total_steps": 67140, "loss": 0.5174, "lr": 1.8001934977522477e-05, "epoch": 6.3129282097110515, "percentage": 63.13, "elapsed_time": "2:55:59", "remaining_time": "1:42:47", "throughput": 2315.24, "total_tokens": 24446728} {"current_steps": 42390, "total_steps": 67140, "loss": 0.7158, "lr": 1.799569617816156e-05, "epoch": 6.31367292225201, "percentage": 63.14, "elapsed_time": "2:56:00", "remaining_time": "1:42:45", "throughput": 2315.27, "total_tokens": 24449608} {"current_steps": 42395, "total_steps": 67140, "loss": 0.6569, "lr": 1.7989457852123026e-05, "epoch": 6.31441763479297, "percentage": 63.14, "elapsed_time": "2:56:01", "remaining_time": "1:42:44", "throughput": 2315.3, "total_tokens": 24452712} {"current_steps": 42400, "total_steps": 67140, "loss": 0.749, "lr": 1.7983219999828417e-05, "epoch": 6.31516234733393, "percentage": 63.15, "elapsed_time": "2:56:02", "remaining_time": "1:42:43", "throughput": 2315.32, "total_tokens": 24455496} {"current_steps": 42405, "total_steps": 67140, "loss": 0.6081, "lr": 1.7976982621699278e-05, "epoch": 6.315907059874888, "percentage": 63.16, "elapsed_time": "2:56:03", "remaining_time": "1:42:41", "throughput": 2315.35, "total_tokens": 24458376} {"current_steps": 42410, "total_steps": 67140, "loss": 0.5662, "lr": 1.7970745718157095e-05, "epoch": 6.316651772415847, "percentage": 63.17, "elapsed_time": "2:56:04", "remaining_time": "1:42:40", "throughput": 2315.35, "total_tokens": 24461032} {"current_steps": 42415, "total_steps": 67140, "loss": 0.6752, "lr": 1.7964509289623335e-05, "epoch": 6.317396484956807, "percentage": 63.17, "elapsed_time": "2:56:05", "remaining_time": "1:42:39", "throughput": 2315.39, "total_tokens": 24464104} {"current_steps": 42420, "total_steps": 67140, "loss": 0.665, "lr": 1.795827333651944e-05, "epoch": 6.3181411974977655, "percentage": 63.18, "elapsed_time": "2:56:07", "remaining_time": "1:42:37", "throughput": 2315.43, "total_tokens": 24467368} {"current_steps": 42425, "total_steps": 67140, "loss": 0.5474, "lr": 1.7952037859266795e-05, "epoch": 6.318885910038725, "percentage": 63.19, "elapsed_time": "2:56:08", "remaining_time": "1:42:36", "throughput": 2315.45, "total_tokens": 24470184} {"current_steps": 42430, "total_steps": 67140, "loss": 0.4879, "lr": 1.7945802858286782e-05, "epoch": 6.319630622579684, "percentage": 63.2, "elapsed_time": "2:56:09", "remaining_time": "1:42:35", "throughput": 2315.48, "total_tokens": 24473192} {"current_steps": 42435, "total_steps": 67140, "loss": 0.7711, "lr": 1.793956833400074e-05, "epoch": 6.3203753351206435, "percentage": 63.2, "elapsed_time": "2:56:10", "remaining_time": "1:42:33", "throughput": 2315.49, "total_tokens": 24475880} {"current_steps": 42440, "total_steps": 67140, "loss": 0.5731, "lr": 1.793333428682996e-05, "epoch": 6.321120047661602, "percentage": 63.21, "elapsed_time": "2:56:11", "remaining_time": "1:42:32", "throughput": 2315.53, "total_tokens": 24478952} {"current_steps": 42445, "total_steps": 67140, "loss": 0.6247, "lr": 1.7927100717195712e-05, "epoch": 6.321864760202562, "percentage": 63.22, "elapsed_time": "2:56:12", "remaining_time": "1:42:31", "throughput": 2315.54, "total_tokens": 24481608} {"current_steps": 42450, "total_steps": 67140, "loss": 0.6831, "lr": 1.792086762551924e-05, "epoch": 6.322609472743521, "percentage": 63.23, "elapsed_time": "2:56:13", "remaining_time": "1:42:30", "throughput": 2315.58, "total_tokens": 24484744} {"current_steps": 42455, "total_steps": 67140, "loss": 0.7116, "lr": 1.791463501222176e-05, "epoch": 6.32335418528448, "percentage": 63.23, "elapsed_time": "2:56:15", "remaining_time": "1:42:28", "throughput": 2315.61, "total_tokens": 24487720} {"current_steps": 42460, "total_steps": 67140, "loss": 0.5102, "lr": 1.790840287772443e-05, "epoch": 6.324098897825439, "percentage": 63.24, "elapsed_time": "2:56:16", "remaining_time": "1:42:27", "throughput": 2315.64, "total_tokens": 24490792} {"current_steps": 42465, "total_steps": 67140, "loss": 0.5375, "lr": 1.79021712224484e-05, "epoch": 6.324843610366399, "percentage": 63.25, "elapsed_time": "2:56:17", "remaining_time": "1:42:26", "throughput": 2315.66, "total_tokens": 24493512} {"current_steps": 42470, "total_steps": 67140, "loss": 0.5011, "lr": 1.789594004681479e-05, "epoch": 6.3255883229073575, "percentage": 63.26, "elapsed_time": "2:56:18", "remaining_time": "1:42:24", "throughput": 2315.68, "total_tokens": 24496360} {"current_steps": 42475, "total_steps": 67140, "loss": 0.4772, "lr": 1.7889709351244675e-05, "epoch": 6.326333035448317, "percentage": 63.26, "elapsed_time": "2:56:19", "remaining_time": "1:42:23", "throughput": 2315.69, "total_tokens": 24499112} {"current_steps": 42480, "total_steps": 67140, "loss": 0.4267, "lr": 1.788347913615908e-05, "epoch": 6.327077747989276, "percentage": 63.27, "elapsed_time": "2:56:20", "remaining_time": "1:42:22", "throughput": 2315.72, "total_tokens": 24501992} {"current_steps": 42485, "total_steps": 67140, "loss": 0.5801, "lr": 1.7877249401979034e-05, "epoch": 6.327822460530236, "percentage": 63.28, "elapsed_time": "2:56:21", "remaining_time": "1:42:20", "throughput": 2315.74, "total_tokens": 24504808} {"current_steps": 42490, "total_steps": 67140, "loss": 0.6927, "lr": 1.7871020149125517e-05, "epoch": 6.328567173071194, "percentage": 63.29, "elapsed_time": "2:56:22", "remaining_time": "1:42:19", "throughput": 2315.76, "total_tokens": 24507560} {"current_steps": 42495, "total_steps": 67140, "loss": 0.7334, "lr": 1.786479137801947e-05, "epoch": 6.329311885612154, "percentage": 63.29, "elapsed_time": "2:56:24", "remaining_time": "1:42:18", "throughput": 2315.77, "total_tokens": 24510344} {"current_steps": 42500, "total_steps": 67140, "loss": 0.6648, "lr": 1.7858563089081812e-05, "epoch": 6.330056598153113, "percentage": 63.3, "elapsed_time": "2:56:25", "remaining_time": "1:42:16", "throughput": 2315.8, "total_tokens": 24513288} {"current_steps": 42505, "total_steps": 67140, "loss": 0.4627, "lr": 1.7852335282733432e-05, "epoch": 6.330801310694072, "percentage": 63.31, "elapsed_time": "2:56:26", "remaining_time": "1:42:15", "throughput": 2315.8, "total_tokens": 24515880} {"current_steps": 42510, "total_steps": 67140, "loss": 0.5864, "lr": 1.7846107959395165e-05, "epoch": 6.331546023235031, "percentage": 63.32, "elapsed_time": "2:56:27", "remaining_time": "1:42:14", "throughput": 2315.84, "total_tokens": 24518952} {"current_steps": 42515, "total_steps": 67140, "loss": 0.3786, "lr": 1.783988111948785e-05, "epoch": 6.332290735775991, "percentage": 63.32, "elapsed_time": "2:56:28", "remaining_time": "1:42:13", "throughput": 2315.87, "total_tokens": 24521896} {"current_steps": 42520, "total_steps": 67140, "loss": 0.5949, "lr": 1.7833654763432245e-05, "epoch": 6.3330354483169495, "percentage": 63.33, "elapsed_time": "2:56:29", "remaining_time": "1:42:11", "throughput": 2315.89, "total_tokens": 24524744} {"current_steps": 42525, "total_steps": 67140, "loss": 0.351, "lr": 1.782742889164912e-05, "epoch": 6.333780160857909, "percentage": 63.34, "elapsed_time": "2:56:30", "remaining_time": "1:42:10", "throughput": 2315.9, "total_tokens": 24527432} {"current_steps": 42530, "total_steps": 67140, "loss": 0.743, "lr": 1.7821203504559186e-05, "epoch": 6.334524873398868, "percentage": 63.35, "elapsed_time": "2:56:32", "remaining_time": "1:42:09", "throughput": 2315.92, "total_tokens": 24530280} {"current_steps": 42535, "total_steps": 67140, "loss": 0.5119, "lr": 1.7814978602583136e-05, "epoch": 6.335269585939828, "percentage": 63.35, "elapsed_time": "2:56:33", "remaining_time": "1:42:07", "throughput": 2315.94, "total_tokens": 24533000} {"current_steps": 42540, "total_steps": 67140, "loss": 0.733, "lr": 1.7808754186141618e-05, "epoch": 6.336014298480786, "percentage": 63.36, "elapsed_time": "2:56:34", "remaining_time": "1:42:06", "throughput": 2315.96, "total_tokens": 24535784} {"current_steps": 42545, "total_steps": 67140, "loss": 0.7186, "lr": 1.780253025565525e-05, "epoch": 6.336759011021746, "percentage": 63.37, "elapsed_time": "2:56:35", "remaining_time": "1:42:05", "throughput": 2315.99, "total_tokens": 24538760} {"current_steps": 42550, "total_steps": 67140, "loss": 0.7014, "lr": 1.7796306811544632e-05, "epoch": 6.337503723562705, "percentage": 63.38, "elapsed_time": "2:56:36", "remaining_time": "1:42:03", "throughput": 2316.02, "total_tokens": 24541800} {"current_steps": 42555, "total_steps": 67140, "loss": 0.6005, "lr": 1.779008385423031e-05, "epoch": 6.338248436103664, "percentage": 63.38, "elapsed_time": "2:56:37", "remaining_time": "1:42:02", "throughput": 2316.05, "total_tokens": 24544712} {"current_steps": 42560, "total_steps": 67140, "loss": 0.4923, "lr": 1.778386138413281e-05, "epoch": 6.338993148644623, "percentage": 63.39, "elapsed_time": "2:56:38", "remaining_time": "1:42:01", "throughput": 2316.09, "total_tokens": 24547816} {"current_steps": 42565, "total_steps": 67140, "loss": 0.5259, "lr": 1.7777639401672613e-05, "epoch": 6.339737861185583, "percentage": 63.4, "elapsed_time": "2:56:39", "remaining_time": "1:41:59", "throughput": 2316.12, "total_tokens": 24550792} {"current_steps": 42570, "total_steps": 67140, "loss": 0.5175, "lr": 1.7771417907270187e-05, "epoch": 6.340482573726542, "percentage": 63.4, "elapsed_time": "2:56:41", "remaining_time": "1:41:58", "throughput": 2316.14, "total_tokens": 24553672} {"current_steps": 42575, "total_steps": 67140, "loss": 0.5629, "lr": 1.7765196901345946e-05, "epoch": 6.3412272862675, "percentage": 63.41, "elapsed_time": "2:56:42", "remaining_time": "1:41:57", "throughput": 2316.16, "total_tokens": 24556456} {"current_steps": 42580, "total_steps": 67140, "loss": 0.6164, "lr": 1.775897638432028e-05, "epoch": 6.34197199880846, "percentage": 63.42, "elapsed_time": "2:56:43", "remaining_time": "1:41:56", "throughput": 2316.19, "total_tokens": 24559528} {"current_steps": 42585, "total_steps": 67140, "loss": 0.8189, "lr": 1.775275635661356e-05, "epoch": 6.342716711349419, "percentage": 63.43, "elapsed_time": "2:56:44", "remaining_time": "1:41:54", "throughput": 2316.2, "total_tokens": 24562152} {"current_steps": 42590, "total_steps": 67140, "loss": 0.5744, "lr": 1.774653681864609e-05, "epoch": 6.343461423890378, "percentage": 63.43, "elapsed_time": "2:56:45", "remaining_time": "1:41:53", "throughput": 2316.22, "total_tokens": 24565000} {"current_steps": 42595, "total_steps": 67140, "loss": 0.3849, "lr": 1.7740317770838173e-05, "epoch": 6.344206136431337, "percentage": 63.44, "elapsed_time": "2:56:46", "remaining_time": "1:41:52", "throughput": 2316.25, "total_tokens": 24567880} {"current_steps": 42600, "total_steps": 67140, "loss": 0.4465, "lr": 1.7734099213610075e-05, "epoch": 6.344950848972297, "percentage": 63.45, "elapsed_time": "2:56:47", "remaining_time": "1:41:50", "throughput": 2316.27, "total_tokens": 24570728} {"current_steps": 42605, "total_steps": 67140, "loss": 0.5, "lr": 1.772788114738201e-05, "epoch": 6.3456955615132555, "percentage": 63.46, "elapsed_time": "2:56:49", "remaining_time": "1:41:49", "throughput": 2316.29, "total_tokens": 24573576} {"current_steps": 42610, "total_steps": 67140, "loss": 0.814, "lr": 1.772166357257416e-05, "epoch": 6.346440274054215, "percentage": 63.46, "elapsed_time": "2:56:50", "remaining_time": "1:41:48", "throughput": 2316.31, "total_tokens": 24576392} {"current_steps": 42615, "total_steps": 67140, "loss": 0.6933, "lr": 1.7715446489606696e-05, "epoch": 6.347184986595174, "percentage": 63.47, "elapsed_time": "2:56:51", "remaining_time": "1:41:46", "throughput": 2316.33, "total_tokens": 24579144} {"current_steps": 42620, "total_steps": 67140, "loss": 0.5972, "lr": 1.770922989889975e-05, "epoch": 6.347929699136134, "percentage": 63.48, "elapsed_time": "2:56:52", "remaining_time": "1:41:45", "throughput": 2316.36, "total_tokens": 24582184} {"current_steps": 42625, "total_steps": 67140, "loss": 0.7414, "lr": 1.7703013800873398e-05, "epoch": 6.348674411677092, "percentage": 63.49, "elapsed_time": "2:56:53", "remaining_time": "1:41:44", "throughput": 2316.38, "total_tokens": 24584936} {"current_steps": 42630, "total_steps": 67140, "loss": 0.5657, "lr": 1.7696798195947704e-05, "epoch": 6.349419124218052, "percentage": 63.49, "elapsed_time": "2:56:54", "remaining_time": "1:41:42", "throughput": 2316.39, "total_tokens": 24587720} {"current_steps": 42635, "total_steps": 67140, "loss": 0.5316, "lr": 1.76905830845427e-05, "epoch": 6.350163836759011, "percentage": 63.5, "elapsed_time": "2:56:55", "remaining_time": "1:41:41", "throughput": 2316.41, "total_tokens": 24590600} {"current_steps": 42640, "total_steps": 67140, "loss": 0.499, "lr": 1.7684368467078384e-05, "epoch": 6.35090854929997, "percentage": 63.51, "elapsed_time": "2:56:56", "remaining_time": "1:41:40", "throughput": 2316.45, "total_tokens": 24593608} {"current_steps": 42645, "total_steps": 67140, "loss": 0.5224, "lr": 1.7678154343974686e-05, "epoch": 6.351653261840929, "percentage": 63.52, "elapsed_time": "2:56:58", "remaining_time": "1:41:38", "throughput": 2316.47, "total_tokens": 24596456} {"current_steps": 42650, "total_steps": 67140, "loss": 0.5581, "lr": 1.7671940715651553e-05, "epoch": 6.352397974381889, "percentage": 63.52, "elapsed_time": "2:56:59", "remaining_time": "1:41:37", "throughput": 2316.49, "total_tokens": 24599240} {"current_steps": 42655, "total_steps": 67140, "loss": 0.6515, "lr": 1.7665727582528878e-05, "epoch": 6.353142686922848, "percentage": 63.53, "elapsed_time": "2:57:00", "remaining_time": "1:41:36", "throughput": 2316.5, "total_tokens": 24601992} {"current_steps": 42660, "total_steps": 67140, "loss": 0.6996, "lr": 1.7659514945026508e-05, "epoch": 6.353887399463807, "percentage": 63.54, "elapsed_time": "2:57:01", "remaining_time": "1:41:34", "throughput": 2316.5, "total_tokens": 24604584} {"current_steps": 42665, "total_steps": 67140, "loss": 0.7638, "lr": 1.7653302803564275e-05, "epoch": 6.354632112004766, "percentage": 63.55, "elapsed_time": "2:57:02", "remaining_time": "1:41:33", "throughput": 2316.54, "total_tokens": 24607624} {"current_steps": 42670, "total_steps": 67140, "loss": 0.5463, "lr": 1.7647091158561974e-05, "epoch": 6.355376824545726, "percentage": 63.55, "elapsed_time": "2:57:03", "remaining_time": "1:41:32", "throughput": 2316.55, "total_tokens": 24610344} {"current_steps": 42675, "total_steps": 67140, "loss": 0.8104, "lr": 1.764088001043935e-05, "epoch": 6.356121537086684, "percentage": 63.56, "elapsed_time": "2:57:04", "remaining_time": "1:41:31", "throughput": 2316.57, "total_tokens": 24613160} {"current_steps": 42680, "total_steps": 67140, "loss": 0.5687, "lr": 1.763466935961615e-05, "epoch": 6.356866249627644, "percentage": 63.57, "elapsed_time": "2:57:06", "remaining_time": "1:41:29", "throughput": 2316.6, "total_tokens": 24616232} {"current_steps": 42685, "total_steps": 67140, "loss": 0.5587, "lr": 1.7628459206512033e-05, "epoch": 6.357610962168603, "percentage": 63.58, "elapsed_time": "2:57:07", "remaining_time": "1:41:28", "throughput": 2316.63, "total_tokens": 24619240} {"current_steps": 42690, "total_steps": 67140, "loss": 0.5389, "lr": 1.7622249551546682e-05, "epoch": 6.358355674709562, "percentage": 63.58, "elapsed_time": "2:57:08", "remaining_time": "1:41:27", "throughput": 2316.66, "total_tokens": 24622120} {"current_steps": 42695, "total_steps": 67140, "loss": 0.554, "lr": 1.7616040395139706e-05, "epoch": 6.359100387250521, "percentage": 63.59, "elapsed_time": "2:57:09", "remaining_time": "1:41:25", "throughput": 2316.71, "total_tokens": 24625448} {"current_steps": 42700, "total_steps": 67140, "loss": 0.557, "lr": 1.76098317377107e-05, "epoch": 6.359845099791481, "percentage": 63.6, "elapsed_time": "2:57:10", "remaining_time": "1:41:24", "throughput": 2316.74, "total_tokens": 24628392} {"current_steps": 42705, "total_steps": 67140, "loss": 0.5709, "lr": 1.7603623579679217e-05, "epoch": 6.36058981233244, "percentage": 63.61, "elapsed_time": "2:57:11", "remaining_time": "1:41:23", "throughput": 2316.73, "total_tokens": 24630920} {"current_steps": 42710, "total_steps": 67140, "loss": 0.9452, "lr": 1.759741592146478e-05, "epoch": 6.361334524873399, "percentage": 63.61, "elapsed_time": "2:57:12", "remaining_time": "1:41:21", "throughput": 2316.76, "total_tokens": 24633800} {"current_steps": 42715, "total_steps": 67140, "loss": 0.7875, "lr": 1.7591208763486883e-05, "epoch": 6.362079237414358, "percentage": 63.62, "elapsed_time": "2:57:14", "remaining_time": "1:41:20", "throughput": 2316.78, "total_tokens": 24636744} {"current_steps": 42720, "total_steps": 67140, "loss": 0.5634, "lr": 1.7585002106164976e-05, "epoch": 6.362823949955318, "percentage": 63.63, "elapsed_time": "2:57:15", "remaining_time": "1:41:19", "throughput": 2316.8, "total_tokens": 24639528} {"current_steps": 42725, "total_steps": 67140, "loss": 0.7566, "lr": 1.757879594991848e-05, "epoch": 6.363568662496276, "percentage": 63.64, "elapsed_time": "2:57:16", "remaining_time": "1:41:18", "throughput": 2316.83, "total_tokens": 24642408} {"current_steps": 42730, "total_steps": 67140, "loss": 0.4211, "lr": 1.757259029516678e-05, "epoch": 6.364313375037236, "percentage": 63.64, "elapsed_time": "2:57:17", "remaining_time": "1:41:16", "throughput": 2316.85, "total_tokens": 24645224} {"current_steps": 42735, "total_steps": 67140, "loss": 0.5129, "lr": 1.7566385142329227e-05, "epoch": 6.365058087578195, "percentage": 63.65, "elapsed_time": "2:57:18", "remaining_time": "1:41:15", "throughput": 2316.86, "total_tokens": 24648040} {"current_steps": 42740, "total_steps": 67140, "loss": 0.5035, "lr": 1.7560180491825144e-05, "epoch": 6.365802800119154, "percentage": 63.66, "elapsed_time": "2:57:19", "remaining_time": "1:41:14", "throughput": 2316.9, "total_tokens": 24651048} {"current_steps": 42745, "total_steps": 67140, "loss": 0.6886, "lr": 1.7553976344073815e-05, "epoch": 6.366547512660113, "percentage": 63.67, "elapsed_time": "2:57:20", "remaining_time": "1:41:12", "throughput": 2316.91, "total_tokens": 24653800} {"current_steps": 42750, "total_steps": 67140, "loss": 0.5168, "lr": 1.7547772699494494e-05, "epoch": 6.367292225201073, "percentage": 63.67, "elapsed_time": "2:57:21", "remaining_time": "1:41:11", "throughput": 2316.94, "total_tokens": 24656744} {"current_steps": 42755, "total_steps": 67140, "loss": 0.5791, "lr": 1.7541569558506393e-05, "epoch": 6.368036937742032, "percentage": 63.68, "elapsed_time": "2:57:23", "remaining_time": "1:41:10", "throughput": 2316.95, "total_tokens": 24659432} {"current_steps": 42760, "total_steps": 67140, "loss": 0.667, "lr": 1.7535366921528707e-05, "epoch": 6.36878165028299, "percentage": 63.69, "elapsed_time": "2:57:24", "remaining_time": "1:41:08", "throughput": 2316.99, "total_tokens": 24662536} {"current_steps": 42765, "total_steps": 67140, "loss": 0.5971, "lr": 1.752916478898056e-05, "epoch": 6.36952636282395, "percentage": 63.7, "elapsed_time": "2:57:25", "remaining_time": "1:41:07", "throughput": 2317.0, "total_tokens": 24665320} {"current_steps": 42770, "total_steps": 67140, "loss": 0.6411, "lr": 1.7522963161281094e-05, "epoch": 6.370271075364909, "percentage": 63.7, "elapsed_time": "2:57:26", "remaining_time": "1:41:06", "throughput": 2317.03, "total_tokens": 24668168} {"current_steps": 42775, "total_steps": 67140, "loss": 0.5432, "lr": 1.751676203884937e-05, "epoch": 6.371015787905868, "percentage": 63.71, "elapsed_time": "2:57:27", "remaining_time": "1:41:04", "throughput": 2317.03, "total_tokens": 24670824} {"current_steps": 42780, "total_steps": 67140, "loss": 0.6153, "lr": 1.7510561422104444e-05, "epoch": 6.371760500446827, "percentage": 63.72, "elapsed_time": "2:57:28", "remaining_time": "1:41:03", "throughput": 2317.04, "total_tokens": 24673448} {"current_steps": 42785, "total_steps": 67140, "loss": 0.7374, "lr": 1.7504361311465332e-05, "epoch": 6.372505212987787, "percentage": 63.73, "elapsed_time": "2:57:29", "remaining_time": "1:41:02", "throughput": 2317.06, "total_tokens": 24676200} {"current_steps": 42790, "total_steps": 67140, "loss": 0.5945, "lr": 1.7498161707351005e-05, "epoch": 6.373249925528746, "percentage": 63.73, "elapsed_time": "2:57:30", "remaining_time": "1:41:01", "throughput": 2317.09, "total_tokens": 24679208} {"current_steps": 42795, "total_steps": 67140, "loss": 0.5267, "lr": 1.7491962610180408e-05, "epoch": 6.373994638069705, "percentage": 63.74, "elapsed_time": "2:57:32", "remaining_time": "1:40:59", "throughput": 2317.1, "total_tokens": 24681896} {"current_steps": 42800, "total_steps": 67140, "loss": 0.4482, "lr": 1.748576402037246e-05, "epoch": 6.374739350610664, "percentage": 63.75, "elapsed_time": "2:57:33", "remaining_time": "1:40:58", "throughput": 2317.13, "total_tokens": 24684904} {"current_steps": 42805, "total_steps": 67140, "loss": 0.5305, "lr": 1.7479565938346025e-05, "epoch": 6.375484063151624, "percentage": 63.75, "elapsed_time": "2:57:34", "remaining_time": "1:40:57", "throughput": 2317.15, "total_tokens": 24687752} {"current_steps": 42810, "total_steps": 67140, "loss": 0.6273, "lr": 1.7473368364519945e-05, "epoch": 6.376228775692582, "percentage": 63.76, "elapsed_time": "2:57:35", "remaining_time": "1:40:55", "throughput": 2317.16, "total_tokens": 24690344} {"current_steps": 42815, "total_steps": 67140, "loss": 0.7261, "lr": 1.746717129931303e-05, "epoch": 6.376973488233542, "percentage": 63.77, "elapsed_time": "2:57:36", "remaining_time": "1:40:54", "throughput": 2317.2, "total_tokens": 24693320} {"current_steps": 42820, "total_steps": 67140, "loss": 0.4955, "lr": 1.7460974743144055e-05, "epoch": 6.377718200774501, "percentage": 63.78, "elapsed_time": "2:57:37", "remaining_time": "1:40:53", "throughput": 2317.22, "total_tokens": 24696200} {"current_steps": 42825, "total_steps": 67140, "loss": 0.6609, "lr": 1.7454778696431747e-05, "epoch": 6.3784629133154604, "percentage": 63.78, "elapsed_time": "2:57:38", "remaining_time": "1:40:51", "throughput": 2317.25, "total_tokens": 24699240} {"current_steps": 42830, "total_steps": 67140, "loss": 0.675, "lr": 1.7448583159594822e-05, "epoch": 6.379207625856419, "percentage": 63.79, "elapsed_time": "2:57:40", "remaining_time": "1:40:50", "throughput": 2317.27, "total_tokens": 24702120} {"current_steps": 42835, "total_steps": 67140, "loss": 0.3186, "lr": 1.744238813305195e-05, "epoch": 6.379952338397379, "percentage": 63.8, "elapsed_time": "2:57:41", "remaining_time": "1:40:49", "throughput": 2317.3, "total_tokens": 24705096} {"current_steps": 42840, "total_steps": 67140, "loss": 0.6412, "lr": 1.743619361722177e-05, "epoch": 6.380697050938338, "percentage": 63.81, "elapsed_time": "2:57:42", "remaining_time": "1:40:47", "throughput": 2317.32, "total_tokens": 24708008} {"current_steps": 42845, "total_steps": 67140, "loss": 0.6126, "lr": 1.7429999612522858e-05, "epoch": 6.381441763479297, "percentage": 63.81, "elapsed_time": "2:57:43", "remaining_time": "1:40:46", "throughput": 2317.37, "total_tokens": 24711368} {"current_steps": 42850, "total_steps": 67140, "loss": 0.6197, "lr": 1.7423806119373794e-05, "epoch": 6.382186476020256, "percentage": 63.82, "elapsed_time": "2:57:44", "remaining_time": "1:40:45", "throughput": 2317.38, "total_tokens": 24714056} {"current_steps": 42855, "total_steps": 67140, "loss": 0.6836, "lr": 1.7417613138193117e-05, "epoch": 6.382931188561216, "percentage": 63.83, "elapsed_time": "2:57:45", "remaining_time": "1:40:44", "throughput": 2317.4, "total_tokens": 24716904} {"current_steps": 42860, "total_steps": 67140, "loss": 0.5878, "lr": 1.7411420669399315e-05, "epoch": 6.383675901102174, "percentage": 63.84, "elapsed_time": "2:57:46", "remaining_time": "1:40:42", "throughput": 2317.41, "total_tokens": 24719624} {"current_steps": 42865, "total_steps": 67140, "loss": 0.6919, "lr": 1.740522871341085e-05, "epoch": 6.384420613643134, "percentage": 63.84, "elapsed_time": "2:57:48", "remaining_time": "1:40:41", "throughput": 2317.45, "total_tokens": 24722760} {"current_steps": 42870, "total_steps": 67140, "loss": 0.5713, "lr": 1.739903727064615e-05, "epoch": 6.385165326184093, "percentage": 63.85, "elapsed_time": "2:57:49", "remaining_time": "1:40:40", "throughput": 2317.47, "total_tokens": 24725576} {"current_steps": 42875, "total_steps": 67140, "loss": 0.4464, "lr": 1.7392846341523606e-05, "epoch": 6.3859100387250525, "percentage": 63.86, "elapsed_time": "2:57:50", "remaining_time": "1:40:38", "throughput": 2317.49, "total_tokens": 24728392} {"current_steps": 42880, "total_steps": 67140, "loss": 0.6693, "lr": 1.7386655926461586e-05, "epoch": 6.386654751266011, "percentage": 63.87, "elapsed_time": "2:57:51", "remaining_time": "1:40:37", "throughput": 2317.5, "total_tokens": 24731016} {"current_steps": 42885, "total_steps": 67140, "loss": 0.6262, "lr": 1.73804660258784e-05, "epoch": 6.387399463806971, "percentage": 63.87, "elapsed_time": "2:57:52", "remaining_time": "1:40:36", "throughput": 2317.53, "total_tokens": 24733928} {"current_steps": 42890, "total_steps": 67140, "loss": 0.6161, "lr": 1.737427664019234e-05, "epoch": 6.38814417634793, "percentage": 63.88, "elapsed_time": "2:57:53", "remaining_time": "1:40:34", "throughput": 2317.57, "total_tokens": 24737096} {"current_steps": 42895, "total_steps": 67140, "loss": 0.4327, "lr": 1.736808776982166e-05, "epoch": 6.388888888888889, "percentage": 63.89, "elapsed_time": "2:57:54", "remaining_time": "1:40:33", "throughput": 2317.57, "total_tokens": 24739624} {"current_steps": 42900, "total_steps": 67140, "loss": 0.5965, "lr": 1.7361899415184584e-05, "epoch": 6.389633601429848, "percentage": 63.9, "elapsed_time": "2:57:55", "remaining_time": "1:40:32", "throughput": 2317.6, "total_tokens": 24742664} {"current_steps": 42905, "total_steps": 67140, "loss": 0.7237, "lr": 1.7355711576699286e-05, "epoch": 6.390378313970807, "percentage": 63.9, "elapsed_time": "2:57:57", "remaining_time": "1:40:31", "throughput": 2317.62, "total_tokens": 24745544} {"current_steps": 42910, "total_steps": 67140, "loss": 0.6132, "lr": 1.734952425478392e-05, "epoch": 6.3911230265117664, "percentage": 63.91, "elapsed_time": "2:57:58", "remaining_time": "1:40:29", "throughput": 2317.63, "total_tokens": 24748200} {"current_steps": 42915, "total_steps": 67140, "loss": 0.6051, "lr": 1.7343337449856605e-05, "epoch": 6.391867739052726, "percentage": 63.92, "elapsed_time": "2:57:59", "remaining_time": "1:40:28", "throughput": 2317.66, "total_tokens": 24751112} {"current_steps": 42920, "total_steps": 67140, "loss": 0.6077, "lr": 1.733715116233542e-05, "epoch": 6.392612451593685, "percentage": 63.93, "elapsed_time": "2:58:00", "remaining_time": "1:40:27", "throughput": 2317.69, "total_tokens": 24754216} {"current_steps": 42925, "total_steps": 67140, "loss": 0.68, "lr": 1.7330965392638394e-05, "epoch": 6.393357164134644, "percentage": 63.93, "elapsed_time": "2:58:01", "remaining_time": "1:40:25", "throughput": 2317.72, "total_tokens": 24757160} {"current_steps": 42930, "total_steps": 67140, "loss": 0.7612, "lr": 1.732478014118355e-05, "epoch": 6.394101876675603, "percentage": 63.94, "elapsed_time": "2:58:02", "remaining_time": "1:40:24", "throughput": 2317.75, "total_tokens": 24760104} {"current_steps": 42935, "total_steps": 67140, "loss": 0.7128, "lr": 1.7318595408388862e-05, "epoch": 6.394846589216562, "percentage": 63.95, "elapsed_time": "2:58:03", "remaining_time": "1:40:23", "throughput": 2317.76, "total_tokens": 24762824} {"current_steps": 42940, "total_steps": 67140, "loss": 0.5183, "lr": 1.7312411194672258e-05, "epoch": 6.395591301757522, "percentage": 63.96, "elapsed_time": "2:58:05", "remaining_time": "1:40:21", "throughput": 2317.78, "total_tokens": 24765576} {"current_steps": 42945, "total_steps": 67140, "loss": 0.8948, "lr": 1.7306227500451654e-05, "epoch": 6.39633601429848, "percentage": 63.96, "elapsed_time": "2:58:06", "remaining_time": "1:40:20", "throughput": 2317.79, "total_tokens": 24768328} {"current_steps": 42950, "total_steps": 67140, "loss": 0.678, "lr": 1.7300044326144918e-05, "epoch": 6.39708072683944, "percentage": 63.97, "elapsed_time": "2:58:07", "remaining_time": "1:40:19", "throughput": 2317.84, "total_tokens": 24771528} {"current_steps": 42955, "total_steps": 67140, "loss": 0.601, "lr": 1.7293861672169874e-05, "epoch": 6.397825439380399, "percentage": 63.98, "elapsed_time": "2:58:08", "remaining_time": "1:40:17", "throughput": 2317.85, "total_tokens": 24774216} {"current_steps": 42960, "total_steps": 67140, "loss": 0.5633, "lr": 1.728767953894434e-05, "epoch": 6.3985701519213585, "percentage": 63.99, "elapsed_time": "2:58:09", "remaining_time": "1:40:16", "throughput": 2317.87, "total_tokens": 24777096} {"current_steps": 42965, "total_steps": 67140, "loss": 0.5723, "lr": 1.728149792688606e-05, "epoch": 6.399314864462317, "percentage": 63.99, "elapsed_time": "2:58:10", "remaining_time": "1:40:15", "throughput": 2317.89, "total_tokens": 24779848} {"current_steps": 42970, "total_steps": 67140, "loss": 0.6487, "lr": 1.7275316836412768e-05, "epoch": 6.400059577003277, "percentage": 64.0, "elapsed_time": "2:58:11", "remaining_time": "1:40:14", "throughput": 2317.92, "total_tokens": 24782856} {"current_steps": 42975, "total_steps": 67140, "loss": 0.5419, "lr": 1.7269136267942155e-05, "epoch": 6.400804289544236, "percentage": 64.01, "elapsed_time": "2:58:12", "remaining_time": "1:40:12", "throughput": 2317.93, "total_tokens": 24785544} {"current_steps": 42980, "total_steps": 67140, "loss": 0.2866, "lr": 1.7262956221891882e-05, "epoch": 6.401549002085195, "percentage": 64.02, "elapsed_time": "2:58:14", "remaining_time": "1:40:11", "throughput": 2317.94, "total_tokens": 24788168} {"current_steps": 42985, "total_steps": 67140, "loss": 0.755, "lr": 1.7256776698679577e-05, "epoch": 6.402293714626154, "percentage": 64.02, "elapsed_time": "2:58:15", "remaining_time": "1:40:10", "throughput": 2317.96, "total_tokens": 24790952} {"current_steps": 42990, "total_steps": 67140, "loss": 0.6177, "lr": 1.7250597698722813e-05, "epoch": 6.403038427167114, "percentage": 64.03, "elapsed_time": "2:58:16", "remaining_time": "1:40:08", "throughput": 2317.98, "total_tokens": 24793800} {"current_steps": 42995, "total_steps": 67140, "loss": 0.6982, "lr": 1.7244419222439152e-05, "epoch": 6.4037831397080724, "percentage": 64.04, "elapsed_time": "2:58:17", "remaining_time": "1:40:07", "throughput": 2318.01, "total_tokens": 24796840} {"current_steps": 43000, "total_steps": 67140, "loss": 0.5926, "lr": 1.723824127024612e-05, "epoch": 6.404527852249032, "percentage": 64.05, "elapsed_time": "2:58:18", "remaining_time": "1:40:06", "throughput": 2318.03, "total_tokens": 24799720} {"current_steps": 43005, "total_steps": 67140, "loss": 0.6297, "lr": 1.723206384256118e-05, "epoch": 6.405272564789991, "percentage": 64.05, "elapsed_time": "2:58:19", "remaining_time": "1:40:04", "throughput": 2318.06, "total_tokens": 24802728} {"current_steps": 43010, "total_steps": 67140, "loss": 0.6487, "lr": 1.7225886939801773e-05, "epoch": 6.4060172773309505, "percentage": 64.06, "elapsed_time": "2:58:20", "remaining_time": "1:40:03", "throughput": 2318.08, "total_tokens": 24805576} {"current_steps": 43015, "total_steps": 67140, "loss": 0.6101, "lr": 1.7219710562385324e-05, "epoch": 6.406761989871909, "percentage": 64.07, "elapsed_time": "2:58:22", "remaining_time": "1:40:02", "throughput": 2318.1, "total_tokens": 24808328} {"current_steps": 43020, "total_steps": 67140, "loss": 0.5473, "lr": 1.7213534710729205e-05, "epoch": 6.407506702412869, "percentage": 64.08, "elapsed_time": "2:58:23", "remaining_time": "1:40:00", "throughput": 2318.12, "total_tokens": 24811208} {"current_steps": 43025, "total_steps": 67140, "loss": 0.5493, "lr": 1.7207359385250756e-05, "epoch": 6.408251414953828, "percentage": 64.08, "elapsed_time": "2:58:24", "remaining_time": "1:39:59", "throughput": 2318.13, "total_tokens": 24813896} {"current_steps": 43030, "total_steps": 67140, "loss": 0.5572, "lr": 1.7201184586367272e-05, "epoch": 6.408996127494787, "percentage": 64.09, "elapsed_time": "2:58:25", "remaining_time": "1:39:58", "throughput": 2318.15, "total_tokens": 24816744} {"current_steps": 43035, "total_steps": 67140, "loss": 0.6396, "lr": 1.7195010314496023e-05, "epoch": 6.409740840035746, "percentage": 64.1, "elapsed_time": "2:58:26", "remaining_time": "1:39:57", "throughput": 2318.18, "total_tokens": 24819624} {"current_steps": 43040, "total_steps": 67140, "loss": 0.7752, "lr": 1.718883657005426e-05, "epoch": 6.410485552576706, "percentage": 64.1, "elapsed_time": "2:58:27", "remaining_time": "1:39:55", "throughput": 2318.2, "total_tokens": 24822472} {"current_steps": 43045, "total_steps": 67140, "loss": 0.5599, "lr": 1.718266335345915e-05, "epoch": 6.4112302651176645, "percentage": 64.11, "elapsed_time": "2:58:28", "remaining_time": "1:39:54", "throughput": 2318.21, "total_tokens": 24825192} {"current_steps": 43050, "total_steps": 67140, "loss": 0.5057, "lr": 1.7176490665127868e-05, "epoch": 6.411974977658624, "percentage": 64.12, "elapsed_time": "2:58:29", "remaining_time": "1:39:53", "throughput": 2318.22, "total_tokens": 24827848} {"current_steps": 43055, "total_steps": 67140, "loss": 0.5971, "lr": 1.7170318505477543e-05, "epoch": 6.412719690199583, "percentage": 64.13, "elapsed_time": "2:58:31", "remaining_time": "1:39:51", "throughput": 2318.26, "total_tokens": 24830920} {"current_steps": 43060, "total_steps": 67140, "loss": 0.5519, "lr": 1.7164146874925254e-05, "epoch": 6.4134644027405425, "percentage": 64.13, "elapsed_time": "2:58:32", "remaining_time": "1:39:50", "throughput": 2318.27, "total_tokens": 24833672} {"current_steps": 43065, "total_steps": 67140, "loss": 0.5356, "lr": 1.715797577388807e-05, "epoch": 6.414209115281501, "percentage": 64.14, "elapsed_time": "2:58:33", "remaining_time": "1:39:49", "throughput": 2318.3, "total_tokens": 24836584} {"current_steps": 43070, "total_steps": 67140, "loss": 0.6418, "lr": 1.715180520278299e-05, "epoch": 6.414953827822461, "percentage": 64.15, "elapsed_time": "2:58:34", "remaining_time": "1:39:47", "throughput": 2318.31, "total_tokens": 24839336} {"current_steps": 43075, "total_steps": 67140, "loss": 0.5055, "lr": 1.7145635162027008e-05, "epoch": 6.41569854036342, "percentage": 64.16, "elapsed_time": "2:58:35", "remaining_time": "1:39:46", "throughput": 2318.32, "total_tokens": 24842024} {"current_steps": 43080, "total_steps": 67140, "loss": 0.7767, "lr": 1.7139465652037077e-05, "epoch": 6.416443252904379, "percentage": 64.16, "elapsed_time": "2:58:36", "remaining_time": "1:39:45", "throughput": 2318.35, "total_tokens": 24844936} {"current_steps": 43085, "total_steps": 67140, "loss": 0.6137, "lr": 1.7133296673230097e-05, "epoch": 6.417187965445338, "percentage": 64.17, "elapsed_time": "2:58:37", "remaining_time": "1:39:43", "throughput": 2318.36, "total_tokens": 24847560} {"current_steps": 43090, "total_steps": 67140, "loss": 0.6621, "lr": 1.7127128226022936e-05, "epoch": 6.417932677986297, "percentage": 64.18, "elapsed_time": "2:58:38", "remaining_time": "1:39:42", "throughput": 2318.4, "total_tokens": 24850760} {"current_steps": 43095, "total_steps": 67140, "loss": 0.6123, "lr": 1.7120960310832446e-05, "epoch": 6.4186773905272565, "percentage": 64.19, "elapsed_time": "2:58:40", "remaining_time": "1:39:41", "throughput": 2318.42, "total_tokens": 24853640} {"current_steps": 43100, "total_steps": 67140, "loss": 0.6678, "lr": 1.7114792928075422e-05, "epoch": 6.419422103068215, "percentage": 64.19, "elapsed_time": "2:58:41", "remaining_time": "1:39:39", "throughput": 2318.44, "total_tokens": 24856456} {"current_steps": 43105, "total_steps": 67140, "loss": 0.5935, "lr": 1.7108626078168634e-05, "epoch": 6.420166815609175, "percentage": 64.2, "elapsed_time": "2:58:42", "remaining_time": "1:39:38", "throughput": 2318.46, "total_tokens": 24859208} {"current_steps": 43110, "total_steps": 67140, "loss": 0.5834, "lr": 1.7102459761528812e-05, "epoch": 6.420911528150134, "percentage": 64.21, "elapsed_time": "2:58:43", "remaining_time": "1:39:37", "throughput": 2318.5, "total_tokens": 24862440} {"current_steps": 43115, "total_steps": 67140, "loss": 0.6409, "lr": 1.709629397857265e-05, "epoch": 6.421656240691093, "percentage": 64.22, "elapsed_time": "2:58:44", "remaining_time": "1:39:36", "throughput": 2318.52, "total_tokens": 24865320} {"current_steps": 43120, "total_steps": 67140, "loss": 0.7173, "lr": 1.7090128729716815e-05, "epoch": 6.422400953232052, "percentage": 64.22, "elapsed_time": "2:58:45", "remaining_time": "1:39:34", "throughput": 2318.54, "total_tokens": 24868168} {"current_steps": 43125, "total_steps": 67140, "loss": 0.5068, "lr": 1.708396401537791e-05, "epoch": 6.423145665773012, "percentage": 64.23, "elapsed_time": "2:58:46", "remaining_time": "1:39:33", "throughput": 2318.58, "total_tokens": 24871208} {"current_steps": 43130, "total_steps": 67140, "loss": 0.7112, "lr": 1.707779983597253e-05, "epoch": 6.4238903783139705, "percentage": 64.24, "elapsed_time": "2:58:48", "remaining_time": "1:39:32", "throughput": 2318.61, "total_tokens": 24874312} {"current_steps": 43135, "total_steps": 67140, "loss": 0.6101, "lr": 1.7071636191917238e-05, "epoch": 6.42463509085493, "percentage": 64.25, "elapsed_time": "2:58:49", "remaining_time": "1:39:30", "throughput": 2318.64, "total_tokens": 24877192} {"current_steps": 43140, "total_steps": 67140, "loss": 0.6186, "lr": 1.706547308362853e-05, "epoch": 6.425379803395889, "percentage": 64.25, "elapsed_time": "2:58:50", "remaining_time": "1:39:29", "throughput": 2318.66, "total_tokens": 24880040} {"current_steps": 43145, "total_steps": 67140, "loss": 0.6517, "lr": 1.705931051152289e-05, "epoch": 6.4261245159368485, "percentage": 64.26, "elapsed_time": "2:58:51", "remaining_time": "1:39:28", "throughput": 2318.67, "total_tokens": 24882760} {"current_steps": 43150, "total_steps": 67140, "loss": 0.5271, "lr": 1.7053148476016774e-05, "epoch": 6.426869228477807, "percentage": 64.27, "elapsed_time": "2:58:52", "remaining_time": "1:39:26", "throughput": 2318.68, "total_tokens": 24885480} {"current_steps": 43155, "total_steps": 67140, "loss": 0.503, "lr": 1.704698697752656e-05, "epoch": 6.427613941018767, "percentage": 64.28, "elapsed_time": "2:58:53", "remaining_time": "1:39:25", "throughput": 2318.72, "total_tokens": 24888648} {"current_steps": 43160, "total_steps": 67140, "loss": 0.6238, "lr": 1.7040826016468637e-05, "epoch": 6.428358653559726, "percentage": 64.28, "elapsed_time": "2:58:54", "remaining_time": "1:39:24", "throughput": 2318.74, "total_tokens": 24891496} {"current_steps": 43165, "total_steps": 67140, "loss": 0.6903, "lr": 1.7034665593259338e-05, "epoch": 6.429103366100685, "percentage": 64.29, "elapsed_time": "2:58:56", "remaining_time": "1:39:23", "throughput": 2318.76, "total_tokens": 24894280} {"current_steps": 43170, "total_steps": 67140, "loss": 0.635, "lr": 1.7028505708314953e-05, "epoch": 6.429848078641644, "percentage": 64.3, "elapsed_time": "2:58:57", "remaining_time": "1:39:21", "throughput": 2318.78, "total_tokens": 24897096} {"current_steps": 43175, "total_steps": 67140, "loss": 0.686, "lr": 1.702234636205173e-05, "epoch": 6.430592791182604, "percentage": 64.31, "elapsed_time": "2:58:58", "remaining_time": "1:39:20", "throughput": 2318.8, "total_tokens": 24899880} {"current_steps": 43180, "total_steps": 67140, "loss": 0.4624, "lr": 1.7016187554885916e-05, "epoch": 6.4313375037235625, "percentage": 64.31, "elapsed_time": "2:58:59", "remaining_time": "1:39:19", "throughput": 2318.83, "total_tokens": 24902984} {"current_steps": 43185, "total_steps": 67140, "loss": 0.6322, "lr": 1.7010029287233688e-05, "epoch": 6.432082216264522, "percentage": 64.32, "elapsed_time": "2:59:00", "remaining_time": "1:39:17", "throughput": 2318.85, "total_tokens": 24905736} {"current_steps": 43190, "total_steps": 67140, "loss": 0.5163, "lr": 1.7003871559511187e-05, "epoch": 6.432826928805481, "percentage": 64.33, "elapsed_time": "2:59:01", "remaining_time": "1:39:16", "throughput": 2318.85, "total_tokens": 24908328} {"current_steps": 43195, "total_steps": 67140, "loss": 0.6071, "lr": 1.6997714372134544e-05, "epoch": 6.4335716413464406, "percentage": 64.34, "elapsed_time": "2:59:02", "remaining_time": "1:39:15", "throughput": 2318.9, "total_tokens": 24911624} {"current_steps": 43200, "total_steps": 67140, "loss": 0.5904, "lr": 1.6991557725519824e-05, "epoch": 6.434316353887399, "percentage": 64.34, "elapsed_time": "2:59:03", "remaining_time": "1:39:13", "throughput": 2318.92, "total_tokens": 24914376} {"current_steps": 43205, "total_steps": 67140, "loss": 0.4967, "lr": 1.698540162008308e-05, "epoch": 6.435061066428359, "percentage": 64.35, "elapsed_time": "2:59:05", "remaining_time": "1:39:12", "throughput": 2318.94, "total_tokens": 24917224} {"current_steps": 43210, "total_steps": 67140, "loss": 0.537, "lr": 1.6979246056240305e-05, "epoch": 6.435805778969318, "percentage": 64.36, "elapsed_time": "2:59:06", "remaining_time": "1:39:11", "throughput": 2318.95, "total_tokens": 24919944} {"current_steps": 43215, "total_steps": 67140, "loss": 0.7014, "lr": 1.6973091034407468e-05, "epoch": 6.436550491510277, "percentage": 64.37, "elapsed_time": "2:59:07", "remaining_time": "1:39:09", "throughput": 2318.96, "total_tokens": 24922536} {"current_steps": 43220, "total_steps": 67140, "loss": 0.7961, "lr": 1.6966936555000507e-05, "epoch": 6.437295204051236, "percentage": 64.37, "elapsed_time": "2:59:08", "remaining_time": "1:39:08", "throughput": 2319.0, "total_tokens": 24925640} {"current_steps": 43225, "total_steps": 67140, "loss": 0.6209, "lr": 1.6960782618435312e-05, "epoch": 6.438039916592196, "percentage": 64.38, "elapsed_time": "2:59:09", "remaining_time": "1:39:07", "throughput": 2319.03, "total_tokens": 24928616} {"current_steps": 43230, "total_steps": 67140, "loss": 0.7477, "lr": 1.6954629225127745e-05, "epoch": 6.4387846291331545, "percentage": 64.39, "elapsed_time": "2:59:10", "remaining_time": "1:39:06", "throughput": 2319.05, "total_tokens": 24931496} {"current_steps": 43235, "total_steps": 67140, "loss": 0.5174, "lr": 1.6948476375493622e-05, "epoch": 6.439529341674114, "percentage": 64.4, "elapsed_time": "2:59:11", "remaining_time": "1:39:04", "throughput": 2319.07, "total_tokens": 24934344} {"current_steps": 43240, "total_steps": 67140, "loss": 0.6063, "lr": 1.694232406994873e-05, "epoch": 6.440274054215073, "percentage": 64.4, "elapsed_time": "2:59:13", "remaining_time": "1:39:03", "throughput": 2319.09, "total_tokens": 24937192} {"current_steps": 43245, "total_steps": 67140, "loss": 0.5723, "lr": 1.6936172308908825e-05, "epoch": 6.441018766756033, "percentage": 64.41, "elapsed_time": "2:59:14", "remaining_time": "1:39:02", "throughput": 2319.11, "total_tokens": 24939976} {"current_steps": 43250, "total_steps": 67140, "loss": 0.5945, "lr": 1.693002109278961e-05, "epoch": 6.441763479296991, "percentage": 64.42, "elapsed_time": "2:59:15", "remaining_time": "1:39:00", "throughput": 2319.12, "total_tokens": 24942760} {"current_steps": 43255, "total_steps": 67140, "loss": 0.671, "lr": 1.6923870422006753e-05, "epoch": 6.44250819183795, "percentage": 64.43, "elapsed_time": "2:59:16", "remaining_time": "1:38:59", "throughput": 2319.16, "total_tokens": 24945864} {"current_steps": 43260, "total_steps": 67140, "loss": 0.5208, "lr": 1.6917720296975898e-05, "epoch": 6.44325290437891, "percentage": 64.43, "elapsed_time": "2:59:17", "remaining_time": "1:38:58", "throughput": 2319.18, "total_tokens": 24948744} {"current_steps": 43265, "total_steps": 67140, "loss": 0.5532, "lr": 1.6911570718112646e-05, "epoch": 6.443997616919869, "percentage": 64.44, "elapsed_time": "2:59:18", "remaining_time": "1:38:56", "throughput": 2319.2, "total_tokens": 24951592} {"current_steps": 43270, "total_steps": 67140, "loss": 0.3795, "lr": 1.6905421685832555e-05, "epoch": 6.444742329460828, "percentage": 64.45, "elapsed_time": "2:59:19", "remaining_time": "1:38:55", "throughput": 2319.22, "total_tokens": 24954344} {"current_steps": 43275, "total_steps": 67140, "loss": 0.5039, "lr": 1.689927320055116e-05, "epoch": 6.445487042001787, "percentage": 64.45, "elapsed_time": "2:59:20", "remaining_time": "1:38:54", "throughput": 2319.23, "total_tokens": 24957032} {"current_steps": 43280, "total_steps": 67140, "loss": 0.5074, "lr": 1.6893125262683952e-05, "epoch": 6.4462317545427466, "percentage": 64.46, "elapsed_time": "2:59:22", "remaining_time": "1:38:53", "throughput": 2319.26, "total_tokens": 24959976} {"current_steps": 43285, "total_steps": 67140, "loss": 0.5386, "lr": 1.688697787264638e-05, "epoch": 6.446976467083705, "percentage": 64.47, "elapsed_time": "2:59:23", "remaining_time": "1:38:51", "throughput": 2319.28, "total_tokens": 24962920} {"current_steps": 43290, "total_steps": 67140, "loss": 0.5579, "lr": 1.6880831030853854e-05, "epoch": 6.447721179624665, "percentage": 64.48, "elapsed_time": "2:59:24", "remaining_time": "1:38:50", "throughput": 2319.31, "total_tokens": 24965896} {"current_steps": 43295, "total_steps": 67140, "loss": 0.6705, "lr": 1.6874684737721752e-05, "epoch": 6.448465892165624, "percentage": 64.48, "elapsed_time": "2:59:25", "remaining_time": "1:38:49", "throughput": 2319.33, "total_tokens": 24968648} {"current_steps": 43300, "total_steps": 67140, "loss": 0.6317, "lr": 1.6868538993665426e-05, "epoch": 6.449210604706583, "percentage": 64.49, "elapsed_time": "2:59:26", "remaining_time": "1:38:47", "throughput": 2319.35, "total_tokens": 24971464} {"current_steps": 43305, "total_steps": 67140, "loss": 0.568, "lr": 1.6862393799100166e-05, "epoch": 6.449955317247542, "percentage": 64.5, "elapsed_time": "2:59:27", "remaining_time": "1:38:46", "throughput": 2319.37, "total_tokens": 24974280} {"current_steps": 43310, "total_steps": 67140, "loss": 0.6169, "lr": 1.6856249154441256e-05, "epoch": 6.450700029788502, "percentage": 64.51, "elapsed_time": "2:59:28", "remaining_time": "1:38:45", "throughput": 2319.38, "total_tokens": 24977032} {"current_steps": 43315, "total_steps": 67140, "loss": 0.6176, "lr": 1.685010506010392e-05, "epoch": 6.4514447423294605, "percentage": 64.51, "elapsed_time": "2:59:30", "remaining_time": "1:38:43", "throughput": 2319.42, "total_tokens": 24980168} {"current_steps": 43320, "total_steps": 67140, "loss": 0.6967, "lr": 1.6843961516503344e-05, "epoch": 6.45218945487042, "percentage": 64.52, "elapsed_time": "2:59:31", "remaining_time": "1:38:42", "throughput": 2319.45, "total_tokens": 24983240} {"current_steps": 43325, "total_steps": 67140, "loss": 0.5891, "lr": 1.6837818524054696e-05, "epoch": 6.452934167411379, "percentage": 64.53, "elapsed_time": "2:59:32", "remaining_time": "1:38:41", "throughput": 2319.46, "total_tokens": 24985896} {"current_steps": 43330, "total_steps": 67140, "loss": 0.5667, "lr": 1.683167608317308e-05, "epoch": 6.453678879952339, "percentage": 64.54, "elapsed_time": "2:59:33", "remaining_time": "1:38:40", "throughput": 2319.5, "total_tokens": 24989032} {"current_steps": 43335, "total_steps": 67140, "loss": 0.8102, "lr": 1.6825534194273586e-05, "epoch": 6.454423592493297, "percentage": 64.54, "elapsed_time": "2:59:34", "remaining_time": "1:38:38", "throughput": 2319.54, "total_tokens": 24992104} {"current_steps": 43340, "total_steps": 67140, "loss": 0.596, "lr": 1.6819392857771253e-05, "epoch": 6.455168305034257, "percentage": 64.55, "elapsed_time": "2:59:35", "remaining_time": "1:38:37", "throughput": 2319.55, "total_tokens": 24994792} {"current_steps": 43345, "total_steps": 67140, "loss": 0.468, "lr": 1.6813252074081094e-05, "epoch": 6.455913017575216, "percentage": 64.56, "elapsed_time": "2:59:36", "remaining_time": "1:38:36", "throughput": 2319.57, "total_tokens": 24997768} {"current_steps": 43350, "total_steps": 67140, "loss": 0.4428, "lr": 1.6807111843618077e-05, "epoch": 6.456657730116175, "percentage": 64.57, "elapsed_time": "2:59:38", "remaining_time": "1:38:34", "throughput": 2319.59, "total_tokens": 25000552} {"current_steps": 43355, "total_steps": 67140, "loss": 0.4447, "lr": 1.6800972166797126e-05, "epoch": 6.457402442657134, "percentage": 64.57, "elapsed_time": "2:59:39", "remaining_time": "1:38:33", "throughput": 2319.6, "total_tokens": 25003176} {"current_steps": 43360, "total_steps": 67140, "loss": 0.6473, "lr": 1.6794833044033147e-05, "epoch": 6.458147155198094, "percentage": 64.58, "elapsed_time": "2:59:40", "remaining_time": "1:38:32", "throughput": 2319.61, "total_tokens": 25005832} {"current_steps": 43365, "total_steps": 67140, "loss": 0.5737, "lr": 1.678869447574099e-05, "epoch": 6.4588918677390526, "percentage": 64.59, "elapsed_time": "2:59:41", "remaining_time": "1:38:30", "throughput": 2319.62, "total_tokens": 25008552} {"current_steps": 43370, "total_steps": 67140, "loss": 0.6645, "lr": 1.678255646233548e-05, "epoch": 6.459636580280012, "percentage": 64.6, "elapsed_time": "2:59:42", "remaining_time": "1:38:29", "throughput": 2319.64, "total_tokens": 25011368} {"current_steps": 43375, "total_steps": 67140, "loss": 0.5565, "lr": 1.6776419004231386e-05, "epoch": 6.460381292820971, "percentage": 64.6, "elapsed_time": "2:59:43", "remaining_time": "1:38:28", "throughput": 2319.66, "total_tokens": 25014120} {"current_steps": 43380, "total_steps": 67140, "loss": 0.776, "lr": 1.677028210184346e-05, "epoch": 6.461126005361931, "percentage": 64.61, "elapsed_time": "2:59:44", "remaining_time": "1:38:26", "throughput": 2319.68, "total_tokens": 25016968} {"current_steps": 43385, "total_steps": 67140, "loss": 0.5473, "lr": 1.6764145755586417e-05, "epoch": 6.461870717902889, "percentage": 64.62, "elapsed_time": "2:59:45", "remaining_time": "1:38:25", "throughput": 2319.69, "total_tokens": 25019720} {"current_steps": 43390, "total_steps": 67140, "loss": 0.7324, "lr": 1.675800996587491e-05, "epoch": 6.462615430443849, "percentage": 64.63, "elapsed_time": "2:59:46", "remaining_time": "1:38:24", "throughput": 2319.7, "total_tokens": 25022408} {"current_steps": 43395, "total_steps": 67140, "loss": 0.5197, "lr": 1.675187473312359e-05, "epoch": 6.463360142984808, "percentage": 64.63, "elapsed_time": "2:59:48", "remaining_time": "1:38:23", "throughput": 2319.73, "total_tokens": 25025416} {"current_steps": 43400, "total_steps": 67140, "loss": 0.593, "lr": 1.6745740057747038e-05, "epoch": 6.464104855525767, "percentage": 64.64, "elapsed_time": "2:59:49", "remaining_time": "1:38:21", "throughput": 2319.75, "total_tokens": 25028232} {"current_steps": 43405, "total_steps": 67140, "loss": 0.5946, "lr": 1.673960594015982e-05, "epoch": 6.464849568066726, "percentage": 64.65, "elapsed_time": "2:59:50", "remaining_time": "1:38:20", "throughput": 2319.78, "total_tokens": 25031240} {"current_steps": 43410, "total_steps": 67140, "loss": 0.6648, "lr": 1.673347238077644e-05, "epoch": 6.465594280607686, "percentage": 64.66, "elapsed_time": "2:59:51", "remaining_time": "1:38:19", "throughput": 2319.81, "total_tokens": 25034152} {"current_steps": 43415, "total_steps": 67140, "loss": 0.5582, "lr": 1.6727339380011386e-05, "epoch": 6.466338993148645, "percentage": 64.66, "elapsed_time": "2:59:52", "remaining_time": "1:38:17", "throughput": 2319.82, "total_tokens": 25036744} {"current_steps": 43420, "total_steps": 67140, "loss": 0.4701, "lr": 1.6721206938279105e-05, "epoch": 6.467083705689604, "percentage": 64.67, "elapsed_time": "2:59:53", "remaining_time": "1:38:16", "throughput": 2319.82, "total_tokens": 25039336} {"current_steps": 43425, "total_steps": 67140, "loss": 0.4738, "lr": 1.6715075055993994e-05, "epoch": 6.467828418230563, "percentage": 64.68, "elapsed_time": "2:59:54", "remaining_time": "1:38:15", "throughput": 2319.86, "total_tokens": 25042472} {"current_steps": 43430, "total_steps": 67140, "loss": 0.7224, "lr": 1.6708943733570437e-05, "epoch": 6.468573130771523, "percentage": 64.69, "elapsed_time": "2:59:55", "remaining_time": "1:38:13", "throughput": 2319.91, "total_tokens": 25045704} {"current_steps": 43435, "total_steps": 67140, "loss": 0.5817, "lr": 1.6702812971422746e-05, "epoch": 6.469317843312481, "percentage": 64.69, "elapsed_time": "2:59:57", "remaining_time": "1:38:12", "throughput": 2319.95, "total_tokens": 25048968} {"current_steps": 43440, "total_steps": 67140, "loss": 0.5119, "lr": 1.669668276996522e-05, "epoch": 6.47006255585344, "percentage": 64.7, "elapsed_time": "2:59:58", "remaining_time": "1:38:11", "throughput": 2319.97, "total_tokens": 25051880} {"current_steps": 43445, "total_steps": 67140, "loss": 0.4983, "lr": 1.6690553129612125e-05, "epoch": 6.4708072683944, "percentage": 64.71, "elapsed_time": "2:59:59", "remaining_time": "1:38:10", "throughput": 2320.0, "total_tokens": 25054728} {"current_steps": 43450, "total_steps": 67140, "loss": 0.5942, "lr": 1.668442405077766e-05, "epoch": 6.4715519809353586, "percentage": 64.72, "elapsed_time": "3:00:00", "remaining_time": "1:38:08", "throughput": 2320.02, "total_tokens": 25057640} {"current_steps": 43455, "total_steps": 67140, "loss": 0.5985, "lr": 1.6678295533876006e-05, "epoch": 6.472296693476318, "percentage": 64.72, "elapsed_time": "3:00:01", "remaining_time": "1:38:07", "throughput": 2320.03, "total_tokens": 25060296} {"current_steps": 43460, "total_steps": 67140, "loss": 0.4633, "lr": 1.6672167579321305e-05, "epoch": 6.473041406017277, "percentage": 64.73, "elapsed_time": "3:00:02", "remaining_time": "1:38:06", "throughput": 2320.06, "total_tokens": 25063176} {"current_steps": 43465, "total_steps": 67140, "loss": 0.7728, "lr": 1.6666040187527665e-05, "epoch": 6.473786118558237, "percentage": 64.74, "elapsed_time": "3:00:03", "remaining_time": "1:38:04", "throughput": 2320.06, "total_tokens": 25065736} {"current_steps": 43470, "total_steps": 67140, "loss": 0.5877, "lr": 1.665991335890914e-05, "epoch": 6.474530831099195, "percentage": 64.75, "elapsed_time": "3:00:05", "remaining_time": "1:38:03", "throughput": 2320.08, "total_tokens": 25068520} {"current_steps": 43475, "total_steps": 67140, "loss": 0.5793, "lr": 1.6653787093879762e-05, "epoch": 6.475275543640155, "percentage": 64.75, "elapsed_time": "3:00:06", "remaining_time": "1:38:02", "throughput": 2320.09, "total_tokens": 25071176} {"current_steps": 43480, "total_steps": 67140, "loss": 0.527, "lr": 1.6647661392853525e-05, "epoch": 6.476020256181114, "percentage": 64.76, "elapsed_time": "3:00:07", "remaining_time": "1:38:00", "throughput": 2320.12, "total_tokens": 25074120} {"current_steps": 43485, "total_steps": 67140, "loss": 0.7585, "lr": 1.664153625624438e-05, "epoch": 6.476764968722073, "percentage": 64.77, "elapsed_time": "3:00:08", "remaining_time": "1:37:59", "throughput": 2320.13, "total_tokens": 25076904} {"current_steps": 43490, "total_steps": 67140, "loss": 0.6157, "lr": 1.6635411684466217e-05, "epoch": 6.477509681263032, "percentage": 64.78, "elapsed_time": "3:00:09", "remaining_time": "1:37:58", "throughput": 2320.17, "total_tokens": 25080104} {"current_steps": 43495, "total_steps": 67140, "loss": 0.6354, "lr": 1.6629287677932924e-05, "epoch": 6.478254393803992, "percentage": 64.78, "elapsed_time": "3:00:10", "remaining_time": "1:37:56", "throughput": 2320.2, "total_tokens": 25083144} {"current_steps": 43500, "total_steps": 67140, "loss": 0.7833, "lr": 1.6623164237058347e-05, "epoch": 6.478999106344951, "percentage": 64.79, "elapsed_time": "3:00:11", "remaining_time": "1:37:55", "throughput": 2320.23, "total_tokens": 25086024} {"current_steps": 43505, "total_steps": 67140, "loss": 0.4559, "lr": 1.6617041362256265e-05, "epoch": 6.47974381888591, "percentage": 64.8, "elapsed_time": "3:00:12", "remaining_time": "1:37:54", "throughput": 2320.23, "total_tokens": 25088680} {"current_steps": 43510, "total_steps": 67140, "loss": 0.4252, "lr": 1.6610919053940446e-05, "epoch": 6.480488531426869, "percentage": 64.8, "elapsed_time": "3:00:14", "remaining_time": "1:37:53", "throughput": 2320.26, "total_tokens": 25091688} {"current_steps": 43515, "total_steps": 67140, "loss": 0.6657, "lr": 1.6604797312524613e-05, "epoch": 6.481233243967829, "percentage": 64.81, "elapsed_time": "3:00:15", "remaining_time": "1:37:51", "throughput": 2320.28, "total_tokens": 25094440} {"current_steps": 43520, "total_steps": 67140, "loss": 0.5822, "lr": 1.659867613842244e-05, "epoch": 6.481977956508787, "percentage": 64.82, "elapsed_time": "3:00:16", "remaining_time": "1:37:50", "throughput": 2320.3, "total_tokens": 25097288} {"current_steps": 43525, "total_steps": 67140, "loss": 0.6884, "lr": 1.6592555532047592e-05, "epoch": 6.482722669049747, "percentage": 64.83, "elapsed_time": "3:00:17", "remaining_time": "1:37:49", "throughput": 2320.32, "total_tokens": 25100264} {"current_steps": 43530, "total_steps": 67140, "loss": 0.6095, "lr": 1.6586435493813645e-05, "epoch": 6.483467381590706, "percentage": 64.83, "elapsed_time": "3:00:18", "remaining_time": "1:37:47", "throughput": 2320.33, "total_tokens": 25102984} {"current_steps": 43535, "total_steps": 67140, "loss": 0.658, "lr": 1.6580316024134186e-05, "epoch": 6.484212094131665, "percentage": 64.84, "elapsed_time": "3:00:19", "remaining_time": "1:37:46", "throughput": 2320.35, "total_tokens": 25105768} {"current_steps": 43540, "total_steps": 67140, "loss": 0.5903, "lr": 1.657419712342273e-05, "epoch": 6.484956806672624, "percentage": 64.85, "elapsed_time": "3:00:20", "remaining_time": "1:37:45", "throughput": 2320.36, "total_tokens": 25108488} {"current_steps": 43545, "total_steps": 67140, "loss": 0.7157, "lr": 1.656807879209278e-05, "epoch": 6.485701519213584, "percentage": 64.86, "elapsed_time": "3:00:22", "remaining_time": "1:37:43", "throughput": 2320.38, "total_tokens": 25111336} {"current_steps": 43550, "total_steps": 67140, "loss": 0.6233, "lr": 1.656196103055779e-05, "epoch": 6.486446231754543, "percentage": 64.86, "elapsed_time": "3:00:23", "remaining_time": "1:37:42", "throughput": 2320.41, "total_tokens": 25114248} {"current_steps": 43555, "total_steps": 67140, "loss": 0.6622, "lr": 1.6555843839231156e-05, "epoch": 6.487190944295502, "percentage": 64.87, "elapsed_time": "3:00:24", "remaining_time": "1:37:41", "throughput": 2320.42, "total_tokens": 25117000} {"current_steps": 43560, "total_steps": 67140, "loss": 0.485, "lr": 1.654972721852627e-05, "epoch": 6.487935656836461, "percentage": 64.88, "elapsed_time": "3:00:25", "remaining_time": "1:37:40", "throughput": 2320.45, "total_tokens": 25119848} {"current_steps": 43565, "total_steps": 67140, "loss": 0.7713, "lr": 1.6543611168856464e-05, "epoch": 6.488680369377421, "percentage": 64.89, "elapsed_time": "3:00:26", "remaining_time": "1:37:38", "throughput": 2320.46, "total_tokens": 25122600} {"current_steps": 43570, "total_steps": 67140, "loss": 0.7745, "lr": 1.6537495690635034e-05, "epoch": 6.489425081918379, "percentage": 64.89, "elapsed_time": "3:00:27", "remaining_time": "1:37:37", "throughput": 2320.49, "total_tokens": 25125608} {"current_steps": 43575, "total_steps": 67140, "loss": 0.622, "lr": 1.6531380784275237e-05, "epoch": 6.490169794459339, "percentage": 64.9, "elapsed_time": "3:00:28", "remaining_time": "1:37:36", "throughput": 2320.53, "total_tokens": 25128808} {"current_steps": 43580, "total_steps": 67140, "loss": 0.549, "lr": 1.6525266450190296e-05, "epoch": 6.490914507000298, "percentage": 64.91, "elapsed_time": "3:00:30", "remaining_time": "1:37:34", "throughput": 2320.55, "total_tokens": 25131688} {"current_steps": 43585, "total_steps": 67140, "loss": 0.5881, "lr": 1.6519152688793387e-05, "epoch": 6.4916592195412575, "percentage": 64.92, "elapsed_time": "3:00:31", "remaining_time": "1:37:33", "throughput": 2320.57, "total_tokens": 25134408} {"current_steps": 43590, "total_steps": 67140, "loss": 0.6835, "lr": 1.6513039500497663e-05, "epoch": 6.492403932082216, "percentage": 64.92, "elapsed_time": "3:00:32", "remaining_time": "1:37:32", "throughput": 2320.61, "total_tokens": 25137608} {"current_steps": 43595, "total_steps": 67140, "loss": 0.5392, "lr": 1.6506926885716224e-05, "epoch": 6.493148644623176, "percentage": 64.93, "elapsed_time": "3:00:33", "remaining_time": "1:37:30", "throughput": 2320.63, "total_tokens": 25140520} {"current_steps": 43600, "total_steps": 67140, "loss": 0.42, "lr": 1.6500814844862135e-05, "epoch": 6.493893357164135, "percentage": 64.94, "elapsed_time": "3:00:34", "remaining_time": "1:37:29", "throughput": 2320.65, "total_tokens": 25143208} {"current_steps": 43605, "total_steps": 67140, "loss": 0.5907, "lr": 1.6494703378348433e-05, "epoch": 6.494638069705093, "percentage": 64.95, "elapsed_time": "3:00:35", "remaining_time": "1:37:28", "throughput": 2320.67, "total_tokens": 25146088} {"current_steps": 43610, "total_steps": 67140, "loss": 0.5935, "lr": 1.6488592486588087e-05, "epoch": 6.495382782246053, "percentage": 64.95, "elapsed_time": "3:00:36", "remaining_time": "1:37:27", "throughput": 2320.7, "total_tokens": 25149192} {"current_steps": 43615, "total_steps": 67140, "loss": 0.5134, "lr": 1.6482482169994055e-05, "epoch": 6.496127494787013, "percentage": 64.96, "elapsed_time": "3:00:37", "remaining_time": "1:37:25", "throughput": 2320.71, "total_tokens": 25151784} {"current_steps": 43620, "total_steps": 67140, "loss": 0.6148, "lr": 1.6476372428979254e-05, "epoch": 6.496872207327971, "percentage": 64.97, "elapsed_time": "3:00:39", "remaining_time": "1:37:24", "throughput": 2320.72, "total_tokens": 25154504} {"current_steps": 43625, "total_steps": 67140, "loss": 0.6553, "lr": 1.6470263263956543e-05, "epoch": 6.49761691986893, "percentage": 64.98, "elapsed_time": "3:00:40", "remaining_time": "1:37:23", "throughput": 2320.75, "total_tokens": 25157480} {"current_steps": 43630, "total_steps": 67140, "loss": 0.505, "lr": 1.6464154675338767e-05, "epoch": 6.49836163240989, "percentage": 64.98, "elapsed_time": "3:00:41", "remaining_time": "1:37:21", "throughput": 2320.77, "total_tokens": 25160392} {"current_steps": 43635, "total_steps": 67140, "loss": 0.5854, "lr": 1.6458046663538706e-05, "epoch": 6.499106344950849, "percentage": 64.99, "elapsed_time": "3:00:42", "remaining_time": "1:37:20", "throughput": 2320.79, "total_tokens": 25163208} {"current_steps": 43640, "total_steps": 67140, "loss": 0.7743, "lr": 1.6451939228969127e-05, "epoch": 6.499851057491808, "percentage": 65.0, "elapsed_time": "3:00:43", "remaining_time": "1:37:19", "throughput": 2320.81, "total_tokens": 25166024} {"current_steps": 43641, "total_steps": 67140, "eval_loss": 0.664467990398407, "epoch": 6.5, "percentage": 65.0, "elapsed_time": "3:01:58", "remaining_time": "1:37:59", "throughput": 2305.02, "total_tokens": 25166536} {"current_steps": 43645, "total_steps": 67140, "loss": 0.649, "lr": 1.644583237204275e-05, "epoch": 6.500595770032767, "percentage": 65.01, "elapsed_time": "3:02:01", "remaining_time": "1:37:59", "throughput": 2304.4, "total_tokens": 25168680} {"current_steps": 43650, "total_steps": 67140, "loss": 0.6483, "lr": 1.6439726093172237e-05, "epoch": 6.501340482573727, "percentage": 65.01, "elapsed_time": "3:02:03", "remaining_time": "1:37:58", "throughput": 2304.45, "total_tokens": 25171816} {"current_steps": 43655, "total_steps": 67140, "loss": 0.6261, "lr": 1.6433620392770227e-05, "epoch": 6.502085195114685, "percentage": 65.02, "elapsed_time": "3:02:04", "remaining_time": "1:37:56", "throughput": 2304.47, "total_tokens": 25174728} {"current_steps": 43660, "total_steps": 67140, "loss": 0.6359, "lr": 1.642751527124932e-05, "epoch": 6.502829907655645, "percentage": 65.03, "elapsed_time": "3:02:05", "remaining_time": "1:37:55", "throughput": 2304.49, "total_tokens": 25177544} {"current_steps": 43665, "total_steps": 67140, "loss": 0.6882, "lr": 1.6421410729022087e-05, "epoch": 6.503574620196604, "percentage": 65.04, "elapsed_time": "3:02:06", "remaining_time": "1:37:54", "throughput": 2304.53, "total_tokens": 25180744} {"current_steps": 43670, "total_steps": 67140, "loss": 0.7301, "lr": 1.641530676650103e-05, "epoch": 6.5043193327375635, "percentage": 65.04, "elapsed_time": "3:02:07", "remaining_time": "1:37:53", "throughput": 2304.57, "total_tokens": 25183912} {"current_steps": 43675, "total_steps": 67140, "loss": 0.7525, "lr": 1.6409203384098637e-05, "epoch": 6.505064045278522, "percentage": 65.05, "elapsed_time": "3:02:08", "remaining_time": "1:37:51", "throughput": 2304.59, "total_tokens": 25186728} {"current_steps": 43680, "total_steps": 67140, "loss": 0.544, "lr": 1.640310058222736e-05, "epoch": 6.505808757819482, "percentage": 65.06, "elapsed_time": "3:02:10", "remaining_time": "1:37:50", "throughput": 2304.61, "total_tokens": 25189544} {"current_steps": 43685, "total_steps": 67140, "loss": 0.6406, "lr": 1.6396998361299597e-05, "epoch": 6.506553470360441, "percentage": 65.07, "elapsed_time": "3:02:11", "remaining_time": "1:37:49", "throughput": 2304.64, "total_tokens": 25192616} {"current_steps": 43690, "total_steps": 67140, "loss": 0.5494, "lr": 1.63908967217277e-05, "epoch": 6.5072981829014, "percentage": 65.07, "elapsed_time": "3:02:12", "remaining_time": "1:37:47", "throughput": 2304.7, "total_tokens": 25196008} {"current_steps": 43695, "total_steps": 67140, "loss": 0.4633, "lr": 1.6384795663924003e-05, "epoch": 6.508042895442359, "percentage": 65.08, "elapsed_time": "3:02:13", "remaining_time": "1:37:46", "throughput": 2304.72, "total_tokens": 25198792} {"current_steps": 43700, "total_steps": 67140, "loss": 0.6226, "lr": 1.6378695188300787e-05, "epoch": 6.508787607983319, "percentage": 65.09, "elapsed_time": "3:02:14", "remaining_time": "1:37:45", "throughput": 2304.74, "total_tokens": 25201512} {"current_steps": 43705, "total_steps": 67140, "loss": 0.6826, "lr": 1.6372595295270294e-05, "epoch": 6.509532320524277, "percentage": 65.1, "elapsed_time": "3:02:15", "remaining_time": "1:37:43", "throughput": 2304.77, "total_tokens": 25204520} {"current_steps": 43710, "total_steps": 67140, "loss": 0.5447, "lr": 1.6366495985244736e-05, "epoch": 6.510277033065237, "percentage": 65.1, "elapsed_time": "3:02:16", "remaining_time": "1:37:42", "throughput": 2304.78, "total_tokens": 25207304} {"current_steps": 43715, "total_steps": 67140, "loss": 0.6298, "lr": 1.6360397258636284e-05, "epoch": 6.511021745606196, "percentage": 65.11, "elapsed_time": "3:02:18", "remaining_time": "1:37:41", "throughput": 2304.81, "total_tokens": 25210152} {"current_steps": 43720, "total_steps": 67140, "loss": 0.5163, "lr": 1.6354299115857052e-05, "epoch": 6.5117664581471555, "percentage": 65.12, "elapsed_time": "3:02:19", "remaining_time": "1:37:39", "throughput": 2304.84, "total_tokens": 25213160} {"current_steps": 43725, "total_steps": 67140, "loss": 0.5189, "lr": 1.6348201557319148e-05, "epoch": 6.512511170688114, "percentage": 65.13, "elapsed_time": "3:02:20", "remaining_time": "1:37:38", "throughput": 2304.86, "total_tokens": 25216040} {"current_steps": 43730, "total_steps": 67140, "loss": 0.4687, "lr": 1.6342104583434595e-05, "epoch": 6.513255883229074, "percentage": 65.13, "elapsed_time": "3:02:21", "remaining_time": "1:37:37", "throughput": 2304.89, "total_tokens": 25218920} {"current_steps": 43735, "total_steps": 67140, "loss": 0.3995, "lr": 1.633600819461542e-05, "epoch": 6.514000595770033, "percentage": 65.14, "elapsed_time": "3:02:22", "remaining_time": "1:37:36", "throughput": 2304.9, "total_tokens": 25221704} {"current_steps": 43740, "total_steps": 67140, "loss": 0.5738, "lr": 1.632991239127358e-05, "epoch": 6.514745308310992, "percentage": 65.15, "elapsed_time": "3:02:23", "remaining_time": "1:37:34", "throughput": 2304.92, "total_tokens": 25224552} {"current_steps": 43745, "total_steps": 67140, "loss": 0.6805, "lr": 1.6323817173821014e-05, "epoch": 6.515490020851951, "percentage": 65.15, "elapsed_time": "3:02:24", "remaining_time": "1:37:33", "throughput": 2304.95, "total_tokens": 25227528} {"current_steps": 43750, "total_steps": 67140, "loss": 0.5272, "lr": 1.6317722542669606e-05, "epoch": 6.516234733392911, "percentage": 65.16, "elapsed_time": "3:02:26", "remaining_time": "1:37:32", "throughput": 2305.01, "total_tokens": 25230952} {"current_steps": 43755, "total_steps": 67140, "loss": 0.6666, "lr": 1.6311628498231208e-05, "epoch": 6.5169794459338695, "percentage": 65.17, "elapsed_time": "3:02:27", "remaining_time": "1:37:30", "throughput": 2305.04, "total_tokens": 25233864} {"current_steps": 43760, "total_steps": 67140, "loss": 0.7051, "lr": 1.6305535040917638e-05, "epoch": 6.517724158474829, "percentage": 65.18, "elapsed_time": "3:02:28", "remaining_time": "1:37:29", "throughput": 2305.07, "total_tokens": 25236776} {"current_steps": 43765, "total_steps": 67140, "loss": 0.5787, "lr": 1.6299442171140656e-05, "epoch": 6.518468871015788, "percentage": 65.18, "elapsed_time": "3:02:29", "remaining_time": "1:37:28", "throughput": 2305.1, "total_tokens": 25239784} {"current_steps": 43770, "total_steps": 67140, "loss": 0.4069, "lr": 1.6293349889312007e-05, "epoch": 6.519213583556747, "percentage": 65.19, "elapsed_time": "3:02:30", "remaining_time": "1:37:26", "throughput": 2305.13, "total_tokens": 25242760} {"current_steps": 43775, "total_steps": 67140, "loss": 0.685, "lr": 1.6287258195843363e-05, "epoch": 6.519958296097706, "percentage": 65.2, "elapsed_time": "3:02:31", "remaining_time": "1:37:25", "throughput": 2305.16, "total_tokens": 25245768} {"current_steps": 43780, "total_steps": 67140, "loss": 0.6351, "lr": 1.6281167091146392e-05, "epoch": 6.520703008638666, "percentage": 65.21, "elapsed_time": "3:02:32", "remaining_time": "1:37:24", "throughput": 2305.18, "total_tokens": 25248680} {"current_steps": 43785, "total_steps": 67140, "loss": 0.2966, "lr": 1.62750765756327e-05, "epoch": 6.521447721179625, "percentage": 65.21, "elapsed_time": "3:02:34", "remaining_time": "1:37:22", "throughput": 2305.19, "total_tokens": 25251304} {"current_steps": 43790, "total_steps": 67140, "loss": 0.483, "lr": 1.6268986649713852e-05, "epoch": 6.522192433720583, "percentage": 65.22, "elapsed_time": "3:02:35", "remaining_time": "1:37:21", "throughput": 2305.21, "total_tokens": 25254088} {"current_steps": 43795, "total_steps": 67140, "loss": 0.5131, "lr": 1.6262897313801402e-05, "epoch": 6.522937146261543, "percentage": 65.23, "elapsed_time": "3:02:36", "remaining_time": "1:37:20", "throughput": 2305.27, "total_tokens": 25257576} {"current_steps": 43800, "total_steps": 67140, "loss": 0.7062, "lr": 1.625680856830682e-05, "epoch": 6.523681858802503, "percentage": 65.24, "elapsed_time": "3:02:37", "remaining_time": "1:37:19", "throughput": 2305.29, "total_tokens": 25260328} {"current_steps": 43805, "total_steps": 67140, "loss": 0.5354, "lr": 1.6250720413641565e-05, "epoch": 6.5244265713434615, "percentage": 65.24, "elapsed_time": "3:02:38", "remaining_time": "1:37:17", "throughput": 2305.33, "total_tokens": 25263496} {"current_steps": 43810, "total_steps": 67140, "loss": 0.5942, "lr": 1.6244632850217067e-05, "epoch": 6.52517128388442, "percentage": 65.25, "elapsed_time": "3:02:39", "remaining_time": "1:37:16", "throughput": 2305.34, "total_tokens": 25266152} {"current_steps": 43815, "total_steps": 67140, "loss": 0.608, "lr": 1.6238545878444676e-05, "epoch": 6.52591599642538, "percentage": 65.26, "elapsed_time": "3:02:41", "remaining_time": "1:37:15", "throughput": 2305.37, "total_tokens": 25269224} {"current_steps": 43820, "total_steps": 67140, "loss": 0.399, "lr": 1.623245949873573e-05, "epoch": 6.526660708966339, "percentage": 65.27, "elapsed_time": "3:02:42", "remaining_time": "1:37:13", "throughput": 2305.39, "total_tokens": 25271944} {"current_steps": 43825, "total_steps": 67140, "loss": 0.6913, "lr": 1.6226373711501523e-05, "epoch": 6.527405421507298, "percentage": 65.27, "elapsed_time": "3:02:43", "remaining_time": "1:37:12", "throughput": 2305.41, "total_tokens": 25274728} {"current_steps": 43830, "total_steps": 67140, "loss": 0.4517, "lr": 1.6220288517153318e-05, "epoch": 6.528150134048257, "percentage": 65.28, "elapsed_time": "3:02:44", "remaining_time": "1:37:11", "throughput": 2305.43, "total_tokens": 25277640} {"current_steps": 43835, "total_steps": 67140, "loss": 0.4545, "lr": 1.621420391610231e-05, "epoch": 6.528894846589217, "percentage": 65.29, "elapsed_time": "3:02:45", "remaining_time": "1:37:09", "throughput": 2305.45, "total_tokens": 25280520} {"current_steps": 43840, "total_steps": 67140, "loss": 0.5765, "lr": 1.6208119908759684e-05, "epoch": 6.5296395591301755, "percentage": 65.3, "elapsed_time": "3:02:46", "remaining_time": "1:37:08", "throughput": 2305.47, "total_tokens": 25283336} {"current_steps": 43845, "total_steps": 67140, "loss": 0.7157, "lr": 1.6202036495536575e-05, "epoch": 6.530384271671135, "percentage": 65.3, "elapsed_time": "3:02:47", "remaining_time": "1:37:07", "throughput": 2305.51, "total_tokens": 25286376} {"current_steps": 43850, "total_steps": 67140, "loss": 0.8193, "lr": 1.6195953676844072e-05, "epoch": 6.531128984212094, "percentage": 65.31, "elapsed_time": "3:02:48", "remaining_time": "1:37:05", "throughput": 2305.53, "total_tokens": 25289192} {"current_steps": 43855, "total_steps": 67140, "loss": 0.6123, "lr": 1.6189871453093217e-05, "epoch": 6.5318736967530535, "percentage": 65.32, "elapsed_time": "3:02:50", "remaining_time": "1:37:04", "throughput": 2305.55, "total_tokens": 25292008} {"current_steps": 43860, "total_steps": 67140, "loss": 0.5773, "lr": 1.6183789824695027e-05, "epoch": 6.532618409294012, "percentage": 65.33, "elapsed_time": "3:02:51", "remaining_time": "1:37:03", "throughput": 2305.56, "total_tokens": 25294728} {"current_steps": 43865, "total_steps": 67140, "loss": 0.6044, "lr": 1.6177708792060486e-05, "epoch": 6.533363121834972, "percentage": 65.33, "elapsed_time": "3:02:52", "remaining_time": "1:37:01", "throughput": 2305.59, "total_tokens": 25297608} {"current_steps": 43870, "total_steps": 67140, "loss": 0.5692, "lr": 1.6171628355600507e-05, "epoch": 6.534107834375931, "percentage": 65.34, "elapsed_time": "3:02:53", "remaining_time": "1:37:00", "throughput": 2305.61, "total_tokens": 25300456} {"current_steps": 43875, "total_steps": 67140, "loss": 0.482, "lr": 1.6165548515725992e-05, "epoch": 6.53485254691689, "percentage": 65.35, "elapsed_time": "3:02:54", "remaining_time": "1:36:59", "throughput": 2305.63, "total_tokens": 25303144} {"current_steps": 43880, "total_steps": 67140, "loss": 0.704, "lr": 1.6159469272847793e-05, "epoch": 6.535597259457849, "percentage": 65.36, "elapsed_time": "3:02:55", "remaining_time": "1:36:57", "throughput": 2305.64, "total_tokens": 25305832} {"current_steps": 43885, "total_steps": 67140, "loss": 0.4795, "lr": 1.6153390627376717e-05, "epoch": 6.536341971998809, "percentage": 65.36, "elapsed_time": "3:02:56", "remaining_time": "1:36:56", "throughput": 2305.67, "total_tokens": 25308776} {"current_steps": 43890, "total_steps": 67140, "loss": 0.709, "lr": 1.6147312579723542e-05, "epoch": 6.5370866845397675, "percentage": 65.37, "elapsed_time": "3:02:57", "remaining_time": "1:36:55", "throughput": 2305.69, "total_tokens": 25311720} {"current_steps": 43895, "total_steps": 67140, "loss": 0.8398, "lr": 1.6141235130298983e-05, "epoch": 6.537831397080727, "percentage": 65.38, "elapsed_time": "3:02:59", "remaining_time": "1:36:54", "throughput": 2305.71, "total_tokens": 25314536} {"current_steps": 43900, "total_steps": 67140, "loss": 0.481, "lr": 1.6135158279513737e-05, "epoch": 6.538576109621686, "percentage": 65.39, "elapsed_time": "3:03:00", "remaining_time": "1:36:52", "throughput": 2305.74, "total_tokens": 25317448} {"current_steps": 43905, "total_steps": 67140, "loss": 0.6528, "lr": 1.612908202777845e-05, "epoch": 6.5393208221626455, "percentage": 65.39, "elapsed_time": "3:03:01", "remaining_time": "1:36:51", "throughput": 2305.78, "total_tokens": 25320616} {"current_steps": 43910, "total_steps": 67140, "loss": 0.6153, "lr": 1.6123006375503737e-05, "epoch": 6.540065534703604, "percentage": 65.4, "elapsed_time": "3:03:02", "remaining_time": "1:36:50", "throughput": 2305.81, "total_tokens": 25323592} {"current_steps": 43915, "total_steps": 67140, "loss": 0.6835, "lr": 1.6116931323100158e-05, "epoch": 6.540810247244564, "percentage": 65.41, "elapsed_time": "3:03:03", "remaining_time": "1:36:48", "throughput": 2305.84, "total_tokens": 25326632} {"current_steps": 43920, "total_steps": 67140, "loss": 0.5457, "lr": 1.6110856870978245e-05, "epoch": 6.541554959785523, "percentage": 65.42, "elapsed_time": "3:03:04", "remaining_time": "1:36:47", "throughput": 2305.86, "total_tokens": 25329320} {"current_steps": 43925, "total_steps": 67140, "loss": 0.5123, "lr": 1.6104783019548486e-05, "epoch": 6.542299672326482, "percentage": 65.42, "elapsed_time": "3:03:05", "remaining_time": "1:36:46", "throughput": 2305.88, "total_tokens": 25332232} {"current_steps": 43930, "total_steps": 67140, "loss": 0.7402, "lr": 1.6098709769221333e-05, "epoch": 6.543044384867441, "percentage": 65.43, "elapsed_time": "3:03:07", "remaining_time": "1:36:44", "throughput": 2305.91, "total_tokens": 25335112} {"current_steps": 43935, "total_steps": 67140, "loss": 0.5833, "lr": 1.6092637120407174e-05, "epoch": 6.5437890974084, "percentage": 65.44, "elapsed_time": "3:03:08", "remaining_time": "1:36:43", "throughput": 2305.93, "total_tokens": 25338024} {"current_steps": 43940, "total_steps": 67140, "loss": 0.6497, "lr": 1.6086565073516385e-05, "epoch": 6.5445338099493595, "percentage": 65.45, "elapsed_time": "3:03:09", "remaining_time": "1:36:42", "throughput": 2305.95, "total_tokens": 25340776} {"current_steps": 43945, "total_steps": 67140, "loss": 0.8639, "lr": 1.608049362895929e-05, "epoch": 6.545278522490319, "percentage": 65.45, "elapsed_time": "3:03:10", "remaining_time": "1:36:40", "throughput": 2305.98, "total_tokens": 25343784} {"current_steps": 43950, "total_steps": 67140, "loss": 0.4462, "lr": 1.607442278714617e-05, "epoch": 6.546023235031278, "percentage": 65.46, "elapsed_time": "3:03:11", "remaining_time": "1:36:39", "throughput": 2305.99, "total_tokens": 25346536} {"current_steps": 43955, "total_steps": 67140, "loss": 0.8583, "lr": 1.6068352548487263e-05, "epoch": 6.546767947572237, "percentage": 65.47, "elapsed_time": "3:03:12", "remaining_time": "1:36:38", "throughput": 2306.01, "total_tokens": 25349352} {"current_steps": 43960, "total_steps": 67140, "loss": 0.9575, "lr": 1.606228291339279e-05, "epoch": 6.547512660113196, "percentage": 65.48, "elapsed_time": "3:03:13", "remaining_time": "1:36:37", "throughput": 2306.05, "total_tokens": 25352488} {"current_steps": 43965, "total_steps": 67140, "loss": 0.5908, "lr": 1.6056213882272892e-05, "epoch": 6.548257372654156, "percentage": 65.48, "elapsed_time": "3:03:15", "remaining_time": "1:36:35", "throughput": 2306.08, "total_tokens": 25355496} {"current_steps": 43970, "total_steps": 67140, "loss": 0.5092, "lr": 1.6050145455537708e-05, "epoch": 6.549002085195115, "percentage": 65.49, "elapsed_time": "3:03:16", "remaining_time": "1:36:34", "throughput": 2306.11, "total_tokens": 25358408} {"current_steps": 43975, "total_steps": 67140, "loss": 0.5059, "lr": 1.6044077633597292e-05, "epoch": 6.5497467977360735, "percentage": 65.5, "elapsed_time": "3:03:17", "remaining_time": "1:36:33", "throughput": 2306.12, "total_tokens": 25361064} {"current_steps": 43980, "total_steps": 67140, "loss": 0.879, "lr": 1.603801041686171e-05, "epoch": 6.550491510277033, "percentage": 65.5, "elapsed_time": "3:03:18", "remaining_time": "1:36:31", "throughput": 2306.14, "total_tokens": 25363944} {"current_steps": 43985, "total_steps": 67140, "loss": 0.7013, "lr": 1.6031943805740934e-05, "epoch": 6.551236222817992, "percentage": 65.51, "elapsed_time": "3:03:19", "remaining_time": "1:36:30", "throughput": 2306.16, "total_tokens": 25366728} {"current_steps": 43990, "total_steps": 67140, "loss": 0.4912, "lr": 1.602587780064494e-05, "epoch": 6.5519809353589515, "percentage": 65.52, "elapsed_time": "3:03:20", "remaining_time": "1:36:29", "throughput": 2306.19, "total_tokens": 25369576} {"current_steps": 43995, "total_steps": 67140, "loss": 0.7285, "lr": 1.601981240198364e-05, "epoch": 6.55272564789991, "percentage": 65.53, "elapsed_time": "3:03:21", "remaining_time": "1:36:27", "throughput": 2306.19, "total_tokens": 25372200} {"current_steps": 44000, "total_steps": 67140, "loss": 0.7559, "lr": 1.6013747610166903e-05, "epoch": 6.55347036044087, "percentage": 65.53, "elapsed_time": "3:03:22", "remaining_time": "1:36:26", "throughput": 2306.21, "total_tokens": 25374888} {"current_steps": 44005, "total_steps": 67140, "loss": 0.6225, "lr": 1.600768342560457e-05, "epoch": 6.554215072981829, "percentage": 65.54, "elapsed_time": "3:03:24", "remaining_time": "1:36:25", "throughput": 2306.24, "total_tokens": 25377960} {"current_steps": 44010, "total_steps": 67140, "loss": 0.7181, "lr": 1.6001619848706435e-05, "epoch": 6.554959785522788, "percentage": 65.55, "elapsed_time": "3:03:25", "remaining_time": "1:36:23", "throughput": 2306.26, "total_tokens": 25380744} {"current_steps": 44015, "total_steps": 67140, "loss": 0.4636, "lr": 1.5995556879882246e-05, "epoch": 6.555704498063747, "percentage": 65.56, "elapsed_time": "3:03:26", "remaining_time": "1:36:22", "throughput": 2306.28, "total_tokens": 25383528} {"current_steps": 44020, "total_steps": 67140, "loss": 0.7056, "lr": 1.5989494519541706e-05, "epoch": 6.556449210604707, "percentage": 65.56, "elapsed_time": "3:03:27", "remaining_time": "1:36:21", "throughput": 2306.3, "total_tokens": 25386408} {"current_steps": 44025, "total_steps": 67140, "loss": 0.5995, "lr": 1.5983432768094495e-05, "epoch": 6.5571939231456655, "percentage": 65.57, "elapsed_time": "3:03:28", "remaining_time": "1:36:19", "throughput": 2306.32, "total_tokens": 25389128} {"current_steps": 44030, "total_steps": 67140, "loss": 0.5363, "lr": 1.597737162595024e-05, "epoch": 6.557938635686625, "percentage": 65.58, "elapsed_time": "3:03:29", "remaining_time": "1:36:18", "throughput": 2306.37, "total_tokens": 25392424} {"current_steps": 44035, "total_steps": 67140, "loss": 0.7082, "lr": 1.5971311093518527e-05, "epoch": 6.558683348227584, "percentage": 65.59, "elapsed_time": "3:03:30", "remaining_time": "1:36:17", "throughput": 2306.39, "total_tokens": 25395240} {"current_steps": 44040, "total_steps": 67140, "loss": 0.5701, "lr": 1.5965251171208896e-05, "epoch": 6.559428060768544, "percentage": 65.59, "elapsed_time": "3:03:31", "remaining_time": "1:36:16", "throughput": 2306.41, "total_tokens": 25397992} {"current_steps": 44045, "total_steps": 67140, "loss": 0.7114, "lr": 1.5959191859430867e-05, "epoch": 6.560172773309502, "percentage": 65.6, "elapsed_time": "3:03:33", "remaining_time": "1:36:14", "throughput": 2306.43, "total_tokens": 25400872} {"current_steps": 44050, "total_steps": 67140, "loss": 0.5057, "lr": 1.5953133158593904e-05, "epoch": 6.560917485850462, "percentage": 65.61, "elapsed_time": "3:03:34", "remaining_time": "1:36:13", "throughput": 2306.46, "total_tokens": 25403880} {"current_steps": 44055, "total_steps": 67140, "loss": 0.6862, "lr": 1.5947075069107402e-05, "epoch": 6.561662198391421, "percentage": 65.62, "elapsed_time": "3:03:35", "remaining_time": "1:36:12", "throughput": 2306.49, "total_tokens": 25406856} {"current_steps": 44060, "total_steps": 67140, "loss": 0.5915, "lr": 1.5941017591380764e-05, "epoch": 6.56240691093238, "percentage": 65.62, "elapsed_time": "3:03:36", "remaining_time": "1:36:10", "throughput": 2306.51, "total_tokens": 25409608} {"current_steps": 44065, "total_steps": 67140, "loss": 0.6332, "lr": 1.5934960725823335e-05, "epoch": 6.563151623473339, "percentage": 65.63, "elapsed_time": "3:03:37", "remaining_time": "1:36:09", "throughput": 2306.54, "total_tokens": 25412584} {"current_steps": 44070, "total_steps": 67140, "loss": 0.611, "lr": 1.5928904472844393e-05, "epoch": 6.563896336014299, "percentage": 65.64, "elapsed_time": "3:03:38", "remaining_time": "1:36:08", "throughput": 2306.56, "total_tokens": 25415432} {"current_steps": 44075, "total_steps": 67140, "loss": 0.5625, "lr": 1.5922848832853217e-05, "epoch": 6.5646410485552575, "percentage": 65.65, "elapsed_time": "3:03:39", "remaining_time": "1:36:06", "throughput": 2306.58, "total_tokens": 25418216} {"current_steps": 44080, "total_steps": 67140, "loss": 0.53, "lr": 1.5916793806259e-05, "epoch": 6.565385761096217, "percentage": 65.65, "elapsed_time": "3:03:41", "remaining_time": "1:36:05", "throughput": 2306.6, "total_tokens": 25421064} {"current_steps": 44085, "total_steps": 67140, "loss": 0.7089, "lr": 1.5910739393470934e-05, "epoch": 6.566130473637176, "percentage": 65.66, "elapsed_time": "3:03:42", "remaining_time": "1:36:04", "throughput": 2306.62, "total_tokens": 25423784} {"current_steps": 44090, "total_steps": 67140, "loss": 0.7028, "lr": 1.5904685594898154e-05, "epoch": 6.566875186178136, "percentage": 65.67, "elapsed_time": "3:03:43", "remaining_time": "1:36:02", "throughput": 2306.65, "total_tokens": 25426792} {"current_steps": 44095, "total_steps": 67140, "loss": 0.6875, "lr": 1.589863241094974e-05, "epoch": 6.567619898719094, "percentage": 65.68, "elapsed_time": "3:03:44", "remaining_time": "1:36:01", "throughput": 2306.68, "total_tokens": 25429864} {"current_steps": 44100, "total_steps": 67140, "loss": 0.7349, "lr": 1.589257984203473e-05, "epoch": 6.568364611260054, "percentage": 65.68, "elapsed_time": "3:03:45", "remaining_time": "1:36:00", "throughput": 2306.69, "total_tokens": 25432552} {"current_steps": 44105, "total_steps": 67140, "loss": 0.4492, "lr": 1.588652788856215e-05, "epoch": 6.569109323801013, "percentage": 65.69, "elapsed_time": "3:03:46", "remaining_time": "1:35:58", "throughput": 2306.71, "total_tokens": 25435272} {"current_steps": 44110, "total_steps": 67140, "loss": 0.5535, "lr": 1.5880476550940975e-05, "epoch": 6.569854036341972, "percentage": 65.7, "elapsed_time": "3:03:47", "remaining_time": "1:35:57", "throughput": 2306.73, "total_tokens": 25438056} {"current_steps": 44115, "total_steps": 67140, "loss": 0.7107, "lr": 1.5874425829580108e-05, "epoch": 6.570598748882931, "percentage": 65.71, "elapsed_time": "3:03:48", "remaining_time": "1:35:56", "throughput": 2306.76, "total_tokens": 25441064} {"current_steps": 44120, "total_steps": 67140, "loss": 0.6491, "lr": 1.586837572488844e-05, "epoch": 6.57134346142389, "percentage": 65.71, "elapsed_time": "3:03:50", "remaining_time": "1:35:55", "throughput": 2306.78, "total_tokens": 25443912} {"current_steps": 44125, "total_steps": 67140, "loss": 0.5307, "lr": 1.586232623727482e-05, "epoch": 6.57208817396485, "percentage": 65.72, "elapsed_time": "3:03:51", "remaining_time": "1:35:53", "throughput": 2306.8, "total_tokens": 25446824} {"current_steps": 44130, "total_steps": 67140, "loss": 0.6339, "lr": 1.5856277367148047e-05, "epoch": 6.572832886505809, "percentage": 65.73, "elapsed_time": "3:03:52", "remaining_time": "1:35:52", "throughput": 2306.85, "total_tokens": 25450056} {"current_steps": 44135, "total_steps": 67140, "loss": 0.4987, "lr": 1.5850229114916864e-05, "epoch": 6.573577599046768, "percentage": 65.74, "elapsed_time": "3:03:53", "remaining_time": "1:35:51", "throughput": 2306.86, "total_tokens": 25452808} {"current_steps": 44140, "total_steps": 67140, "loss": 0.6637, "lr": 1.5844181480989995e-05, "epoch": 6.574322311587727, "percentage": 65.74, "elapsed_time": "3:03:54", "remaining_time": "1:35:49", "throughput": 2306.88, "total_tokens": 25455560} {"current_steps": 44145, "total_steps": 67140, "loss": 0.4832, "lr": 1.5838134465776126e-05, "epoch": 6.575067024128686, "percentage": 65.75, "elapsed_time": "3:03:55", "remaining_time": "1:35:48", "throughput": 2306.9, "total_tokens": 25458376} {"current_steps": 44150, "total_steps": 67140, "loss": 0.6143, "lr": 1.583208806968387e-05, "epoch": 6.575811736669645, "percentage": 65.76, "elapsed_time": "3:03:56", "remaining_time": "1:35:47", "throughput": 2306.92, "total_tokens": 25461224} {"current_steps": 44155, "total_steps": 67140, "loss": 0.6383, "lr": 1.5826042293121835e-05, "epoch": 6.576556449210605, "percentage": 65.77, "elapsed_time": "3:03:58", "remaining_time": "1:35:45", "throughput": 2306.97, "total_tokens": 25464456} {"current_steps": 44160, "total_steps": 67140, "loss": 0.5247, "lr": 1.581999713649856e-05, "epoch": 6.5773011617515635, "percentage": 65.77, "elapsed_time": "3:03:59", "remaining_time": "1:35:44", "throughput": 2306.99, "total_tokens": 25467400} {"current_steps": 44165, "total_steps": 67140, "loss": 0.5949, "lr": 1.5813952600222556e-05, "epoch": 6.578045874292523, "percentage": 65.78, "elapsed_time": "3:04:00", "remaining_time": "1:35:43", "throughput": 2307.01, "total_tokens": 25470152} {"current_steps": 44170, "total_steps": 67140, "loss": 0.5461, "lr": 1.58079086847023e-05, "epoch": 6.578790586833482, "percentage": 65.79, "elapsed_time": "3:04:01", "remaining_time": "1:35:41", "throughput": 2307.05, "total_tokens": 25473384} {"current_steps": 44175, "total_steps": 67140, "loss": 0.6678, "lr": 1.580186539034619e-05, "epoch": 6.579535299374442, "percentage": 65.8, "elapsed_time": "3:04:02", "remaining_time": "1:35:40", "throughput": 2307.1, "total_tokens": 25476648} {"current_steps": 44180, "total_steps": 67140, "loss": 0.7048, "lr": 1.579582271756262e-05, "epoch": 6.5802800119154, "percentage": 65.8, "elapsed_time": "3:04:03", "remaining_time": "1:35:39", "throughput": 2307.12, "total_tokens": 25479624} {"current_steps": 44185, "total_steps": 67140, "loss": 0.6317, "lr": 1.578978066675993e-05, "epoch": 6.58102472445636, "percentage": 65.81, "elapsed_time": "3:04:05", "remaining_time": "1:35:38", "throughput": 2307.14, "total_tokens": 25482440} {"current_steps": 44190, "total_steps": 67140, "loss": 0.5604, "lr": 1.578373923834641e-05, "epoch": 6.581769436997319, "percentage": 65.82, "elapsed_time": "3:04:06", "remaining_time": "1:35:36", "throughput": 2307.15, "total_tokens": 25485064} {"current_steps": 44195, "total_steps": 67140, "loss": 0.5168, "lr": 1.5777698432730333e-05, "epoch": 6.582514149538278, "percentage": 65.83, "elapsed_time": "3:04:07", "remaining_time": "1:35:35", "throughput": 2307.17, "total_tokens": 25487912} {"current_steps": 44200, "total_steps": 67140, "loss": 0.5403, "lr": 1.5771658250319895e-05, "epoch": 6.583258862079237, "percentage": 65.83, "elapsed_time": "3:04:08", "remaining_time": "1:35:34", "throughput": 2307.21, "total_tokens": 25491048} {"current_steps": 44205, "total_steps": 67140, "loss": 0.7629, "lr": 1.576561869152327e-05, "epoch": 6.584003574620197, "percentage": 65.84, "elapsed_time": "3:04:09", "remaining_time": "1:35:32", "throughput": 2307.24, "total_tokens": 25494056} {"current_steps": 44210, "total_steps": 67140, "loss": 0.7293, "lr": 1.5759579756748603e-05, "epoch": 6.584748287161156, "percentage": 65.85, "elapsed_time": "3:04:10", "remaining_time": "1:35:31", "throughput": 2307.27, "total_tokens": 25497128} {"current_steps": 44215, "total_steps": 67140, "loss": 0.4953, "lr": 1.5753541446403964e-05, "epoch": 6.585492999702115, "percentage": 65.85, "elapsed_time": "3:04:11", "remaining_time": "1:35:30", "throughput": 2307.31, "total_tokens": 25500360} {"current_steps": 44220, "total_steps": 67140, "loss": 0.6095, "lr": 1.574750376089739e-05, "epoch": 6.586237712243074, "percentage": 65.86, "elapsed_time": "3:04:13", "remaining_time": "1:35:29", "throughput": 2307.35, "total_tokens": 25503528} {"current_steps": 44225, "total_steps": 67140, "loss": 0.535, "lr": 1.5741466700636898e-05, "epoch": 6.586982424784034, "percentage": 65.87, "elapsed_time": "3:04:14", "remaining_time": "1:35:27", "throughput": 2307.38, "total_tokens": 25506440} {"current_steps": 44230, "total_steps": 67140, "loss": 0.5428, "lr": 1.5735430266030447e-05, "epoch": 6.587727137324992, "percentage": 65.88, "elapsed_time": "3:04:15", "remaining_time": "1:35:26", "throughput": 2307.39, "total_tokens": 25509160} {"current_steps": 44235, "total_steps": 67140, "loss": 0.6533, "lr": 1.5729394457485946e-05, "epoch": 6.588471849865952, "percentage": 65.88, "elapsed_time": "3:04:16", "remaining_time": "1:35:25", "throughput": 2307.42, "total_tokens": 25512040} {"current_steps": 44240, "total_steps": 67140, "loss": 0.5166, "lr": 1.5723359275411283e-05, "epoch": 6.589216562406911, "percentage": 65.89, "elapsed_time": "3:04:17", "remaining_time": "1:35:23", "throughput": 2307.43, "total_tokens": 25514664} {"current_steps": 44245, "total_steps": 67140, "loss": 0.6136, "lr": 1.571732472021428e-05, "epoch": 6.58996127494787, "percentage": 65.9, "elapsed_time": "3:04:18", "remaining_time": "1:35:22", "throughput": 2307.45, "total_tokens": 25517448} {"current_steps": 44250, "total_steps": 67140, "loss": 0.6188, "lr": 1.571129079230274e-05, "epoch": 6.590705987488829, "percentage": 65.91, "elapsed_time": "3:04:19", "remaining_time": "1:35:21", "throughput": 2307.46, "total_tokens": 25520168} {"current_steps": 44255, "total_steps": 67140, "loss": 0.5805, "lr": 1.570525749208439e-05, "epoch": 6.591450700029789, "percentage": 65.91, "elapsed_time": "3:04:20", "remaining_time": "1:35:19", "throughput": 2307.47, "total_tokens": 25522792} {"current_steps": 44260, "total_steps": 67140, "loss": 0.6394, "lr": 1.5699224819966957e-05, "epoch": 6.592195412570748, "percentage": 65.92, "elapsed_time": "3:04:22", "remaining_time": "1:35:18", "throughput": 2307.49, "total_tokens": 25525640} {"current_steps": 44265, "total_steps": 67140, "loss": 0.5418, "lr": 1.5693192776358092e-05, "epoch": 6.592940125111707, "percentage": 65.93, "elapsed_time": "3:04:23", "remaining_time": "1:35:17", "throughput": 2307.52, "total_tokens": 25528648} {"current_steps": 44270, "total_steps": 67140, "loss": 0.5255, "lr": 1.568716136166542e-05, "epoch": 6.593684837652666, "percentage": 65.94, "elapsed_time": "3:04:24", "remaining_time": "1:35:15", "throughput": 2307.55, "total_tokens": 25531624} {"current_steps": 44275, "total_steps": 67140, "loss": 0.4335, "lr": 1.5681130576296528e-05, "epoch": 6.594429550193626, "percentage": 65.94, "elapsed_time": "3:04:25", "remaining_time": "1:35:14", "throughput": 2307.55, "total_tokens": 25534184} {"current_steps": 44280, "total_steps": 67140, "loss": 0.5285, "lr": 1.5675100420658935e-05, "epoch": 6.595174262734584, "percentage": 65.95, "elapsed_time": "3:04:26", "remaining_time": "1:35:13", "throughput": 2307.58, "total_tokens": 25537096} {"current_steps": 44285, "total_steps": 67140, "loss": 0.7082, "lr": 1.5669070895160143e-05, "epoch": 6.595918975275543, "percentage": 65.96, "elapsed_time": "3:04:27", "remaining_time": "1:35:11", "throughput": 2307.6, "total_tokens": 25539912} {"current_steps": 44290, "total_steps": 67140, "loss": 0.4928, "lr": 1.566304200020761e-05, "epoch": 6.596663687816503, "percentage": 65.97, "elapsed_time": "3:04:28", "remaining_time": "1:35:10", "throughput": 2307.63, "total_tokens": 25542952} {"current_steps": 44295, "total_steps": 67140, "loss": 0.7712, "lr": 1.565701373620874e-05, "epoch": 6.5974084003574625, "percentage": 65.97, "elapsed_time": "3:04:30", "remaining_time": "1:35:09", "throughput": 2307.65, "total_tokens": 25545864} {"current_steps": 44300, "total_steps": 67140, "loss": 0.6012, "lr": 1.5650986103570887e-05, "epoch": 6.598153112898421, "percentage": 65.98, "elapsed_time": "3:04:31", "remaining_time": "1:35:08", "throughput": 2307.68, "total_tokens": 25548744} {"current_steps": 44305, "total_steps": 67140, "loss": 0.5142, "lr": 1.5644959102701384e-05, "epoch": 6.59889782543938, "percentage": 65.99, "elapsed_time": "3:04:32", "remaining_time": "1:35:06", "throughput": 2307.74, "total_tokens": 25552296} {"current_steps": 44310, "total_steps": 67140, "loss": 0.6244, "lr": 1.5638932734007515e-05, "epoch": 6.59964253798034, "percentage": 66.0, "elapsed_time": "3:04:33", "remaining_time": "1:35:05", "throughput": 2307.75, "total_tokens": 25554952} {"current_steps": 44315, "total_steps": 67140, "loss": 0.5498, "lr": 1.563290699789651e-05, "epoch": 6.600387250521299, "percentage": 66.0, "elapsed_time": "3:04:34", "remaining_time": "1:35:04", "throughput": 2307.76, "total_tokens": 25557704} {"current_steps": 44320, "total_steps": 67140, "loss": 0.6141, "lr": 1.562688189477556e-05, "epoch": 6.601131963062258, "percentage": 66.01, "elapsed_time": "3:04:35", "remaining_time": "1:35:02", "throughput": 2307.79, "total_tokens": 25560648} {"current_steps": 44325, "total_steps": 67140, "loss": 0.5628, "lr": 1.562085742505183e-05, "epoch": 6.601876675603217, "percentage": 66.02, "elapsed_time": "3:04:36", "remaining_time": "1:35:01", "throughput": 2307.84, "total_tokens": 25563848} {"current_steps": 44330, "total_steps": 67140, "loss": 0.4156, "lr": 1.5614833589132427e-05, "epoch": 6.602621388144176, "percentage": 66.03, "elapsed_time": "3:04:38", "remaining_time": "1:35:00", "throughput": 2307.87, "total_tokens": 25566920} {"current_steps": 44335, "total_steps": 67140, "loss": 0.4142, "lr": 1.5608810387424406e-05, "epoch": 6.603366100685135, "percentage": 66.03, "elapsed_time": "3:04:39", "remaining_time": "1:34:58", "throughput": 2307.88, "total_tokens": 25569576} {"current_steps": 44340, "total_steps": 67140, "loss": 0.4665, "lr": 1.5602787820334798e-05, "epoch": 6.604110813226095, "percentage": 66.04, "elapsed_time": "3:04:40", "remaining_time": "1:34:57", "throughput": 2307.91, "total_tokens": 25572584} {"current_steps": 44345, "total_steps": 67140, "loss": 0.6174, "lr": 1.559676588827058e-05, "epoch": 6.604855525767054, "percentage": 66.05, "elapsed_time": "3:04:41", "remaining_time": "1:34:56", "throughput": 2307.94, "total_tokens": 25575464} {"current_steps": 44350, "total_steps": 67140, "loss": 0.5569, "lr": 1.5590744591638693e-05, "epoch": 6.605600238308013, "percentage": 66.06, "elapsed_time": "3:04:42", "remaining_time": "1:34:55", "throughput": 2307.95, "total_tokens": 25578248} {"current_steps": 44355, "total_steps": 67140, "loss": 0.5029, "lr": 1.5584723930846034e-05, "epoch": 6.606344950848972, "percentage": 66.06, "elapsed_time": "3:04:43", "remaining_time": "1:34:53", "throughput": 2307.96, "total_tokens": 25580904} {"current_steps": 44360, "total_steps": 67140, "loss": 0.5505, "lr": 1.557870390629945e-05, "epoch": 6.607089663389932, "percentage": 66.07, "elapsed_time": "3:04:44", "remaining_time": "1:34:52", "throughput": 2308.0, "total_tokens": 25584040} {"current_steps": 44365, "total_steps": 67140, "loss": 0.4755, "lr": 1.5572684518405757e-05, "epoch": 6.60783437593089, "percentage": 66.08, "elapsed_time": "3:04:46", "remaining_time": "1:34:51", "throughput": 2308.02, "total_tokens": 25586856} {"current_steps": 44370, "total_steps": 67140, "loss": 0.668, "lr": 1.5566665767571708e-05, "epoch": 6.60857908847185, "percentage": 66.09, "elapsed_time": "3:04:47", "remaining_time": "1:34:49", "throughput": 2308.06, "total_tokens": 25590088} {"current_steps": 44375, "total_steps": 67140, "loss": 0.6498, "lr": 1.5560647654204043e-05, "epoch": 6.609323801012809, "percentage": 66.09, "elapsed_time": "3:04:48", "remaining_time": "1:34:48", "throughput": 2308.08, "total_tokens": 25592872} {"current_steps": 44380, "total_steps": 67140, "loss": 0.7355, "lr": 1.5554630178709427e-05, "epoch": 6.6100685135537685, "percentage": 66.1, "elapsed_time": "3:04:49", "remaining_time": "1:34:47", "throughput": 2308.09, "total_tokens": 25595560} {"current_steps": 44385, "total_steps": 67140, "loss": 0.6936, "lr": 1.55486133414945e-05, "epoch": 6.610813226094727, "percentage": 66.11, "elapsed_time": "3:04:50", "remaining_time": "1:34:45", "throughput": 2308.12, "total_tokens": 25598568} {"current_steps": 44390, "total_steps": 67140, "loss": 0.8138, "lr": 1.5542597142965857e-05, "epoch": 6.611557938635687, "percentage": 66.12, "elapsed_time": "3:04:51", "remaining_time": "1:34:44", "throughput": 2308.15, "total_tokens": 25601512} {"current_steps": 44395, "total_steps": 67140, "loss": 0.6448, "lr": 1.5536581583530048e-05, "epoch": 6.612302651176646, "percentage": 66.12, "elapsed_time": "3:04:52", "remaining_time": "1:34:43", "throughput": 2308.18, "total_tokens": 25604520} {"current_steps": 44400, "total_steps": 67140, "loss": 0.8333, "lr": 1.5530566663593584e-05, "epoch": 6.613047363717605, "percentage": 66.13, "elapsed_time": "3:04:54", "remaining_time": "1:34:41", "throughput": 2308.21, "total_tokens": 25607400} {"current_steps": 44405, "total_steps": 67140, "loss": 0.8306, "lr": 1.552455238356292e-05, "epoch": 6.613792076258564, "percentage": 66.14, "elapsed_time": "3:04:55", "remaining_time": "1:34:40", "throughput": 2308.24, "total_tokens": 25610344} {"current_steps": 44410, "total_steps": 67140, "loss": 0.6609, "lr": 1.551853874384448e-05, "epoch": 6.614536788799524, "percentage": 66.15, "elapsed_time": "3:04:56", "remaining_time": "1:34:39", "throughput": 2308.26, "total_tokens": 25613288} {"current_steps": 44415, "total_steps": 67140, "loss": 0.7555, "lr": 1.5512525744844656e-05, "epoch": 6.615281501340482, "percentage": 66.15, "elapsed_time": "3:04:57", "remaining_time": "1:34:38", "throughput": 2308.27, "total_tokens": 25615912} {"current_steps": 44420, "total_steps": 67140, "loss": 0.5873, "lr": 1.5506513386969757e-05, "epoch": 6.616026213881442, "percentage": 66.16, "elapsed_time": "3:04:58", "remaining_time": "1:34:36", "throughput": 2308.28, "total_tokens": 25618568} {"current_steps": 44425, "total_steps": 67140, "loss": 0.6303, "lr": 1.550050167062609e-05, "epoch": 6.616770926422401, "percentage": 66.17, "elapsed_time": "3:04:59", "remaining_time": "1:34:35", "throughput": 2308.3, "total_tokens": 25621320} {"current_steps": 44430, "total_steps": 67140, "loss": 0.5748, "lr": 1.549449059621989e-05, "epoch": 6.6175156389633605, "percentage": 66.18, "elapsed_time": "3:05:00", "remaining_time": "1:34:34", "throughput": 2308.32, "total_tokens": 25624232} {"current_steps": 44435, "total_steps": 67140, "loss": 0.5573, "lr": 1.5488480164157375e-05, "epoch": 6.618260351504319, "percentage": 66.18, "elapsed_time": "3:05:01", "remaining_time": "1:34:32", "throughput": 2308.34, "total_tokens": 25626984} {"current_steps": 44440, "total_steps": 67140, "loss": 0.6766, "lr": 1.5482470374844698e-05, "epoch": 6.619005064045279, "percentage": 66.19, "elapsed_time": "3:05:03", "remaining_time": "1:34:31", "throughput": 2308.35, "total_tokens": 25629672} {"current_steps": 44445, "total_steps": 67140, "loss": 0.579, "lr": 1.5476461228687976e-05, "epoch": 6.619749776586238, "percentage": 66.2, "elapsed_time": "3:05:04", "remaining_time": "1:34:30", "throughput": 2308.37, "total_tokens": 25632456} {"current_steps": 44450, "total_steps": 67140, "loss": 0.4291, "lr": 1.5470452726093287e-05, "epoch": 6.620494489127196, "percentage": 66.2, "elapsed_time": "3:05:05", "remaining_time": "1:34:28", "throughput": 2308.41, "total_tokens": 25635688} {"current_steps": 44455, "total_steps": 67140, "loss": 0.6871, "lr": 1.5464444867466666e-05, "epoch": 6.621239201668156, "percentage": 66.21, "elapsed_time": "3:05:06", "remaining_time": "1:34:27", "throughput": 2308.43, "total_tokens": 25638472} {"current_steps": 44460, "total_steps": 67140, "loss": 0.5508, "lr": 1.5458437653214088e-05, "epoch": 6.621983914209116, "percentage": 66.22, "elapsed_time": "3:05:07", "remaining_time": "1:34:26", "throughput": 2308.44, "total_tokens": 25641288} {"current_steps": 44465, "total_steps": 67140, "loss": 0.6199, "lr": 1.545243108374149e-05, "epoch": 6.6227286267500745, "percentage": 66.23, "elapsed_time": "3:05:08", "remaining_time": "1:34:24", "throughput": 2308.48, "total_tokens": 25644392} {"current_steps": 44470, "total_steps": 67140, "loss": 0.7135, "lr": 1.544642515945479e-05, "epoch": 6.623473339291033, "percentage": 66.23, "elapsed_time": "3:05:09", "remaining_time": "1:34:23", "throughput": 2308.5, "total_tokens": 25647240} {"current_steps": 44475, "total_steps": 67140, "loss": 0.6332, "lr": 1.5440419880759838e-05, "epoch": 6.624218051831993, "percentage": 66.24, "elapsed_time": "3:05:11", "remaining_time": "1:34:22", "throughput": 2308.51, "total_tokens": 25649928} {"current_steps": 44480, "total_steps": 67140, "loss": 0.5243, "lr": 1.5434415248062435e-05, "epoch": 6.6249627643729525, "percentage": 66.25, "elapsed_time": "3:05:12", "remaining_time": "1:34:21", "throughput": 2308.53, "total_tokens": 25652808} {"current_steps": 44485, "total_steps": 67140, "loss": 0.5411, "lr": 1.542841126176836e-05, "epoch": 6.625707476913911, "percentage": 66.26, "elapsed_time": "3:05:13", "remaining_time": "1:34:19", "throughput": 2308.56, "total_tokens": 25655688} {"current_steps": 44490, "total_steps": 67140, "loss": 0.6819, "lr": 1.5422407922283343e-05, "epoch": 6.62645218945487, "percentage": 66.26, "elapsed_time": "3:05:14", "remaining_time": "1:34:18", "throughput": 2308.57, "total_tokens": 25658472} {"current_steps": 44495, "total_steps": 67140, "loss": 0.5016, "lr": 1.5416405230013065e-05, "epoch": 6.62719690199583, "percentage": 66.27, "elapsed_time": "3:05:15", "remaining_time": "1:34:17", "throughput": 2308.59, "total_tokens": 25661224} {"current_steps": 44500, "total_steps": 67140, "loss": 0.7057, "lr": 1.5410403185363147e-05, "epoch": 6.627941614536788, "percentage": 66.28, "elapsed_time": "3:05:16", "remaining_time": "1:34:15", "throughput": 2308.63, "total_tokens": 25664424} {"current_steps": 44505, "total_steps": 67140, "loss": 0.671, "lr": 1.540440178873919e-05, "epoch": 6.628686327077748, "percentage": 66.29, "elapsed_time": "3:05:17", "remaining_time": "1:34:14", "throughput": 2308.66, "total_tokens": 25667464} {"current_steps": 44510, "total_steps": 67140, "loss": 0.6115, "lr": 1.539840104054676e-05, "epoch": 6.629431039618707, "percentage": 66.29, "elapsed_time": "3:05:19", "remaining_time": "1:34:13", "throughput": 2308.7, "total_tokens": 25670504} {"current_steps": 44515, "total_steps": 67140, "loss": 0.6816, "lr": 1.5392400941191337e-05, "epoch": 6.6301757521596665, "percentage": 66.3, "elapsed_time": "3:05:20", "remaining_time": "1:34:11", "throughput": 2308.72, "total_tokens": 25673480} {"current_steps": 44520, "total_steps": 67140, "loss": 0.6199, "lr": 1.53864014910784e-05, "epoch": 6.630920464700625, "percentage": 66.31, "elapsed_time": "3:05:21", "remaining_time": "1:34:10", "throughput": 2308.74, "total_tokens": 25676296} {"current_steps": 44525, "total_steps": 67140, "loss": 0.6634, "lr": 1.538040269061337e-05, "epoch": 6.631665177241585, "percentage": 66.32, "elapsed_time": "3:05:22", "remaining_time": "1:34:09", "throughput": 2308.76, "total_tokens": 25679176} {"current_steps": 44530, "total_steps": 67140, "loss": 0.5899, "lr": 1.5374404540201612e-05, "epoch": 6.632409889782544, "percentage": 66.32, "elapsed_time": "3:05:23", "remaining_time": "1:34:07", "throughput": 2308.78, "total_tokens": 25682024} {"current_steps": 44535, "total_steps": 67140, "loss": 0.5699, "lr": 1.5368407040248467e-05, "epoch": 6.633154602323503, "percentage": 66.33, "elapsed_time": "3:05:24", "remaining_time": "1:34:06", "throughput": 2308.81, "total_tokens": 25684904} {"current_steps": 44540, "total_steps": 67140, "loss": 0.5891, "lr": 1.536241019115921e-05, "epoch": 6.633899314864462, "percentage": 66.34, "elapsed_time": "3:05:25", "remaining_time": "1:34:05", "throughput": 2308.83, "total_tokens": 25687784} {"current_steps": 44545, "total_steps": 67140, "loss": 0.5142, "lr": 1.5356413993339088e-05, "epoch": 6.634644027405422, "percentage": 66.35, "elapsed_time": "3:05:27", "remaining_time": "1:34:04", "throughput": 2308.87, "total_tokens": 25691016} {"current_steps": 44550, "total_steps": 67140, "loss": 0.5673, "lr": 1.5350418447193298e-05, "epoch": 6.6353887399463805, "percentage": 66.35, "elapsed_time": "3:05:28", "remaining_time": "1:34:02", "throughput": 2308.89, "total_tokens": 25693896} {"current_steps": 44555, "total_steps": 67140, "loss": 0.6391, "lr": 1.5344423553126997e-05, "epoch": 6.63613345248734, "percentage": 66.36, "elapsed_time": "3:05:29", "remaining_time": "1:34:01", "throughput": 2308.92, "total_tokens": 25696776} {"current_steps": 44560, "total_steps": 67140, "loss": 0.6889, "lr": 1.53384293115453e-05, "epoch": 6.636878165028299, "percentage": 66.37, "elapsed_time": "3:05:30", "remaining_time": "1:34:00", "throughput": 2308.95, "total_tokens": 25699912} {"current_steps": 44565, "total_steps": 67140, "loss": 0.6271, "lr": 1.5332435722853263e-05, "epoch": 6.6376228775692585, "percentage": 66.38, "elapsed_time": "3:05:31", "remaining_time": "1:33:58", "throughput": 2308.97, "total_tokens": 25702632} {"current_steps": 44570, "total_steps": 67140, "loss": 0.6099, "lr": 1.532644278745592e-05, "epoch": 6.638367590110217, "percentage": 66.38, "elapsed_time": "3:05:32", "remaining_time": "1:33:57", "throughput": 2308.98, "total_tokens": 25705352} {"current_steps": 44575, "total_steps": 67140, "loss": 0.6796, "lr": 1.5320450505758247e-05, "epoch": 6.639112302651177, "percentage": 66.39, "elapsed_time": "3:05:33", "remaining_time": "1:33:56", "throughput": 2309.01, "total_tokens": 25708264} {"current_steps": 44580, "total_steps": 67140, "loss": 0.7682, "lr": 1.531445887816517e-05, "epoch": 6.639857015192136, "percentage": 66.4, "elapsed_time": "3:05:35", "remaining_time": "1:33:54", "throughput": 2309.02, "total_tokens": 25710984} {"current_steps": 44585, "total_steps": 67140, "loss": 0.5001, "lr": 1.530846790508158e-05, "epoch": 6.640601727733095, "percentage": 66.41, "elapsed_time": "3:05:36", "remaining_time": "1:33:53", "throughput": 2309.04, "total_tokens": 25713864} {"current_steps": 44590, "total_steps": 67140, "loss": 0.604, "lr": 1.5302477586912333e-05, "epoch": 6.641346440274054, "percentage": 66.41, "elapsed_time": "3:05:37", "remaining_time": "1:33:52", "throughput": 2309.07, "total_tokens": 25716744} {"current_steps": 44595, "total_steps": 67140, "loss": 0.7131, "lr": 1.5296487924062218e-05, "epoch": 6.642091152815014, "percentage": 66.42, "elapsed_time": "3:05:38", "remaining_time": "1:33:51", "throughput": 2309.11, "total_tokens": 25719976} {"current_steps": 44600, "total_steps": 67140, "loss": 0.5812, "lr": 1.5290498916935995e-05, "epoch": 6.6428358653559725, "percentage": 66.43, "elapsed_time": "3:05:39", "remaining_time": "1:33:49", "throughput": 2309.14, "total_tokens": 25723016} {"current_steps": 44605, "total_steps": 67140, "loss": 0.5882, "lr": 1.5284510565938385e-05, "epoch": 6.643580577896932, "percentage": 66.44, "elapsed_time": "3:05:40", "remaining_time": "1:33:48", "throughput": 2309.15, "total_tokens": 25725672} {"current_steps": 44610, "total_steps": 67140, "loss": 0.5632, "lr": 1.5278522871474045e-05, "epoch": 6.644325290437891, "percentage": 66.44, "elapsed_time": "3:05:41", "remaining_time": "1:33:47", "throughput": 2309.17, "total_tokens": 25728584} {"current_steps": 44615, "total_steps": 67140, "loss": 0.5649, "lr": 1.527253583394762e-05, "epoch": 6.6450700029788505, "percentage": 66.45, "elapsed_time": "3:05:43", "remaining_time": "1:33:45", "throughput": 2309.21, "total_tokens": 25731688} {"current_steps": 44620, "total_steps": 67140, "loss": 0.482, "lr": 1.5266549453763655e-05, "epoch": 6.645814715519809, "percentage": 66.46, "elapsed_time": "3:05:44", "remaining_time": "1:33:44", "throughput": 2309.23, "total_tokens": 25734504} {"current_steps": 44625, "total_steps": 67140, "loss": 0.5285, "lr": 1.5260563731326715e-05, "epoch": 6.646559428060769, "percentage": 66.47, "elapsed_time": "3:05:45", "remaining_time": "1:33:43", "throughput": 2309.25, "total_tokens": 25737288} {"current_steps": 44630, "total_steps": 67140, "loss": 0.5673, "lr": 1.5254578667041278e-05, "epoch": 6.647304140601728, "percentage": 66.47, "elapsed_time": "3:05:46", "remaining_time": "1:33:41", "throughput": 2309.26, "total_tokens": 25740008} {"current_steps": 44635, "total_steps": 67140, "loss": 0.4631, "lr": 1.5248594261311789e-05, "epoch": 6.6480488531426865, "percentage": 66.48, "elapsed_time": "3:05:47", "remaining_time": "1:33:40", "throughput": 2309.28, "total_tokens": 25742792} {"current_steps": 44640, "total_steps": 67140, "loss": 0.4534, "lr": 1.524261051454266e-05, "epoch": 6.648793565683646, "percentage": 66.49, "elapsed_time": "3:05:48", "remaining_time": "1:33:39", "throughput": 2309.29, "total_tokens": 25745416} {"current_steps": 44645, "total_steps": 67140, "loss": 0.5834, "lr": 1.5236627427138237e-05, "epoch": 6.649538278224606, "percentage": 66.5, "elapsed_time": "3:05:49", "remaining_time": "1:33:37", "throughput": 2309.33, "total_tokens": 25748552} {"current_steps": 44650, "total_steps": 67140, "loss": 0.7129, "lr": 1.5230644999502835e-05, "epoch": 6.6502829907655645, "percentage": 66.5, "elapsed_time": "3:05:50", "remaining_time": "1:33:36", "throughput": 2309.35, "total_tokens": 25751400} {"current_steps": 44655, "total_steps": 67140, "loss": 0.6122, "lr": 1.5224663232040736e-05, "epoch": 6.651027703306523, "percentage": 66.51, "elapsed_time": "3:05:52", "remaining_time": "1:33:35", "throughput": 2309.39, "total_tokens": 25754568} {"current_steps": 44660, "total_steps": 67140, "loss": 0.483, "lr": 1.5218682125156148e-05, "epoch": 6.651772415847483, "percentage": 66.52, "elapsed_time": "3:05:53", "remaining_time": "1:33:34", "throughput": 2309.41, "total_tokens": 25757448} {"current_steps": 44665, "total_steps": 67140, "loss": 0.7994, "lr": 1.521270167925325e-05, "epoch": 6.652517128388443, "percentage": 66.53, "elapsed_time": "3:05:54", "remaining_time": "1:33:32", "throughput": 2309.43, "total_tokens": 25760296} {"current_steps": 44670, "total_steps": 67140, "loss": 0.5983, "lr": 1.5206721894736178e-05, "epoch": 6.653261840929401, "percentage": 66.53, "elapsed_time": "3:05:55", "remaining_time": "1:33:31", "throughput": 2309.46, "total_tokens": 25763176} {"current_steps": 44675, "total_steps": 67140, "loss": 0.4766, "lr": 1.520074277200903e-05, "epoch": 6.65400655347036, "percentage": 66.54, "elapsed_time": "3:05:56", "remaining_time": "1:33:30", "throughput": 2309.49, "total_tokens": 25766216} {"current_steps": 44680, "total_steps": 67140, "loss": 0.516, "lr": 1.519476431147584e-05, "epoch": 6.65475126601132, "percentage": 66.55, "elapsed_time": "3:05:57", "remaining_time": "1:33:28", "throughput": 2309.51, "total_tokens": 25769192} {"current_steps": 44685, "total_steps": 67140, "loss": 0.4787, "lr": 1.518878651354061e-05, "epoch": 6.6554959785522785, "percentage": 66.55, "elapsed_time": "3:05:59", "remaining_time": "1:33:27", "throughput": 2309.54, "total_tokens": 25772200} {"current_steps": 44690, "total_steps": 67140, "loss": 0.6918, "lr": 1.5182809378607304e-05, "epoch": 6.656240691093238, "percentage": 66.56, "elapsed_time": "3:06:00", "remaining_time": "1:33:26", "throughput": 2309.55, "total_tokens": 25774888} {"current_steps": 44695, "total_steps": 67140, "loss": 0.5968, "lr": 1.5176832907079836e-05, "epoch": 6.656985403634197, "percentage": 66.57, "elapsed_time": "3:06:01", "remaining_time": "1:33:24", "throughput": 2309.58, "total_tokens": 25777864} {"current_steps": 44700, "total_steps": 67140, "loss": 0.5345, "lr": 1.5170857099362045e-05, "epoch": 6.6577301161751565, "percentage": 66.58, "elapsed_time": "3:06:02", "remaining_time": "1:33:23", "throughput": 2309.6, "total_tokens": 25780520} {"current_steps": 44705, "total_steps": 67140, "loss": 0.5911, "lr": 1.5164881955857774e-05, "epoch": 6.658474828716115, "percentage": 66.58, "elapsed_time": "3:06:03", "remaining_time": "1:33:22", "throughput": 2309.62, "total_tokens": 25783368} {"current_steps": 44710, "total_steps": 67140, "loss": 0.5358, "lr": 1.5158907476970796e-05, "epoch": 6.659219541257075, "percentage": 66.59, "elapsed_time": "3:06:04", "remaining_time": "1:33:21", "throughput": 2309.66, "total_tokens": 25786664} {"current_steps": 44715, "total_steps": 67140, "loss": 0.5782, "lr": 1.5152933663104834e-05, "epoch": 6.659964253798034, "percentage": 66.6, "elapsed_time": "3:06:05", "remaining_time": "1:33:19", "throughput": 2309.69, "total_tokens": 25789672} {"current_steps": 44720, "total_steps": 67140, "loss": 0.5609, "lr": 1.5146960514663583e-05, "epoch": 6.660708966338993, "percentage": 66.61, "elapsed_time": "3:06:06", "remaining_time": "1:33:18", "throughput": 2309.71, "total_tokens": 25792456} {"current_steps": 44725, "total_steps": 67140, "loss": 0.5285, "lr": 1.5140988032050685e-05, "epoch": 6.661453678879952, "percentage": 66.61, "elapsed_time": "3:06:08", "remaining_time": "1:33:17", "throughput": 2309.72, "total_tokens": 25795176} {"current_steps": 44730, "total_steps": 67140, "loss": 0.8575, "lr": 1.5135016215669724e-05, "epoch": 6.662198391420912, "percentage": 66.62, "elapsed_time": "3:06:09", "remaining_time": "1:33:15", "throughput": 2309.75, "total_tokens": 25798152} {"current_steps": 44735, "total_steps": 67140, "loss": 0.6822, "lr": 1.5129045065924271e-05, "epoch": 6.6629431039618705, "percentage": 66.63, "elapsed_time": "3:06:10", "remaining_time": "1:33:14", "throughput": 2309.78, "total_tokens": 25801064} {"current_steps": 44740, "total_steps": 67140, "loss": 0.595, "lr": 1.5123074583217812e-05, "epoch": 6.66368781650283, "percentage": 66.64, "elapsed_time": "3:06:11", "remaining_time": "1:33:13", "throughput": 2309.79, "total_tokens": 25803752} {"current_steps": 44745, "total_steps": 67140, "loss": 0.6796, "lr": 1.5117104767953818e-05, "epoch": 6.664432529043789, "percentage": 66.64, "elapsed_time": "3:06:12", "remaining_time": "1:33:11", "throughput": 2309.83, "total_tokens": 25806984} {"current_steps": 44750, "total_steps": 67140, "loss": 0.3611, "lr": 1.51111356205357e-05, "epoch": 6.665177241584749, "percentage": 66.65, "elapsed_time": "3:06:13", "remaining_time": "1:33:10", "throughput": 2309.85, "total_tokens": 25809832} {"current_steps": 44755, "total_steps": 67140, "loss": 0.6082, "lr": 1.5105167141366836e-05, "epoch": 6.665921954125707, "percentage": 66.66, "elapsed_time": "3:06:14", "remaining_time": "1:33:09", "throughput": 2309.88, "total_tokens": 25812840} {"current_steps": 44760, "total_steps": 67140, "loss": 0.4372, "lr": 1.509919933085054e-05, "epoch": 6.666666666666667, "percentage": 66.67, "elapsed_time": "3:06:16", "remaining_time": "1:33:08", "throughput": 2309.91, "total_tokens": 25815880} {"current_steps": 44765, "total_steps": 67140, "loss": 0.5941, "lr": 1.5093232189390103e-05, "epoch": 6.667411379207626, "percentage": 66.67, "elapsed_time": "3:06:17", "remaining_time": "1:33:06", "throughput": 2309.93, "total_tokens": 25818696} {"current_steps": 44770, "total_steps": 67140, "loss": 0.5719, "lr": 1.508726571738876e-05, "epoch": 6.668156091748585, "percentage": 66.68, "elapsed_time": "3:06:18", "remaining_time": "1:33:05", "throughput": 2309.99, "total_tokens": 25822312} {"current_steps": 44775, "total_steps": 67140, "loss": 0.6246, "lr": 1.5081299915249702e-05, "epoch": 6.668900804289544, "percentage": 66.69, "elapsed_time": "3:06:19", "remaining_time": "1:33:04", "throughput": 2310.06, "total_tokens": 25825832} {"current_steps": 44780, "total_steps": 67140, "loss": 0.5791, "lr": 1.507533478337606e-05, "epoch": 6.669645516830504, "percentage": 66.7, "elapsed_time": "3:06:20", "remaining_time": "1:33:02", "throughput": 2310.08, "total_tokens": 25828744} {"current_steps": 44785, "total_steps": 67140, "loss": 0.5966, "lr": 1.5069370322170941e-05, "epoch": 6.6703902293714625, "percentage": 66.7, "elapsed_time": "3:06:22", "remaining_time": "1:33:01", "throughput": 2310.11, "total_tokens": 25831752} {"current_steps": 44790, "total_steps": 67140, "loss": 0.7012, "lr": 1.5063406532037408e-05, "epoch": 6.671134941912422, "percentage": 66.71, "elapsed_time": "3:06:23", "remaining_time": "1:33:00", "throughput": 2310.14, "total_tokens": 25834664} {"current_steps": 44795, "total_steps": 67140, "loss": 0.4449, "lr": 1.5057443413378458e-05, "epoch": 6.671879654453381, "percentage": 66.72, "elapsed_time": "3:06:24", "remaining_time": "1:32:59", "throughput": 2310.15, "total_tokens": 25837384} {"current_steps": 44800, "total_steps": 67140, "loss": 0.6521, "lr": 1.5051480966597054e-05, "epoch": 6.67262436699434, "percentage": 66.73, "elapsed_time": "3:06:25", "remaining_time": "1:32:57", "throughput": 2310.18, "total_tokens": 25840328} {"current_steps": 44805, "total_steps": 67140, "loss": 0.6892, "lr": 1.5045519192096128e-05, "epoch": 6.673369079535299, "percentage": 66.73, "elapsed_time": "3:06:26", "remaining_time": "1:32:56", "throughput": 2310.21, "total_tokens": 25843336} {"current_steps": 44810, "total_steps": 67140, "loss": 0.6263, "lr": 1.5039558090278538e-05, "epoch": 6.674113792076259, "percentage": 66.74, "elapsed_time": "3:06:27", "remaining_time": "1:32:55", "throughput": 2310.22, "total_tokens": 25846056} {"current_steps": 44815, "total_steps": 67140, "loss": 0.5639, "lr": 1.5033597661547123e-05, "epoch": 6.674858504617218, "percentage": 66.75, "elapsed_time": "3:06:28", "remaining_time": "1:32:53", "throughput": 2310.24, "total_tokens": 25848904} {"current_steps": 44820, "total_steps": 67140, "loss": 0.8383, "lr": 1.5027637906304648e-05, "epoch": 6.6756032171581765, "percentage": 66.76, "elapsed_time": "3:06:29", "remaining_time": "1:32:52", "throughput": 2310.26, "total_tokens": 25851624} {"current_steps": 44825, "total_steps": 67140, "loss": 0.5714, "lr": 1.5021678824953867e-05, "epoch": 6.676347929699136, "percentage": 66.76, "elapsed_time": "3:06:31", "remaining_time": "1:32:51", "throughput": 2310.29, "total_tokens": 25854568} {"current_steps": 44830, "total_steps": 67140, "loss": 0.4597, "lr": 1.5015720417897456e-05, "epoch": 6.677092642240096, "percentage": 66.77, "elapsed_time": "3:06:32", "remaining_time": "1:32:49", "throughput": 2310.31, "total_tokens": 25857512} {"current_steps": 44835, "total_steps": 67140, "loss": 0.4646, "lr": 1.5009762685538065e-05, "epoch": 6.677837354781055, "percentage": 66.78, "elapsed_time": "3:06:33", "remaining_time": "1:32:48", "throughput": 2310.33, "total_tokens": 25860360} {"current_steps": 44840, "total_steps": 67140, "loss": 0.5928, "lr": 1.5003805628278297e-05, "epoch": 6.678582067322013, "percentage": 66.79, "elapsed_time": "3:06:34", "remaining_time": "1:32:47", "throughput": 2310.36, "total_tokens": 25863304} {"current_steps": 44845, "total_steps": 67140, "loss": 0.7787, "lr": 1.49978492465207e-05, "epoch": 6.679326779862973, "percentage": 66.79, "elapsed_time": "3:06:35", "remaining_time": "1:32:45", "throughput": 2310.37, "total_tokens": 25865928} {"current_steps": 44850, "total_steps": 67140, "loss": 0.7098, "lr": 1.4991893540667783e-05, "epoch": 6.680071492403932, "percentage": 66.8, "elapsed_time": "3:06:36", "remaining_time": "1:32:44", "throughput": 2310.41, "total_tokens": 25869096} {"current_steps": 44855, "total_steps": 67140, "loss": 0.5339, "lr": 1.4985938511122027e-05, "epoch": 6.680816204944891, "percentage": 66.81, "elapsed_time": "3:06:37", "remaining_time": "1:32:43", "throughput": 2310.44, "total_tokens": 25872008} {"current_steps": 44860, "total_steps": 67140, "loss": 0.4742, "lr": 1.497998415828582e-05, "epoch": 6.68156091748585, "percentage": 66.82, "elapsed_time": "3:06:39", "remaining_time": "1:32:42", "throughput": 2310.48, "total_tokens": 25875240} {"current_steps": 44865, "total_steps": 67140, "loss": 0.8484, "lr": 1.4974030482561546e-05, "epoch": 6.68230563002681, "percentage": 66.82, "elapsed_time": "3:06:40", "remaining_time": "1:32:40", "throughput": 2310.52, "total_tokens": 25878472} {"current_steps": 44870, "total_steps": 67140, "loss": 0.7952, "lr": 1.4968077484351529e-05, "epoch": 6.6830503425677685, "percentage": 66.83, "elapsed_time": "3:06:41", "remaining_time": "1:32:39", "throughput": 2310.54, "total_tokens": 25881288} {"current_steps": 44875, "total_steps": 67140, "loss": 0.7376, "lr": 1.496212516405805e-05, "epoch": 6.683795055108728, "percentage": 66.84, "elapsed_time": "3:06:42", "remaining_time": "1:32:38", "throughput": 2310.56, "total_tokens": 25884104} {"current_steps": 44880, "total_steps": 67140, "loss": 0.7224, "lr": 1.4956173522083338e-05, "epoch": 6.684539767649687, "percentage": 66.85, "elapsed_time": "3:06:43", "remaining_time": "1:32:36", "throughput": 2310.58, "total_tokens": 25886856} {"current_steps": 44885, "total_steps": 67140, "loss": 0.6628, "lr": 1.4950222558829582e-05, "epoch": 6.685284480190647, "percentage": 66.85, "elapsed_time": "3:06:44", "remaining_time": "1:32:35", "throughput": 2310.61, "total_tokens": 25889896} {"current_steps": 44890, "total_steps": 67140, "loss": 0.6516, "lr": 1.4944272274698935e-05, "epoch": 6.686029192731605, "percentage": 66.86, "elapsed_time": "3:06:45", "remaining_time": "1:32:34", "throughput": 2310.64, "total_tokens": 25892904} {"current_steps": 44895, "total_steps": 67140, "loss": 0.505, "lr": 1.4938322670093485e-05, "epoch": 6.686773905272565, "percentage": 66.87, "elapsed_time": "3:06:47", "remaining_time": "1:32:32", "throughput": 2310.65, "total_tokens": 25895624} {"current_steps": 44900, "total_steps": 67140, "loss": 0.6139, "lr": 1.4932373745415273e-05, "epoch": 6.687518617813524, "percentage": 66.88, "elapsed_time": "3:06:48", "remaining_time": "1:32:31", "throughput": 2310.68, "total_tokens": 25898632} {"current_steps": 44905, "total_steps": 67140, "loss": 0.4351, "lr": 1.4926425501066313e-05, "epoch": 6.688263330354483, "percentage": 66.88, "elapsed_time": "3:06:49", "remaining_time": "1:32:30", "throughput": 2310.69, "total_tokens": 25901256} {"current_steps": 44910, "total_steps": 67140, "loss": 0.5134, "lr": 1.4920477937448565e-05, "epoch": 6.689008042895442, "percentage": 66.89, "elapsed_time": "3:06:50", "remaining_time": "1:32:29", "throughput": 2310.69, "total_tokens": 25903848} {"current_steps": 44915, "total_steps": 67140, "loss": 0.7171, "lr": 1.4914531054963931e-05, "epoch": 6.689752755436402, "percentage": 66.9, "elapsed_time": "3:06:51", "remaining_time": "1:32:27", "throughput": 2310.71, "total_tokens": 25906696} {"current_steps": 44920, "total_steps": 67140, "loss": 0.6976, "lr": 1.4908584854014294e-05, "epoch": 6.690497467977361, "percentage": 66.9, "elapsed_time": "3:06:52", "remaining_time": "1:32:26", "throughput": 2310.76, "total_tokens": 25909992} {"current_steps": 44925, "total_steps": 67140, "loss": 0.5656, "lr": 1.4902639335001456e-05, "epoch": 6.69124218051832, "percentage": 66.91, "elapsed_time": "3:06:53", "remaining_time": "1:32:25", "throughput": 2310.8, "total_tokens": 25913096} {"current_steps": 44930, "total_steps": 67140, "loss": 0.5392, "lr": 1.4896694498327195e-05, "epoch": 6.691986893059279, "percentage": 66.92, "elapsed_time": "3:06:55", "remaining_time": "1:32:23", "throughput": 2310.83, "total_tokens": 25916168} {"current_steps": 44935, "total_steps": 67140, "loss": 0.6705, "lr": 1.4890750344393254e-05, "epoch": 6.692731605600239, "percentage": 66.93, "elapsed_time": "3:06:56", "remaining_time": "1:32:22", "throughput": 2310.85, "total_tokens": 25919144} {"current_steps": 44940, "total_steps": 67140, "loss": 0.5869, "lr": 1.4884806873601303e-05, "epoch": 6.693476318141197, "percentage": 66.93, "elapsed_time": "3:06:57", "remaining_time": "1:32:21", "throughput": 2310.89, "total_tokens": 25922184} {"current_steps": 44945, "total_steps": 67140, "loss": 0.4864, "lr": 1.4878864086352973e-05, "epoch": 6.694221030682157, "percentage": 66.94, "elapsed_time": "3:06:58", "remaining_time": "1:32:20", "throughput": 2310.91, "total_tokens": 25925064} {"current_steps": 44950, "total_steps": 67140, "loss": 0.7257, "lr": 1.4872921983049854e-05, "epoch": 6.694965743223116, "percentage": 66.95, "elapsed_time": "3:06:59", "remaining_time": "1:32:18", "throughput": 2310.92, "total_tokens": 25927688} {"current_steps": 44955, "total_steps": 67140, "loss": 0.6683, "lr": 1.4866980564093503e-05, "epoch": 6.695710455764075, "percentage": 66.96, "elapsed_time": "3:07:00", "remaining_time": "1:32:17", "throughput": 2310.95, "total_tokens": 25930696} {"current_steps": 44960, "total_steps": 67140, "loss": 0.6142, "lr": 1.4861039829885398e-05, "epoch": 6.696455168305034, "percentage": 66.96, "elapsed_time": "3:07:01", "remaining_time": "1:32:16", "throughput": 2310.98, "total_tokens": 25933704} {"current_steps": 44965, "total_steps": 67140, "loss": 0.8313, "lr": 1.4855099780827004e-05, "epoch": 6.697199880845994, "percentage": 66.97, "elapsed_time": "3:07:03", "remaining_time": "1:32:14", "throughput": 2311.0, "total_tokens": 25936584} {"current_steps": 44970, "total_steps": 67140, "loss": 0.6565, "lr": 1.4849160417319724e-05, "epoch": 6.697944593386953, "percentage": 66.98, "elapsed_time": "3:07:04", "remaining_time": "1:32:13", "throughput": 2311.02, "total_tokens": 25939464} {"current_steps": 44975, "total_steps": 67140, "loss": 0.5335, "lr": 1.4843221739764906e-05, "epoch": 6.698689305927912, "percentage": 66.99, "elapsed_time": "3:07:05", "remaining_time": "1:32:12", "throughput": 2311.06, "total_tokens": 25942472} {"current_steps": 44980, "total_steps": 67140, "loss": 0.5507, "lr": 1.483728374856388e-05, "epoch": 6.699434018468871, "percentage": 66.99, "elapsed_time": "3:07:06", "remaining_time": "1:32:10", "throughput": 2311.07, "total_tokens": 25945192} {"current_steps": 44985, "total_steps": 67140, "loss": 0.5962, "lr": 1.4831346444117888e-05, "epoch": 6.70017873100983, "percentage": 67.0, "elapsed_time": "3:07:07", "remaining_time": "1:32:09", "throughput": 2311.1, "total_tokens": 25948232} {"current_steps": 44990, "total_steps": 67140, "loss": 0.6479, "lr": 1.4825409826828169e-05, "epoch": 6.700923443550789, "percentage": 67.01, "elapsed_time": "3:07:08", "remaining_time": "1:32:08", "throughput": 2311.12, "total_tokens": 25951112} {"current_steps": 44995, "total_steps": 67140, "loss": 0.4961, "lr": 1.4819473897095876e-05, "epoch": 6.701668156091749, "percentage": 67.02, "elapsed_time": "3:07:09", "remaining_time": "1:32:06", "throughput": 2311.15, "total_tokens": 25954056} {"current_steps": 45000, "total_steps": 67140, "loss": 0.6875, "lr": 1.4813538655322151e-05, "epoch": 6.702412868632708, "percentage": 67.02, "elapsed_time": "3:07:11", "remaining_time": "1:32:05", "throughput": 2311.18, "total_tokens": 25957096} {"current_steps": 45005, "total_steps": 67140, "loss": 0.7177, "lr": 1.4807604101908073e-05, "epoch": 6.703157581173667, "percentage": 67.03, "elapsed_time": "3:07:12", "remaining_time": "1:32:04", "throughput": 2311.18, "total_tokens": 25959688} {"current_steps": 45010, "total_steps": 67140, "loss": 0.6942, "lr": 1.4801670237254664e-05, "epoch": 6.703902293714626, "percentage": 67.04, "elapsed_time": "3:07:13", "remaining_time": "1:32:03", "throughput": 2311.21, "total_tokens": 25962728} {"current_steps": 45015, "total_steps": 67140, "loss": 0.6843, "lr": 1.4795737061762918e-05, "epoch": 6.704647006255585, "percentage": 67.05, "elapsed_time": "3:07:14", "remaining_time": "1:32:01", "throughput": 2311.23, "total_tokens": 25965480} {"current_steps": 45020, "total_steps": 67140, "loss": 0.5159, "lr": 1.4789804575833782e-05, "epoch": 6.705391718796545, "percentage": 67.05, "elapsed_time": "3:07:15", "remaining_time": "1:32:00", "throughput": 2311.26, "total_tokens": 25968488} {"current_steps": 45025, "total_steps": 67140, "loss": 0.4598, "lr": 1.4783872779868141e-05, "epoch": 6.706136431337503, "percentage": 67.06, "elapsed_time": "3:07:16", "remaining_time": "1:31:59", "throughput": 2311.29, "total_tokens": 25971496} {"current_steps": 45030, "total_steps": 67140, "loss": 0.5471, "lr": 1.4777941674266832e-05, "epoch": 6.706881143878463, "percentage": 67.07, "elapsed_time": "3:07:17", "remaining_time": "1:31:57", "throughput": 2311.29, "total_tokens": 25974120} {"current_steps": 45035, "total_steps": 67140, "loss": 0.5134, "lr": 1.4772011259430668e-05, "epoch": 6.707625856419422, "percentage": 67.08, "elapsed_time": "3:07:19", "remaining_time": "1:31:56", "throughput": 2311.31, "total_tokens": 25976840} {"current_steps": 45040, "total_steps": 67140, "loss": 0.7081, "lr": 1.4766081535760401e-05, "epoch": 6.708370568960381, "percentage": 67.08, "elapsed_time": "3:07:20", "remaining_time": "1:31:55", "throughput": 2311.35, "total_tokens": 25980104} {"current_steps": 45045, "total_steps": 67140, "loss": 0.5556, "lr": 1.4760152503656733e-05, "epoch": 6.70911528150134, "percentage": 67.09, "elapsed_time": "3:07:21", "remaining_time": "1:31:53", "throughput": 2311.36, "total_tokens": 25982664} {"current_steps": 45050, "total_steps": 67140, "loss": 0.5506, "lr": 1.4754224163520325e-05, "epoch": 6.7098599940423, "percentage": 67.1, "elapsed_time": "3:07:22", "remaining_time": "1:31:52", "throughput": 2311.41, "total_tokens": 25986024} {"current_steps": 45055, "total_steps": 67140, "loss": 0.5499, "lr": 1.4748296515751797e-05, "epoch": 6.710604706583259, "percentage": 67.11, "elapsed_time": "3:07:23", "remaining_time": "1:31:51", "throughput": 2311.42, "total_tokens": 25988808} {"current_steps": 45060, "total_steps": 67140, "loss": 0.7256, "lr": 1.4742369560751718e-05, "epoch": 6.711349419124218, "percentage": 67.11, "elapsed_time": "3:07:24", "remaining_time": "1:31:50", "throughput": 2311.45, "total_tokens": 25991720} {"current_steps": 45065, "total_steps": 67140, "loss": 0.5275, "lr": 1.4736443298920588e-05, "epoch": 6.712094131665177, "percentage": 67.12, "elapsed_time": "3:07:25", "remaining_time": "1:31:48", "throughput": 2311.46, "total_tokens": 25994408} {"current_steps": 45070, "total_steps": 67140, "loss": 0.5498, "lr": 1.4730517730658888e-05, "epoch": 6.712838844206137, "percentage": 67.13, "elapsed_time": "3:07:26", "remaining_time": "1:31:47", "throughput": 2311.48, "total_tokens": 25997128} {"current_steps": 45075, "total_steps": 67140, "loss": 0.5816, "lr": 1.4724592856367057e-05, "epoch": 6.713583556747095, "percentage": 67.14, "elapsed_time": "3:07:28", "remaining_time": "1:31:46", "throughput": 2311.49, "total_tokens": 25999880} {"current_steps": 45080, "total_steps": 67140, "loss": 0.5902, "lr": 1.4718668676445454e-05, "epoch": 6.714328269288055, "percentage": 67.14, "elapsed_time": "3:07:29", "remaining_time": "1:31:44", "throughput": 2311.51, "total_tokens": 26002696} {"current_steps": 45085, "total_steps": 67140, "loss": 0.6259, "lr": 1.4712745191294431e-05, "epoch": 6.715072981829014, "percentage": 67.15, "elapsed_time": "3:07:30", "remaining_time": "1:31:43", "throughput": 2311.54, "total_tokens": 26005768} {"current_steps": 45090, "total_steps": 67140, "loss": 0.6714, "lr": 1.4706822401314254e-05, "epoch": 6.7158176943699734, "percentage": 67.16, "elapsed_time": "3:07:31", "remaining_time": "1:31:42", "throughput": 2311.58, "total_tokens": 26008872} {"current_steps": 45095, "total_steps": 67140, "loss": 0.6274, "lr": 1.4700900306905172e-05, "epoch": 6.716562406910932, "percentage": 67.17, "elapsed_time": "3:07:32", "remaining_time": "1:31:40", "throughput": 2311.58, "total_tokens": 26011464} {"current_steps": 45100, "total_steps": 67140, "loss": 0.7091, "lr": 1.4694978908467384e-05, "epoch": 6.717307119451892, "percentage": 67.17, "elapsed_time": "3:07:33", "remaining_time": "1:31:39", "throughput": 2311.61, "total_tokens": 26014408} {"current_steps": 45105, "total_steps": 67140, "loss": 0.8458, "lr": 1.468905820640102e-05, "epoch": 6.718051831992851, "percentage": 67.18, "elapsed_time": "3:07:35", "remaining_time": "1:31:38", "throughput": 2311.65, "total_tokens": 26017672} {"current_steps": 45110, "total_steps": 67140, "loss": 0.7143, "lr": 1.4683138201106175e-05, "epoch": 6.71879654453381, "percentage": 67.19, "elapsed_time": "3:07:36", "remaining_time": "1:31:37", "throughput": 2311.68, "total_tokens": 26020744} {"current_steps": 45115, "total_steps": 67140, "loss": 0.5856, "lr": 1.4677218892982906e-05, "epoch": 6.719541257074769, "percentage": 67.2, "elapsed_time": "3:07:37", "remaining_time": "1:31:35", "throughput": 2311.73, "total_tokens": 26024040} {"current_steps": 45120, "total_steps": 67140, "loss": 0.6482, "lr": 1.467130028243122e-05, "epoch": 6.720285969615729, "percentage": 67.2, "elapsed_time": "3:07:38", "remaining_time": "1:31:34", "throughput": 2311.75, "total_tokens": 26026856} {"current_steps": 45125, "total_steps": 67140, "loss": 0.6595, "lr": 1.466538236985106e-05, "epoch": 6.721030682156687, "percentage": 67.21, "elapsed_time": "3:07:39", "remaining_time": "1:31:33", "throughput": 2311.77, "total_tokens": 26029704} {"current_steps": 45130, "total_steps": 67140, "loss": 0.6838, "lr": 1.4659465155642343e-05, "epoch": 6.721775394697647, "percentage": 67.22, "elapsed_time": "3:07:40", "remaining_time": "1:31:31", "throughput": 2311.78, "total_tokens": 26032360} {"current_steps": 45135, "total_steps": 67140, "loss": 0.5779, "lr": 1.4653548640204934e-05, "epoch": 6.722520107238606, "percentage": 67.23, "elapsed_time": "3:07:41", "remaining_time": "1:31:30", "throughput": 2311.81, "total_tokens": 26035336} {"current_steps": 45140, "total_steps": 67140, "loss": 0.5872, "lr": 1.4647632823938651e-05, "epoch": 6.7232648197795655, "percentage": 67.23, "elapsed_time": "3:07:43", "remaining_time": "1:31:29", "throughput": 2311.84, "total_tokens": 26038344} {"current_steps": 45145, "total_steps": 67140, "loss": 0.7809, "lr": 1.4641717707243238e-05, "epoch": 6.724009532320524, "percentage": 67.24, "elapsed_time": "3:07:44", "remaining_time": "1:31:27", "throughput": 2311.85, "total_tokens": 26041096} {"current_steps": 45150, "total_steps": 67140, "loss": 0.4995, "lr": 1.463580329051843e-05, "epoch": 6.724754244861483, "percentage": 67.25, "elapsed_time": "3:07:45", "remaining_time": "1:31:26", "throughput": 2311.88, "total_tokens": 26044008} {"current_steps": 45155, "total_steps": 67140, "loss": 0.49, "lr": 1.4629889574163903e-05, "epoch": 6.725498957402443, "percentage": 67.25, "elapsed_time": "3:07:46", "remaining_time": "1:31:25", "throughput": 2311.89, "total_tokens": 26046760} {"current_steps": 45160, "total_steps": 67140, "loss": 0.6199, "lr": 1.4623976558579272e-05, "epoch": 6.726243669943402, "percentage": 67.26, "elapsed_time": "3:07:47", "remaining_time": "1:31:24", "throughput": 2311.93, "total_tokens": 26049800} {"current_steps": 45165, "total_steps": 67140, "loss": 0.6147, "lr": 1.461806424416412e-05, "epoch": 6.726988382484361, "percentage": 67.27, "elapsed_time": "3:07:48", "remaining_time": "1:31:22", "throughput": 2311.94, "total_tokens": 26052584} {"current_steps": 45170, "total_steps": 67140, "loss": 0.7411, "lr": 1.4612152631317976e-05, "epoch": 6.72773309502532, "percentage": 67.28, "elapsed_time": "3:07:49", "remaining_time": "1:31:21", "throughput": 2311.98, "total_tokens": 26055720} {"current_steps": 45175, "total_steps": 67140, "loss": 0.6183, "lr": 1.4606241720440326e-05, "epoch": 6.7284778075662794, "percentage": 67.28, "elapsed_time": "3:07:51", "remaining_time": "1:31:20", "throughput": 2312.01, "total_tokens": 26058728} {"current_steps": 45180, "total_steps": 67140, "loss": 0.5948, "lr": 1.4600331511930609e-05, "epoch": 6.729222520107239, "percentage": 67.29, "elapsed_time": "3:07:52", "remaining_time": "1:31:18", "throughput": 2312.03, "total_tokens": 26061544} {"current_steps": 45185, "total_steps": 67140, "loss": 0.5993, "lr": 1.4594422006188196e-05, "epoch": 6.729967232648198, "percentage": 67.3, "elapsed_time": "3:07:53", "remaining_time": "1:31:17", "throughput": 2312.05, "total_tokens": 26064488} {"current_steps": 45190, "total_steps": 67140, "loss": 0.5591, "lr": 1.458851320361244e-05, "epoch": 6.730711945189157, "percentage": 67.31, "elapsed_time": "3:07:54", "remaining_time": "1:31:16", "throughput": 2312.07, "total_tokens": 26067304} {"current_steps": 45195, "total_steps": 67140, "loss": 0.5056, "lr": 1.458260510460264e-05, "epoch": 6.731456657730116, "percentage": 67.31, "elapsed_time": "3:07:55", "remaining_time": "1:31:14", "throughput": 2312.08, "total_tokens": 26069896} {"current_steps": 45200, "total_steps": 67140, "loss": 0.6106, "lr": 1.4576697709558023e-05, "epoch": 6.732201370271075, "percentage": 67.32, "elapsed_time": "3:07:56", "remaining_time": "1:31:13", "throughput": 2312.11, "total_tokens": 26072904} {"current_steps": 45205, "total_steps": 67140, "loss": 0.5874, "lr": 1.4570791018877796e-05, "epoch": 6.732946082812035, "percentage": 67.33, "elapsed_time": "3:07:57", "remaining_time": "1:31:12", "throughput": 2312.12, "total_tokens": 26075592} {"current_steps": 45210, "total_steps": 67140, "loss": 0.5174, "lr": 1.4564885032961112e-05, "epoch": 6.733690795352993, "percentage": 67.34, "elapsed_time": "3:07:58", "remaining_time": "1:31:11", "throughput": 2312.14, "total_tokens": 26078408} {"current_steps": 45215, "total_steps": 67140, "loss": 0.5251, "lr": 1.455897975220707e-05, "epoch": 6.734435507893953, "percentage": 67.34, "elapsed_time": "3:08:00", "remaining_time": "1:31:09", "throughput": 2312.16, "total_tokens": 26081288} {"current_steps": 45220, "total_steps": 67140, "loss": 0.506, "lr": 1.4553075177014736e-05, "epoch": 6.735180220434912, "percentage": 67.35, "elapsed_time": "3:08:01", "remaining_time": "1:31:08", "throughput": 2312.2, "total_tokens": 26084424} {"current_steps": 45225, "total_steps": 67140, "loss": 0.6575, "lr": 1.4547171307783097e-05, "epoch": 6.7359249329758715, "percentage": 67.36, "elapsed_time": "3:08:02", "remaining_time": "1:31:07", "throughput": 2312.24, "total_tokens": 26087624} {"current_steps": 45230, "total_steps": 67140, "loss": 0.5919, "lr": 1.4541268144911135e-05, "epoch": 6.73666964551683, "percentage": 67.37, "elapsed_time": "3:08:03", "remaining_time": "1:31:05", "throughput": 2312.26, "total_tokens": 26090536} {"current_steps": 45235, "total_steps": 67140, "loss": 0.4633, "lr": 1.4535365688797735e-05, "epoch": 6.73741435805779, "percentage": 67.37, "elapsed_time": "3:08:04", "remaining_time": "1:31:04", "throughput": 2312.27, "total_tokens": 26093032} {"current_steps": 45240, "total_steps": 67140, "loss": 0.5477, "lr": 1.452946393984178e-05, "epoch": 6.738159070598749, "percentage": 67.38, "elapsed_time": "3:08:05", "remaining_time": "1:31:03", "throughput": 2312.28, "total_tokens": 26095784} {"current_steps": 45245, "total_steps": 67140, "loss": 0.5556, "lr": 1.4523562898442084e-05, "epoch": 6.738903783139708, "percentage": 67.39, "elapsed_time": "3:08:06", "remaining_time": "1:31:01", "throughput": 2312.33, "total_tokens": 26099144} {"current_steps": 45250, "total_steps": 67140, "loss": 0.3417, "lr": 1.451766256499741e-05, "epoch": 6.739648495680667, "percentage": 67.4, "elapsed_time": "3:08:08", "remaining_time": "1:31:00", "throughput": 2312.34, "total_tokens": 26101736} {"current_steps": 45255, "total_steps": 67140, "loss": 0.541, "lr": 1.4511762939906481e-05, "epoch": 6.740393208221627, "percentage": 67.4, "elapsed_time": "3:08:09", "remaining_time": "1:30:59", "throughput": 2312.36, "total_tokens": 26104584} {"current_steps": 45260, "total_steps": 67140, "loss": 0.5615, "lr": 1.4505864023567983e-05, "epoch": 6.7411379207625854, "percentage": 67.41, "elapsed_time": "3:08:10", "remaining_time": "1:30:58", "throughput": 2312.38, "total_tokens": 26107464} {"current_steps": 45265, "total_steps": 67140, "loss": 0.5876, "lr": 1.4499965816380525e-05, "epoch": 6.741882633303545, "percentage": 67.42, "elapsed_time": "3:08:11", "remaining_time": "1:30:56", "throughput": 2312.39, "total_tokens": 26110088} {"current_steps": 45270, "total_steps": 67140, "loss": 0.4781, "lr": 1.4494068318742679e-05, "epoch": 6.742627345844504, "percentage": 67.43, "elapsed_time": "3:08:12", "remaining_time": "1:30:55", "throughput": 2312.41, "total_tokens": 26112936} {"current_steps": 45275, "total_steps": 67140, "loss": 0.406, "lr": 1.4488171531052982e-05, "epoch": 6.7433720583854635, "percentage": 67.43, "elapsed_time": "3:08:13", "remaining_time": "1:30:54", "throughput": 2312.43, "total_tokens": 26115784} {"current_steps": 45280, "total_steps": 67140, "loss": 0.7703, "lr": 1.4482275453709915e-05, "epoch": 6.744116770926422, "percentage": 67.44, "elapsed_time": "3:08:14", "remaining_time": "1:30:52", "throughput": 2312.46, "total_tokens": 26118760} {"current_steps": 45285, "total_steps": 67140, "loss": 0.6735, "lr": 1.447638008711191e-05, "epoch": 6.744861483467382, "percentage": 67.45, "elapsed_time": "3:08:15", "remaining_time": "1:30:51", "throughput": 2312.47, "total_tokens": 26121448} {"current_steps": 45290, "total_steps": 67140, "loss": 0.6774, "lr": 1.4470485431657355e-05, "epoch": 6.745606196008341, "percentage": 67.46, "elapsed_time": "3:08:17", "remaining_time": "1:30:50", "throughput": 2312.48, "total_tokens": 26124200} {"current_steps": 45295, "total_steps": 67140, "loss": 0.5979, "lr": 1.446459148774459e-05, "epoch": 6.7463509085493, "percentage": 67.46, "elapsed_time": "3:08:18", "remaining_time": "1:30:48", "throughput": 2312.5, "total_tokens": 26127048} {"current_steps": 45300, "total_steps": 67140, "loss": 0.5137, "lr": 1.4458698255771902e-05, "epoch": 6.747095621090259, "percentage": 67.47, "elapsed_time": "3:08:19", "remaining_time": "1:30:47", "throughput": 2312.53, "total_tokens": 26129960} {"current_steps": 45305, "total_steps": 67140, "loss": 0.4594, "lr": 1.445280573613752e-05, "epoch": 6.747840333631219, "percentage": 67.48, "elapsed_time": "3:08:20", "remaining_time": "1:30:46", "throughput": 2312.55, "total_tokens": 26132840} {"current_steps": 45310, "total_steps": 67140, "loss": 0.8082, "lr": 1.4446913929239642e-05, "epoch": 6.7485850461721775, "percentage": 67.49, "elapsed_time": "3:08:21", "remaining_time": "1:30:45", "throughput": 2312.57, "total_tokens": 26135656} {"current_steps": 45315, "total_steps": 67140, "loss": 0.7057, "lr": 1.4441022835476414e-05, "epoch": 6.749329758713137, "percentage": 67.49, "elapsed_time": "3:08:22", "remaining_time": "1:30:43", "throughput": 2312.6, "total_tokens": 26138728} {"current_steps": 45320, "total_steps": 67140, "loss": 0.7136, "lr": 1.4435132455245934e-05, "epoch": 6.750074471254096, "percentage": 67.5, "elapsed_time": "3:08:23", "remaining_time": "1:30:42", "throughput": 2312.65, "total_tokens": 26142120} {"current_steps": 45325, "total_steps": 67140, "loss": 0.7025, "lr": 1.4429242788946259e-05, "epoch": 6.7508191837950555, "percentage": 67.51, "elapsed_time": "3:08:25", "remaining_time": "1:30:41", "throughput": 2312.68, "total_tokens": 26145032} {"current_steps": 45330, "total_steps": 67140, "loss": 0.9155, "lr": 1.442335383697537e-05, "epoch": 6.751563896336014, "percentage": 67.52, "elapsed_time": "3:08:26", "remaining_time": "1:30:39", "throughput": 2312.71, "total_tokens": 26148008} {"current_steps": 45335, "total_steps": 67140, "loss": 0.529, "lr": 1.4417465599731226e-05, "epoch": 6.752308608876973, "percentage": 67.52, "elapsed_time": "3:08:27", "remaining_time": "1:30:38", "throughput": 2312.73, "total_tokens": 26150888} {"current_steps": 45340, "total_steps": 67140, "loss": 0.6141, "lr": 1.4411578077611743e-05, "epoch": 6.753053321417933, "percentage": 67.53, "elapsed_time": "3:08:28", "remaining_time": "1:30:37", "throughput": 2312.76, "total_tokens": 26153896} {"current_steps": 45345, "total_steps": 67140, "loss": 0.6911, "lr": 1.4405691271014751e-05, "epoch": 6.753798033958892, "percentage": 67.54, "elapsed_time": "3:08:29", "remaining_time": "1:30:35", "throughput": 2312.78, "total_tokens": 26156840} {"current_steps": 45350, "total_steps": 67140, "loss": 0.546, "lr": 1.4399805180338072e-05, "epoch": 6.754542746499851, "percentage": 67.55, "elapsed_time": "3:08:30", "remaining_time": "1:30:34", "throughput": 2312.81, "total_tokens": 26159816} {"current_steps": 45355, "total_steps": 67140, "loss": 0.5158, "lr": 1.439391980597946e-05, "epoch": 6.75528745904081, "percentage": 67.55, "elapsed_time": "3:08:31", "remaining_time": "1:30:33", "throughput": 2312.84, "total_tokens": 26162792} {"current_steps": 45360, "total_steps": 67140, "loss": 0.6051, "lr": 1.4388035148336637e-05, "epoch": 6.7560321715817695, "percentage": 67.56, "elapsed_time": "3:08:33", "remaining_time": "1:30:32", "throughput": 2312.87, "total_tokens": 26165832} {"current_steps": 45365, "total_steps": 67140, "loss": 0.5055, "lr": 1.4382151207807243e-05, "epoch": 6.756776884122728, "percentage": 67.57, "elapsed_time": "3:08:34", "remaining_time": "1:30:30", "throughput": 2312.9, "total_tokens": 26168744} {"current_steps": 45370, "total_steps": 67140, "loss": 0.6622, "lr": 1.4376267984788902e-05, "epoch": 6.757521596663688, "percentage": 67.58, "elapsed_time": "3:08:35", "remaining_time": "1:30:29", "throughput": 2312.92, "total_tokens": 26171560} {"current_steps": 45375, "total_steps": 67140, "loss": 0.4928, "lr": 1.4370385479679177e-05, "epoch": 6.758266309204647, "percentage": 67.58, "elapsed_time": "3:08:36", "remaining_time": "1:30:28", "throughput": 2312.95, "total_tokens": 26174472} {"current_steps": 45380, "total_steps": 67140, "loss": 0.5708, "lr": 1.4364503692875598e-05, "epoch": 6.759011021745606, "percentage": 67.59, "elapsed_time": "3:08:37", "remaining_time": "1:30:26", "throughput": 2312.97, "total_tokens": 26177352} {"current_steps": 45385, "total_steps": 67140, "loss": 0.5612, "lr": 1.4358622624775603e-05, "epoch": 6.759755734286565, "percentage": 67.6, "elapsed_time": "3:08:38", "remaining_time": "1:30:25", "throughput": 2312.99, "total_tokens": 26180136} {"current_steps": 45390, "total_steps": 67140, "loss": 0.6383, "lr": 1.4352742275776632e-05, "epoch": 6.760500446827525, "percentage": 67.61, "elapsed_time": "3:08:39", "remaining_time": "1:30:24", "throughput": 2313.0, "total_tokens": 26182920} {"current_steps": 45395, "total_steps": 67140, "loss": 0.8482, "lr": 1.4346862646276055e-05, "epoch": 6.7612451593684835, "percentage": 67.61, "elapsed_time": "3:08:41", "remaining_time": "1:30:22", "throughput": 2313.03, "total_tokens": 26185832} {"current_steps": 45400, "total_steps": 67140, "loss": 0.4521, "lr": 1.4340983736671179e-05, "epoch": 6.761989871909443, "percentage": 67.62, "elapsed_time": "3:08:42", "remaining_time": "1:30:21", "throughput": 2313.04, "total_tokens": 26188520} {"current_steps": 45405, "total_steps": 67140, "loss": 0.6487, "lr": 1.4335105547359287e-05, "epoch": 6.762734584450402, "percentage": 67.63, "elapsed_time": "3:08:43", "remaining_time": "1:30:20", "throughput": 2313.05, "total_tokens": 26191272} {"current_steps": 45410, "total_steps": 67140, "loss": 0.5418, "lr": 1.43292280787376e-05, "epoch": 6.7634792969913615, "percentage": 67.63, "elapsed_time": "3:08:44", "remaining_time": "1:30:19", "throughput": 2313.07, "total_tokens": 26194152} {"current_steps": 45415, "total_steps": 67140, "loss": 0.5603, "lr": 1.4323351331203296e-05, "epoch": 6.76422400953232, "percentage": 67.64, "elapsed_time": "3:08:45", "remaining_time": "1:30:17", "throughput": 2313.08, "total_tokens": 26196680} {"current_steps": 45420, "total_steps": 67140, "loss": 0.6323, "lr": 1.431747530515351e-05, "epoch": 6.76496872207328, "percentage": 67.65, "elapsed_time": "3:08:46", "remaining_time": "1:30:16", "throughput": 2313.1, "total_tokens": 26199688} {"current_steps": 45425, "total_steps": 67140, "loss": 0.5212, "lr": 1.4311600000985303e-05, "epoch": 6.765713434614239, "percentage": 67.66, "elapsed_time": "3:08:47", "remaining_time": "1:30:15", "throughput": 2313.13, "total_tokens": 26202568} {"current_steps": 45430, "total_steps": 67140, "loss": 0.6074, "lr": 1.4305725419095722e-05, "epoch": 6.766458147155198, "percentage": 67.66, "elapsed_time": "3:08:48", "remaining_time": "1:30:13", "throughput": 2313.16, "total_tokens": 26205736} {"current_steps": 45435, "total_steps": 67140, "loss": 0.5997, "lr": 1.4299851559881727e-05, "epoch": 6.767202859696157, "percentage": 67.67, "elapsed_time": "3:08:50", "remaining_time": "1:30:12", "throughput": 2313.19, "total_tokens": 26208712} {"current_steps": 45440, "total_steps": 67140, "loss": 0.6795, "lr": 1.4293978423740259e-05, "epoch": 6.767947572237117, "percentage": 67.68, "elapsed_time": "3:08:51", "remaining_time": "1:30:11", "throughput": 2313.21, "total_tokens": 26211592} {"current_steps": 45445, "total_steps": 67140, "loss": 0.6778, "lr": 1.4288106011068203e-05, "epoch": 6.7686922847780755, "percentage": 67.69, "elapsed_time": "3:08:52", "remaining_time": "1:30:09", "throughput": 2313.23, "total_tokens": 26214504} {"current_steps": 45450, "total_steps": 67140, "loss": 0.4593, "lr": 1.4282234322262389e-05, "epoch": 6.769436997319035, "percentage": 67.69, "elapsed_time": "3:08:53", "remaining_time": "1:30:08", "throughput": 2313.25, "total_tokens": 26217352} {"current_steps": 45455, "total_steps": 67140, "loss": 0.7084, "lr": 1.4276363357719605e-05, "epoch": 6.770181709859994, "percentage": 67.7, "elapsed_time": "3:08:54", "remaining_time": "1:30:07", "throughput": 2313.28, "total_tokens": 26220296} {"current_steps": 45460, "total_steps": 67140, "loss": 0.496, "lr": 1.4270493117836597e-05, "epoch": 6.7709264224009535, "percentage": 67.71, "elapsed_time": "3:08:55", "remaining_time": "1:30:06", "throughput": 2313.28, "total_tokens": 26222824} {"current_steps": 45465, "total_steps": 67140, "loss": 0.5693, "lr": 1.4264623603010042e-05, "epoch": 6.771671134941912, "percentage": 67.72, "elapsed_time": "3:08:56", "remaining_time": "1:30:04", "throughput": 2313.29, "total_tokens": 26225512} {"current_steps": 45470, "total_steps": 67140, "loss": 0.6813, "lr": 1.4258754813636565e-05, "epoch": 6.772415847482872, "percentage": 67.72, "elapsed_time": "3:08:58", "remaining_time": "1:30:03", "throughput": 2313.31, "total_tokens": 26228296} {"current_steps": 45475, "total_steps": 67140, "loss": 0.7115, "lr": 1.4252886750112768e-05, "epoch": 6.773160560023831, "percentage": 67.73, "elapsed_time": "3:08:59", "remaining_time": "1:30:02", "throughput": 2313.33, "total_tokens": 26231144} {"current_steps": 45480, "total_steps": 67140, "loss": 0.6813, "lr": 1.4247019412835188e-05, "epoch": 6.77390527256479, "percentage": 67.74, "elapsed_time": "3:09:00", "remaining_time": "1:30:00", "throughput": 2313.34, "total_tokens": 26233960} {"current_steps": 45485, "total_steps": 67140, "loss": 0.6697, "lr": 1.4241152802200319e-05, "epoch": 6.774649985105749, "percentage": 67.75, "elapsed_time": "3:09:01", "remaining_time": "1:29:59", "throughput": 2313.35, "total_tokens": 26236584} {"current_steps": 45490, "total_steps": 67140, "loss": 0.552, "lr": 1.4235286918604613e-05, "epoch": 6.775394697646709, "percentage": 67.75, "elapsed_time": "3:09:02", "remaining_time": "1:29:58", "throughput": 2313.37, "total_tokens": 26239400} {"current_steps": 45495, "total_steps": 67140, "loss": 0.5875, "lr": 1.422942176244444e-05, "epoch": 6.7761394101876675, "percentage": 67.76, "elapsed_time": "3:09:03", "remaining_time": "1:29:56", "throughput": 2313.39, "total_tokens": 26242184} {"current_steps": 45500, "total_steps": 67140, "loss": 0.594, "lr": 1.4223557334116167e-05, "epoch": 6.776884122728626, "percentage": 67.77, "elapsed_time": "3:09:04", "remaining_time": "1:29:55", "throughput": 2313.39, "total_tokens": 26244808} {"current_steps": 45505, "total_steps": 67140, "loss": 0.3899, "lr": 1.421769363401606e-05, "epoch": 6.777628835269586, "percentage": 67.78, "elapsed_time": "3:09:05", "remaining_time": "1:29:54", "throughput": 2313.41, "total_tokens": 26247560} {"current_steps": 45510, "total_steps": 67140, "loss": 0.5836, "lr": 1.4211830662540381e-05, "epoch": 6.778373547810546, "percentage": 67.78, "elapsed_time": "3:09:06", "remaining_time": "1:29:52", "throughput": 2313.44, "total_tokens": 26250536} {"current_steps": 45515, "total_steps": 67140, "loss": 0.4864, "lr": 1.4205968420085324e-05, "epoch": 6.779118260351504, "percentage": 67.79, "elapsed_time": "3:09:08", "remaining_time": "1:29:51", "throughput": 2313.47, "total_tokens": 26253544} {"current_steps": 45520, "total_steps": 67140, "loss": 0.5157, "lr": 1.4200106907047039e-05, "epoch": 6.779862972892463, "percentage": 67.8, "elapsed_time": "3:09:09", "remaining_time": "1:29:50", "throughput": 2313.49, "total_tokens": 26256360} {"current_steps": 45525, "total_steps": 67140, "loss": 0.3536, "lr": 1.419424612382163e-05, "epoch": 6.780607685433423, "percentage": 67.81, "elapsed_time": "3:09:10", "remaining_time": "1:29:49", "throughput": 2313.51, "total_tokens": 26259272} {"current_steps": 45530, "total_steps": 67140, "loss": 0.7214, "lr": 1.418838607080512e-05, "epoch": 6.781352397974382, "percentage": 67.81, "elapsed_time": "3:09:11", "remaining_time": "1:29:47", "throughput": 2313.55, "total_tokens": 26262280} {"current_steps": 45535, "total_steps": 67140, "loss": 0.5546, "lr": 1.4182526748393526e-05, "epoch": 6.782097110515341, "percentage": 67.82, "elapsed_time": "3:09:12", "remaining_time": "1:29:46", "throughput": 2313.56, "total_tokens": 26264968} {"current_steps": 45540, "total_steps": 67140, "loss": 0.3291, "lr": 1.4176668156982798e-05, "epoch": 6.7828418230563, "percentage": 67.83, "elapsed_time": "3:09:13", "remaining_time": "1:29:45", "throughput": 2313.59, "total_tokens": 26268072} {"current_steps": 45545, "total_steps": 67140, "loss": 0.6888, "lr": 1.4170810296968834e-05, "epoch": 6.7835865355972595, "percentage": 67.84, "elapsed_time": "3:09:14", "remaining_time": "1:29:43", "throughput": 2313.61, "total_tokens": 26270920} {"current_steps": 45550, "total_steps": 67140, "loss": 0.8221, "lr": 1.4164953168747475e-05, "epoch": 6.784331248138218, "percentage": 67.84, "elapsed_time": "3:09:16", "remaining_time": "1:29:42", "throughput": 2313.64, "total_tokens": 26273800} {"current_steps": 45555, "total_steps": 67140, "loss": 0.6524, "lr": 1.4159096772714531e-05, "epoch": 6.785075960679178, "percentage": 67.85, "elapsed_time": "3:09:17", "remaining_time": "1:29:41", "throughput": 2313.66, "total_tokens": 26276712} {"current_steps": 45560, "total_steps": 67140, "loss": 0.5103, "lr": 1.4153241109265759e-05, "epoch": 6.785820673220137, "percentage": 67.86, "elapsed_time": "3:09:18", "remaining_time": "1:29:39", "throughput": 2313.67, "total_tokens": 26279400} {"current_steps": 45565, "total_steps": 67140, "loss": 0.7244, "lr": 1.414738617879684e-05, "epoch": 6.786565385761096, "percentage": 67.87, "elapsed_time": "3:09:19", "remaining_time": "1:29:38", "throughput": 2313.7, "total_tokens": 26282344} {"current_steps": 45570, "total_steps": 67140, "loss": 0.5741, "lr": 1.4141531981703444e-05, "epoch": 6.787310098302055, "percentage": 67.87, "elapsed_time": "3:09:20", "remaining_time": "1:29:37", "throughput": 2313.73, "total_tokens": 26285352} {"current_steps": 45575, "total_steps": 67140, "loss": 0.5916, "lr": 1.4135678518381168e-05, "epoch": 6.788054810843015, "percentage": 67.88, "elapsed_time": "3:09:21", "remaining_time": "1:29:36", "throughput": 2313.75, "total_tokens": 26288104} {"current_steps": 45580, "total_steps": 67140, "loss": 0.7692, "lr": 1.4129825789225564e-05, "epoch": 6.7887995233839735, "percentage": 67.89, "elapsed_time": "3:09:22", "remaining_time": "1:29:34", "throughput": 2313.76, "total_tokens": 26290824} {"current_steps": 45585, "total_steps": 67140, "loss": 0.717, "lr": 1.412397379463215e-05, "epoch": 6.789544235924933, "percentage": 67.9, "elapsed_time": "3:09:23", "remaining_time": "1:29:33", "throughput": 2313.79, "total_tokens": 26293832} {"current_steps": 45590, "total_steps": 67140, "loss": 0.5464, "lr": 1.4118122534996358e-05, "epoch": 6.790288948465892, "percentage": 67.9, "elapsed_time": "3:09:25", "remaining_time": "1:29:32", "throughput": 2313.82, "total_tokens": 26296872} {"current_steps": 45595, "total_steps": 67140, "loss": 0.4654, "lr": 1.4112272010713617e-05, "epoch": 6.791033661006852, "percentage": 67.91, "elapsed_time": "3:09:26", "remaining_time": "1:29:30", "throughput": 2313.85, "total_tokens": 26299784} {"current_steps": 45600, "total_steps": 67140, "loss": 0.5847, "lr": 1.4106422222179252e-05, "epoch": 6.79177837354781, "percentage": 67.92, "elapsed_time": "3:09:27", "remaining_time": "1:29:29", "throughput": 2313.85, "total_tokens": 26302440} {"current_steps": 45605, "total_steps": 67140, "loss": 0.6334, "lr": 1.4100573169788584e-05, "epoch": 6.79252308608877, "percentage": 67.93, "elapsed_time": "3:09:28", "remaining_time": "1:29:28", "throughput": 2313.86, "total_tokens": 26304968} {"current_steps": 45610, "total_steps": 67140, "loss": 0.5929, "lr": 1.4094724853936869e-05, "epoch": 6.793267798629729, "percentage": 67.93, "elapsed_time": "3:09:29", "remaining_time": "1:29:26", "throughput": 2313.87, "total_tokens": 26307784} {"current_steps": 45615, "total_steps": 67140, "loss": 0.6584, "lr": 1.4088877275019311e-05, "epoch": 6.794012511170688, "percentage": 67.94, "elapsed_time": "3:09:30", "remaining_time": "1:29:25", "throughput": 2313.9, "total_tokens": 26310728} {"current_steps": 45620, "total_steps": 67140, "loss": 0.3566, "lr": 1.4083030433431066e-05, "epoch": 6.794757223711647, "percentage": 67.95, "elapsed_time": "3:09:31", "remaining_time": "1:29:24", "throughput": 2313.91, "total_tokens": 26313448} {"current_steps": 45625, "total_steps": 67140, "loss": 0.6257, "lr": 1.4077184329567244e-05, "epoch": 6.795501936252607, "percentage": 67.96, "elapsed_time": "3:09:32", "remaining_time": "1:29:23", "throughput": 2313.93, "total_tokens": 26316296} {"current_steps": 45630, "total_steps": 67140, "loss": 0.481, "lr": 1.40713389638229e-05, "epoch": 6.7962466487935655, "percentage": 67.96, "elapsed_time": "3:09:34", "remaining_time": "1:29:21", "throughput": 2313.94, "total_tokens": 26318984} {"current_steps": 45635, "total_steps": 67140, "loss": 0.599, "lr": 1.4065494336593027e-05, "epoch": 6.796991361334525, "percentage": 67.97, "elapsed_time": "3:09:35", "remaining_time": "1:29:20", "throughput": 2313.98, "total_tokens": 26322088} {"current_steps": 45640, "total_steps": 67140, "loss": 0.6407, "lr": 1.4059650448272587e-05, "epoch": 6.797736073875484, "percentage": 67.98, "elapsed_time": "3:09:36", "remaining_time": "1:29:19", "throughput": 2314.01, "total_tokens": 26325000} {"current_steps": 45645, "total_steps": 67140, "loss": 0.4748, "lr": 1.4053807299256495e-05, "epoch": 6.798480786416444, "percentage": 67.98, "elapsed_time": "3:09:37", "remaining_time": "1:29:17", "throughput": 2314.03, "total_tokens": 26327912} {"current_steps": 45650, "total_steps": 67140, "loss": 0.7705, "lr": 1.4047964889939596e-05, "epoch": 6.799225498957402, "percentage": 67.99, "elapsed_time": "3:09:38", "remaining_time": "1:29:16", "throughput": 2314.04, "total_tokens": 26330536} {"current_steps": 45655, "total_steps": 67140, "loss": 0.4897, "lr": 1.4042123220716713e-05, "epoch": 6.799970211498362, "percentage": 68.0, "elapsed_time": "3:09:39", "remaining_time": "1:29:15", "throughput": 2314.07, "total_tokens": 26333544} {"current_steps": 45660, "total_steps": 67140, "loss": 0.4082, "lr": 1.4036282291982583e-05, "epoch": 6.800714924039321, "percentage": 68.01, "elapsed_time": "3:09:40", "remaining_time": "1:29:13", "throughput": 2314.08, "total_tokens": 26336328} {"current_steps": 45665, "total_steps": 67140, "loss": 0.4572, "lr": 1.403044210413193e-05, "epoch": 6.8014596365802795, "percentage": 68.01, "elapsed_time": "3:09:42", "remaining_time": "1:29:12", "throughput": 2314.1, "total_tokens": 26339144} {"current_steps": 45670, "total_steps": 67140, "loss": 0.3781, "lr": 1.4024602657559393e-05, "epoch": 6.802204349121239, "percentage": 68.02, "elapsed_time": "3:09:43", "remaining_time": "1:29:11", "throughput": 2314.13, "total_tokens": 26342184} {"current_steps": 45675, "total_steps": 67140, "loss": 0.7555, "lr": 1.4018763952659581e-05, "epoch": 6.802949061662199, "percentage": 68.03, "elapsed_time": "3:09:44", "remaining_time": "1:29:10", "throughput": 2314.16, "total_tokens": 26345256} {"current_steps": 45680, "total_steps": 67140, "loss": 0.7366, "lr": 1.4012925989827058e-05, "epoch": 6.803693774203158, "percentage": 68.04, "elapsed_time": "3:09:45", "remaining_time": "1:29:08", "throughput": 2314.18, "total_tokens": 26348072} {"current_steps": 45685, "total_steps": 67140, "loss": 0.7436, "lr": 1.4007088769456326e-05, "epoch": 6.804438486744116, "percentage": 68.04, "elapsed_time": "3:09:46", "remaining_time": "1:29:07", "throughput": 2314.21, "total_tokens": 26351144} {"current_steps": 45690, "total_steps": 67140, "loss": 0.654, "lr": 1.400125229194185e-05, "epoch": 6.805183199285076, "percentage": 68.05, "elapsed_time": "3:09:47", "remaining_time": "1:29:06", "throughput": 2314.23, "total_tokens": 26353960} {"current_steps": 45695, "total_steps": 67140, "loss": 0.6428, "lr": 1.3995416557678016e-05, "epoch": 6.805927911826036, "percentage": 68.06, "elapsed_time": "3:09:48", "remaining_time": "1:29:04", "throughput": 2314.24, "total_tokens": 26356712} {"current_steps": 45700, "total_steps": 67140, "loss": 0.6638, "lr": 1.398958156705919e-05, "epoch": 6.806672624366994, "percentage": 68.07, "elapsed_time": "3:09:50", "remaining_time": "1:29:03", "throughput": 2314.26, "total_tokens": 26359560} {"current_steps": 45705, "total_steps": 67140, "loss": 0.5283, "lr": 1.3983747320479688e-05, "epoch": 6.807417336907953, "percentage": 68.07, "elapsed_time": "3:09:51", "remaining_time": "1:29:02", "throughput": 2314.29, "total_tokens": 26362536} {"current_steps": 45710, "total_steps": 67140, "loss": 0.5933, "lr": 1.3977913818333744e-05, "epoch": 6.808162049448913, "percentage": 68.08, "elapsed_time": "3:09:52", "remaining_time": "1:29:01", "throughput": 2314.31, "total_tokens": 26365480} {"current_steps": 45715, "total_steps": 67140, "loss": 0.7487, "lr": 1.3972081061015569e-05, "epoch": 6.8089067619898715, "percentage": 68.09, "elapsed_time": "3:09:53", "remaining_time": "1:28:59", "throughput": 2314.34, "total_tokens": 26368456} {"current_steps": 45720, "total_steps": 67140, "loss": 0.7591, "lr": 1.396624904891932e-05, "epoch": 6.809651474530831, "percentage": 68.1, "elapsed_time": "3:09:54", "remaining_time": "1:28:58", "throughput": 2314.38, "total_tokens": 26371528} {"current_steps": 45725, "total_steps": 67140, "loss": 0.6056, "lr": 1.3960417782439112e-05, "epoch": 6.81039618707179, "percentage": 68.1, "elapsed_time": "3:09:55", "remaining_time": "1:28:57", "throughput": 2314.38, "total_tokens": 26374088} {"current_steps": 45730, "total_steps": 67140, "loss": 0.532, "lr": 1.3954587261968974e-05, "epoch": 6.81114089961275, "percentage": 68.11, "elapsed_time": "3:09:56", "remaining_time": "1:28:55", "throughput": 2314.4, "total_tokens": 26376936} {"current_steps": 45735, "total_steps": 67140, "loss": 0.5833, "lr": 1.3948757487902923e-05, "epoch": 6.811885612153708, "percentage": 68.12, "elapsed_time": "3:09:58", "remaining_time": "1:28:54", "throughput": 2314.42, "total_tokens": 26379752} {"current_steps": 45740, "total_steps": 67140, "loss": 0.3178, "lr": 1.3942928460634907e-05, "epoch": 6.812630324694668, "percentage": 68.13, "elapsed_time": "3:09:59", "remaining_time": "1:28:53", "throughput": 2314.45, "total_tokens": 26382920} {"current_steps": 45745, "total_steps": 67140, "loss": 0.7132, "lr": 1.3937100180558846e-05, "epoch": 6.813375037235627, "percentage": 68.13, "elapsed_time": "3:10:00", "remaining_time": "1:28:51", "throughput": 2314.49, "total_tokens": 26385960} {"current_steps": 45750, "total_steps": 67140, "loss": 0.6175, "lr": 1.3931272648068565e-05, "epoch": 6.814119749776586, "percentage": 68.14, "elapsed_time": "3:10:01", "remaining_time": "1:28:50", "throughput": 2314.5, "total_tokens": 26388744} {"current_steps": 45755, "total_steps": 67140, "loss": 0.4291, "lr": 1.3925445863557873e-05, "epoch": 6.814864462317545, "percentage": 68.15, "elapsed_time": "3:10:02", "remaining_time": "1:28:49", "throughput": 2314.52, "total_tokens": 26391592} {"current_steps": 45760, "total_steps": 67140, "loss": 0.6592, "lr": 1.3919619827420538e-05, "epoch": 6.815609174858505, "percentage": 68.16, "elapsed_time": "3:10:03", "remaining_time": "1:28:48", "throughput": 2314.55, "total_tokens": 26394504} {"current_steps": 45765, "total_steps": 67140, "loss": 0.6356, "lr": 1.3913794540050234e-05, "epoch": 6.816353887399464, "percentage": 68.16, "elapsed_time": "3:10:04", "remaining_time": "1:28:46", "throughput": 2314.56, "total_tokens": 26397256} {"current_steps": 45770, "total_steps": 67140, "loss": 0.5517, "lr": 1.390797000184062e-05, "epoch": 6.817098599940423, "percentage": 68.17, "elapsed_time": "3:10:05", "remaining_time": "1:28:45", "throughput": 2314.58, "total_tokens": 26400072} {"current_steps": 45775, "total_steps": 67140, "loss": 0.454, "lr": 1.3902146213185297e-05, "epoch": 6.817843312481382, "percentage": 68.18, "elapsed_time": "3:10:07", "remaining_time": "1:28:44", "throughput": 2314.6, "total_tokens": 26402920} {"current_steps": 45780, "total_steps": 67140, "loss": 0.6237, "lr": 1.3896323174477815e-05, "epoch": 6.818588025022342, "percentage": 68.19, "elapsed_time": "3:10:08", "remaining_time": "1:28:42", "throughput": 2314.64, "total_tokens": 26406056} {"current_steps": 45785, "total_steps": 67140, "loss": 0.7759, "lr": 1.3890500886111673e-05, "epoch": 6.8193327375633, "percentage": 68.19, "elapsed_time": "3:10:09", "remaining_time": "1:28:41", "throughput": 2314.68, "total_tokens": 26409224} {"current_steps": 45790, "total_steps": 67140, "loss": 0.6335, "lr": 1.3884679348480309e-05, "epoch": 6.82007745010426, "percentage": 68.2, "elapsed_time": "3:10:10", "remaining_time": "1:28:40", "throughput": 2314.69, "total_tokens": 26411912} {"current_steps": 45795, "total_steps": 67140, "loss": 0.4884, "lr": 1.3878858561977131e-05, "epoch": 6.820822162645219, "percentage": 68.21, "elapsed_time": "3:10:11", "remaining_time": "1:28:38", "throughput": 2314.72, "total_tokens": 26414920} {"current_steps": 45800, "total_steps": 67140, "loss": 0.6075, "lr": 1.3873038526995466e-05, "epoch": 6.821566875186178, "percentage": 68.22, "elapsed_time": "3:10:12", "remaining_time": "1:28:37", "throughput": 2314.74, "total_tokens": 26417768} {"current_steps": 45805, "total_steps": 67140, "loss": 0.721, "lr": 1.386721924392862e-05, "epoch": 6.822311587727137, "percentage": 68.22, "elapsed_time": "3:10:14", "remaining_time": "1:28:36", "throughput": 2314.76, "total_tokens": 26420744} {"current_steps": 45810, "total_steps": 67140, "loss": 0.5317, "lr": 1.3861400713169831e-05, "epoch": 6.823056300268097, "percentage": 68.23, "elapsed_time": "3:10:15", "remaining_time": "1:28:35", "throughput": 2314.78, "total_tokens": 26423560} {"current_steps": 45815, "total_steps": 67140, "loss": 0.541, "lr": 1.38555829351123e-05, "epoch": 6.823801012809056, "percentage": 68.24, "elapsed_time": "3:10:16", "remaining_time": "1:28:33", "throughput": 2314.8, "total_tokens": 26426440} {"current_steps": 45820, "total_steps": 67140, "loss": 0.5882, "lr": 1.384976591014917e-05, "epoch": 6.824545725350015, "percentage": 68.25, "elapsed_time": "3:10:17", "remaining_time": "1:28:32", "throughput": 2314.83, "total_tokens": 26429416} {"current_steps": 45825, "total_steps": 67140, "loss": 0.5141, "lr": 1.384394963867352e-05, "epoch": 6.825290437890974, "percentage": 68.25, "elapsed_time": "3:10:18", "remaining_time": "1:28:31", "throughput": 2314.84, "total_tokens": 26432104} {"current_steps": 45830, "total_steps": 67140, "loss": 0.705, "lr": 1.3838134121078403e-05, "epoch": 6.826035150431934, "percentage": 68.26, "elapsed_time": "3:10:19", "remaining_time": "1:28:29", "throughput": 2314.87, "total_tokens": 26435048} {"current_steps": 45835, "total_steps": 67140, "loss": 0.6559, "lr": 1.3832319357756793e-05, "epoch": 6.826779862972892, "percentage": 68.27, "elapsed_time": "3:10:20", "remaining_time": "1:28:28", "throughput": 2314.88, "total_tokens": 26437832} {"current_steps": 45840, "total_steps": 67140, "loss": 0.5797, "lr": 1.3826505349101637e-05, "epoch": 6.827524575513852, "percentage": 68.28, "elapsed_time": "3:10:21", "remaining_time": "1:28:27", "throughput": 2314.88, "total_tokens": 26440392} {"current_steps": 45845, "total_steps": 67140, "loss": 0.4622, "lr": 1.3820692095505819e-05, "epoch": 6.828269288054811, "percentage": 68.28, "elapsed_time": "3:10:23", "remaining_time": "1:28:25", "throughput": 2314.89, "total_tokens": 26443048} {"current_steps": 45850, "total_steps": 67140, "loss": 0.5235, "lr": 1.381487959736218e-05, "epoch": 6.82901400059577, "percentage": 68.29, "elapsed_time": "3:10:24", "remaining_time": "1:28:24", "throughput": 2314.93, "total_tokens": 26446120} {"current_steps": 45855, "total_steps": 67140, "loss": 0.5481, "lr": 1.3809067855063512e-05, "epoch": 6.829758713136729, "percentage": 68.3, "elapsed_time": "3:10:25", "remaining_time": "1:28:23", "throughput": 2314.96, "total_tokens": 26449128} {"current_steps": 45860, "total_steps": 67140, "loss": 0.6864, "lr": 1.3803256869002529e-05, "epoch": 6.830503425677689, "percentage": 68.31, "elapsed_time": "3:10:26", "remaining_time": "1:28:22", "throughput": 2315.0, "total_tokens": 26452264} {"current_steps": 45865, "total_steps": 67140, "loss": 0.5501, "lr": 1.379744663957193e-05, "epoch": 6.831248138218648, "percentage": 68.31, "elapsed_time": "3:10:27", "remaining_time": "1:28:20", "throughput": 2315.02, "total_tokens": 26455176} {"current_steps": 45870, "total_steps": 67140, "loss": 0.5699, "lr": 1.3791637167164337e-05, "epoch": 6.831992850759606, "percentage": 68.32, "elapsed_time": "3:10:28", "remaining_time": "1:28:19", "throughput": 2315.04, "total_tokens": 26457928} {"current_steps": 45875, "total_steps": 67140, "loss": 0.57, "lr": 1.3785828452172333e-05, "epoch": 6.832737563300566, "percentage": 68.33, "elapsed_time": "3:10:30", "remaining_time": "1:28:18", "throughput": 2315.14, "total_tokens": 26462472} {"current_steps": 45880, "total_steps": 67140, "loss": 0.5156, "lr": 1.3780020494988446e-05, "epoch": 6.833482275841525, "percentage": 68.33, "elapsed_time": "3:10:31", "remaining_time": "1:28:17", "throughput": 2315.16, "total_tokens": 26465224} {"current_steps": 45885, "total_steps": 67140, "loss": 0.4934, "lr": 1.3774213296005159e-05, "epoch": 6.834226988382484, "percentage": 68.34, "elapsed_time": "3:10:32", "remaining_time": "1:28:15", "throughput": 2315.17, "total_tokens": 26467976} {"current_steps": 45890, "total_steps": 67140, "loss": 0.534, "lr": 1.3768406855614907e-05, "epoch": 6.834971700923443, "percentage": 68.35, "elapsed_time": "3:10:33", "remaining_time": "1:28:14", "throughput": 2315.19, "total_tokens": 26470888} {"current_steps": 45895, "total_steps": 67140, "loss": 0.5989, "lr": 1.3762601174210044e-05, "epoch": 6.835716413464403, "percentage": 68.36, "elapsed_time": "3:10:34", "remaining_time": "1:28:13", "throughput": 2315.22, "total_tokens": 26473864} {"current_steps": 45900, "total_steps": 67140, "loss": 0.5086, "lr": 1.3756796252182907e-05, "epoch": 6.836461126005362, "percentage": 68.36, "elapsed_time": "3:10:35", "remaining_time": "1:28:11", "throughput": 2315.24, "total_tokens": 26476648} {"current_steps": 45905, "total_steps": 67140, "loss": 0.5889, "lr": 1.3750992089925777e-05, "epoch": 6.837205838546321, "percentage": 68.37, "elapsed_time": "3:10:36", "remaining_time": "1:28:10", "throughput": 2315.25, "total_tokens": 26479336} {"current_steps": 45910, "total_steps": 67140, "loss": 0.6198, "lr": 1.3745188687830857e-05, "epoch": 6.83795055108728, "percentage": 68.38, "elapsed_time": "3:10:38", "remaining_time": "1:28:09", "throughput": 2315.27, "total_tokens": 26482120} {"current_steps": 45915, "total_steps": 67140, "loss": 0.4393, "lr": 1.3739386046290326e-05, "epoch": 6.83869526362824, "percentage": 68.39, "elapsed_time": "3:10:39", "remaining_time": "1:28:07", "throughput": 2315.29, "total_tokens": 26485064} {"current_steps": 45920, "total_steps": 67140, "loss": 0.4275, "lr": 1.3733584165696304e-05, "epoch": 6.839439976169198, "percentage": 68.39, "elapsed_time": "3:10:40", "remaining_time": "1:28:06", "throughput": 2315.31, "total_tokens": 26487848} {"current_steps": 45925, "total_steps": 67140, "loss": 0.7668, "lr": 1.3727783046440868e-05, "epoch": 6.840184688710158, "percentage": 68.4, "elapsed_time": "3:10:41", "remaining_time": "1:28:05", "throughput": 2315.35, "total_tokens": 26491048} {"current_steps": 45930, "total_steps": 67140, "loss": 0.7359, "lr": 1.3721982688916014e-05, "epoch": 6.840929401251117, "percentage": 68.41, "elapsed_time": "3:10:42", "remaining_time": "1:28:04", "throughput": 2315.35, "total_tokens": 26493640} {"current_steps": 45935, "total_steps": 67140, "loss": 0.5846, "lr": 1.3716183093513717e-05, "epoch": 6.8416741137920765, "percentage": 68.42, "elapsed_time": "3:10:43", "remaining_time": "1:28:02", "throughput": 2315.37, "total_tokens": 26496488} {"current_steps": 45940, "total_steps": 67140, "loss": 0.6366, "lr": 1.3710384260625891e-05, "epoch": 6.842418826333035, "percentage": 68.42, "elapsed_time": "3:10:44", "remaining_time": "1:28:01", "throughput": 2315.42, "total_tokens": 26499720} {"current_steps": 45945, "total_steps": 67140, "loss": 0.7178, "lr": 1.3704586190644405e-05, "epoch": 6.843163538873995, "percentage": 68.43, "elapsed_time": "3:10:46", "remaining_time": "1:28:00", "throughput": 2315.44, "total_tokens": 26502632} {"current_steps": 45950, "total_steps": 67140, "loss": 0.5982, "lr": 1.369878888396105e-05, "epoch": 6.843908251414954, "percentage": 68.44, "elapsed_time": "3:10:47", "remaining_time": "1:27:58", "throughput": 2315.47, "total_tokens": 26505576} {"current_steps": 45955, "total_steps": 67140, "loss": 0.6457, "lr": 1.3692992340967598e-05, "epoch": 6.844652963955913, "percentage": 68.45, "elapsed_time": "3:10:48", "remaining_time": "1:27:57", "throughput": 2315.48, "total_tokens": 26508264} {"current_steps": 45960, "total_steps": 67140, "loss": 0.4963, "lr": 1.368719656205576e-05, "epoch": 6.845397676496872, "percentage": 68.45, "elapsed_time": "3:10:49", "remaining_time": "1:27:56", "throughput": 2315.5, "total_tokens": 26511144} {"current_steps": 45965, "total_steps": 67140, "loss": 0.5715, "lr": 1.3681401547617173e-05, "epoch": 6.846142389037832, "percentage": 68.46, "elapsed_time": "3:10:50", "remaining_time": "1:27:54", "throughput": 2315.51, "total_tokens": 26513864} {"current_steps": 45970, "total_steps": 67140, "loss": 0.6772, "lr": 1.3675607298043453e-05, "epoch": 6.84688710157879, "percentage": 68.47, "elapsed_time": "3:10:51", "remaining_time": "1:27:53", "throughput": 2315.53, "total_tokens": 26516744} {"current_steps": 45975, "total_steps": 67140, "loss": 0.4262, "lr": 1.3669813813726151e-05, "epoch": 6.84763181411975, "percentage": 68.48, "elapsed_time": "3:10:52", "remaining_time": "1:27:52", "throughput": 2315.56, "total_tokens": 26519688} {"current_steps": 45980, "total_steps": 67140, "loss": 0.5848, "lr": 1.3664021095056764e-05, "epoch": 6.848376526660709, "percentage": 68.48, "elapsed_time": "3:10:53", "remaining_time": "1:27:51", "throughput": 2315.58, "total_tokens": 26522504} {"current_steps": 45985, "total_steps": 67140, "loss": 0.7813, "lr": 1.3658229142426754e-05, "epoch": 6.8491212392016685, "percentage": 68.49, "elapsed_time": "3:10:55", "remaining_time": "1:27:49", "throughput": 2315.59, "total_tokens": 26525224} {"current_steps": 45990, "total_steps": 67140, "loss": 0.7313, "lr": 1.3652437956227496e-05, "epoch": 6.849865951742627, "percentage": 68.5, "elapsed_time": "3:10:56", "remaining_time": "1:27:48", "throughput": 2315.6, "total_tokens": 26527944} {"current_steps": 45995, "total_steps": 67140, "loss": 0.5284, "lr": 1.3646647536850354e-05, "epoch": 6.850610664283587, "percentage": 68.51, "elapsed_time": "3:10:57", "remaining_time": "1:27:47", "throughput": 2315.62, "total_tokens": 26530728} {"current_steps": 46000, "total_steps": 67140, "loss": 0.538, "lr": 1.3640857884686603e-05, "epoch": 6.851355376824546, "percentage": 68.51, "elapsed_time": "3:10:58", "remaining_time": "1:27:45", "throughput": 2315.63, "total_tokens": 26533416} {"current_steps": 46005, "total_steps": 67140, "loss": 0.5625, "lr": 1.3635069000127493e-05, "epoch": 6.852100089365505, "percentage": 68.52, "elapsed_time": "3:10:59", "remaining_time": "1:27:44", "throughput": 2315.66, "total_tokens": 26536488} {"current_steps": 46010, "total_steps": 67140, "loss": 0.7953, "lr": 1.3629280883564217e-05, "epoch": 6.852844801906464, "percentage": 68.53, "elapsed_time": "3:11:00", "remaining_time": "1:27:43", "throughput": 2315.67, "total_tokens": 26539144} {"current_steps": 46015, "total_steps": 67140, "loss": 0.5057, "lr": 1.3623493535387905e-05, "epoch": 6.853589514447423, "percentage": 68.54, "elapsed_time": "3:11:01", "remaining_time": "1:27:42", "throughput": 2315.69, "total_tokens": 26541992} {"current_steps": 46020, "total_steps": 67140, "loss": 0.5761, "lr": 1.3617706955989656e-05, "epoch": 6.8543342269883825, "percentage": 68.54, "elapsed_time": "3:11:02", "remaining_time": "1:27:40", "throughput": 2315.71, "total_tokens": 26544840} {"current_steps": 46025, "total_steps": 67140, "loss": 0.6235, "lr": 1.3611921145760487e-05, "epoch": 6.855078939529342, "percentage": 68.55, "elapsed_time": "3:11:04", "remaining_time": "1:27:39", "throughput": 2315.75, "total_tokens": 26548040} {"current_steps": 46030, "total_steps": 67140, "loss": 0.5475, "lr": 1.3606136105091393e-05, "epoch": 6.855823652070301, "percentage": 68.56, "elapsed_time": "3:11:05", "remaining_time": "1:27:38", "throughput": 2315.77, "total_tokens": 26550888} {"current_steps": 46035, "total_steps": 67140, "loss": 0.5933, "lr": 1.3600351834373286e-05, "epoch": 6.85656836461126, "percentage": 68.57, "elapsed_time": "3:11:06", "remaining_time": "1:27:36", "throughput": 2315.78, "total_tokens": 26553608} {"current_steps": 46040, "total_steps": 67140, "loss": 0.638, "lr": 1.3594568333997059e-05, "epoch": 6.857313077152219, "percentage": 68.57, "elapsed_time": "3:11:07", "remaining_time": "1:27:35", "throughput": 2315.83, "total_tokens": 26556936} {"current_steps": 46045, "total_steps": 67140, "loss": 0.6177, "lr": 1.3588785604353532e-05, "epoch": 6.858057789693179, "percentage": 68.58, "elapsed_time": "3:11:08", "remaining_time": "1:27:34", "throughput": 2315.84, "total_tokens": 26559624} {"current_steps": 46050, "total_steps": 67140, "loss": 0.5373, "lr": 1.3583003645833478e-05, "epoch": 6.858802502234138, "percentage": 68.59, "elapsed_time": "3:11:09", "remaining_time": "1:27:32", "throughput": 2315.85, "total_tokens": 26562280} {"current_steps": 46055, "total_steps": 67140, "loss": 0.6985, "lr": 1.3577222458827628e-05, "epoch": 6.859547214775096, "percentage": 68.6, "elapsed_time": "3:11:10", "remaining_time": "1:27:31", "throughput": 2315.87, "total_tokens": 26565256} {"current_steps": 46060, "total_steps": 67140, "loss": 0.5617, "lr": 1.3571442043726634e-05, "epoch": 6.860291927316056, "percentage": 68.6, "elapsed_time": "3:11:12", "remaining_time": "1:27:30", "throughput": 2315.89, "total_tokens": 26568040} {"current_steps": 46065, "total_steps": 67140, "loss": 0.549, "lr": 1.356566240092113e-05, "epoch": 6.861036639857015, "percentage": 68.61, "elapsed_time": "3:11:13", "remaining_time": "1:27:29", "throughput": 2315.91, "total_tokens": 26570792} {"current_steps": 46070, "total_steps": 67140, "loss": 0.6676, "lr": 1.3559883530801667e-05, "epoch": 6.8617813523979745, "percentage": 68.62, "elapsed_time": "3:11:14", "remaining_time": "1:27:27", "throughput": 2315.93, "total_tokens": 26573640} {"current_steps": 46075, "total_steps": 67140, "loss": 0.6688, "lr": 1.355410543375876e-05, "epoch": 6.862526064938933, "percentage": 68.63, "elapsed_time": "3:11:15", "remaining_time": "1:27:26", "throughput": 2315.94, "total_tokens": 26576424} {"current_steps": 46080, "total_steps": 67140, "loss": 0.6336, "lr": 1.3548328110182873e-05, "epoch": 6.863270777479893, "percentage": 68.63, "elapsed_time": "3:11:16", "remaining_time": "1:27:25", "throughput": 2315.96, "total_tokens": 26579272} {"current_steps": 46085, "total_steps": 67140, "loss": 0.6311, "lr": 1.3542551560464412e-05, "epoch": 6.864015490020852, "percentage": 68.64, "elapsed_time": "3:11:17", "remaining_time": "1:27:23", "throughput": 2315.97, "total_tokens": 26581992} {"current_steps": 46090, "total_steps": 67140, "loss": 0.4884, "lr": 1.3536775784993744e-05, "epoch": 6.864760202561811, "percentage": 68.65, "elapsed_time": "3:11:18", "remaining_time": "1:27:22", "throughput": 2315.98, "total_tokens": 26584616} {"current_steps": 46095, "total_steps": 67140, "loss": 0.6588, "lr": 1.3531000784161152e-05, "epoch": 6.86550491510277, "percentage": 68.66, "elapsed_time": "3:11:19", "remaining_time": "1:27:21", "throughput": 2316.0, "total_tokens": 26587336} {"current_steps": 46100, "total_steps": 67140, "loss": 0.6148, "lr": 1.3525226558356895e-05, "epoch": 6.86624962764373, "percentage": 68.66, "elapsed_time": "3:11:21", "remaining_time": "1:27:19", "throughput": 2316.01, "total_tokens": 26590120} {"current_steps": 46105, "total_steps": 67140, "loss": 0.53, "lr": 1.3519453107971191e-05, "epoch": 6.8669943401846885, "percentage": 68.67, "elapsed_time": "3:11:22", "remaining_time": "1:27:18", "throughput": 2316.0, "total_tokens": 26592520} {"current_steps": 46110, "total_steps": 67140, "loss": 0.6369, "lr": 1.3513680433394154e-05, "epoch": 6.867739052725648, "percentage": 68.68, "elapsed_time": "3:11:23", "remaining_time": "1:27:17", "throughput": 2316.03, "total_tokens": 26595432} {"current_steps": 46115, "total_steps": 67140, "loss": 0.9019, "lr": 1.3507908535015895e-05, "epoch": 6.868483765266607, "percentage": 68.68, "elapsed_time": "3:11:24", "remaining_time": "1:27:16", "throughput": 2316.04, "total_tokens": 26598216} {"current_steps": 46120, "total_steps": 67140, "loss": 0.8099, "lr": 1.3502137413226453e-05, "epoch": 6.8692284778075665, "percentage": 68.69, "elapsed_time": "3:11:25", "remaining_time": "1:27:14", "throughput": 2316.05, "total_tokens": 26600904} {"current_steps": 46125, "total_steps": 67140, "loss": 0.5153, "lr": 1.349636706841583e-05, "epoch": 6.869973190348525, "percentage": 68.7, "elapsed_time": "3:11:26", "remaining_time": "1:27:13", "throughput": 2316.06, "total_tokens": 26603496} {"current_steps": 46130, "total_steps": 67140, "loss": 0.7207, "lr": 1.349059750097394e-05, "epoch": 6.870717902889485, "percentage": 68.71, "elapsed_time": "3:11:27", "remaining_time": "1:27:12", "throughput": 2316.08, "total_tokens": 26606440} {"current_steps": 46135, "total_steps": 67140, "loss": 0.5725, "lr": 1.3484828711290676e-05, "epoch": 6.871462615430444, "percentage": 68.71, "elapsed_time": "3:11:28", "remaining_time": "1:27:10", "throughput": 2316.11, "total_tokens": 26609320} {"current_steps": 46140, "total_steps": 67140, "loss": 0.6718, "lr": 1.347906069975587e-05, "epoch": 6.872207327971403, "percentage": 68.72, "elapsed_time": "3:11:29", "remaining_time": "1:27:09", "throughput": 2316.13, "total_tokens": 26612264} {"current_steps": 46145, "total_steps": 67140, "loss": 0.5753, "lr": 1.34732934667593e-05, "epoch": 6.872952040512362, "percentage": 68.73, "elapsed_time": "3:11:31", "remaining_time": "1:27:08", "throughput": 2316.16, "total_tokens": 26615208} {"current_steps": 46150, "total_steps": 67140, "loss": 0.6315, "lr": 1.3467527012690707e-05, "epoch": 6.873696753053322, "percentage": 68.74, "elapsed_time": "3:11:32", "remaining_time": "1:27:06", "throughput": 2316.17, "total_tokens": 26617992} {"current_steps": 46155, "total_steps": 67140, "loss": 0.4691, "lr": 1.3461761337939736e-05, "epoch": 6.8744414655942805, "percentage": 68.74, "elapsed_time": "3:11:33", "remaining_time": "1:27:05", "throughput": 2316.21, "total_tokens": 26621160} {"current_steps": 46160, "total_steps": 67140, "loss": 0.7333, "lr": 1.3455996442896036e-05, "epoch": 6.87518617813524, "percentage": 68.75, "elapsed_time": "3:11:34", "remaining_time": "1:27:04", "throughput": 2316.23, "total_tokens": 26623912} {"current_steps": 46165, "total_steps": 67140, "loss": 0.7393, "lr": 1.345023232794915e-05, "epoch": 6.875930890676199, "percentage": 68.76, "elapsed_time": "3:11:35", "remaining_time": "1:27:03", "throughput": 2316.24, "total_tokens": 26626536} {"current_steps": 46170, "total_steps": 67140, "loss": 0.6622, "lr": 1.3444468993488607e-05, "epoch": 6.8766756032171585, "percentage": 68.77, "elapsed_time": "3:11:36", "remaining_time": "1:27:01", "throughput": 2316.27, "total_tokens": 26629640} {"current_steps": 46175, "total_steps": 67140, "loss": 0.4422, "lr": 1.3438706439903866e-05, "epoch": 6.877420315758117, "percentage": 68.77, "elapsed_time": "3:11:37", "remaining_time": "1:27:00", "throughput": 2316.3, "total_tokens": 26632680} {"current_steps": 46180, "total_steps": 67140, "loss": 0.8051, "lr": 1.343294466758434e-05, "epoch": 6.878165028299077, "percentage": 68.78, "elapsed_time": "3:11:39", "remaining_time": "1:26:59", "throughput": 2316.31, "total_tokens": 26635368} {"current_steps": 46185, "total_steps": 67140, "loss": 0.8051, "lr": 1.3427183676919396e-05, "epoch": 6.878909740840036, "percentage": 68.79, "elapsed_time": "3:11:40", "remaining_time": "1:26:57", "throughput": 2316.33, "total_tokens": 26638248} {"current_steps": 46190, "total_steps": 67140, "loss": 0.6986, "lr": 1.3421423468298316e-05, "epoch": 6.879654453380995, "percentage": 68.8, "elapsed_time": "3:11:41", "remaining_time": "1:26:56", "throughput": 2316.34, "total_tokens": 26641032} {"current_steps": 46195, "total_steps": 67140, "loss": 0.4232, "lr": 1.3415664042110376e-05, "epoch": 6.880399165921954, "percentage": 68.8, "elapsed_time": "3:11:42", "remaining_time": "1:26:55", "throughput": 2316.37, "total_tokens": 26643944} {"current_steps": 46200, "total_steps": 67140, "loss": 0.5746, "lr": 1.3409905398744748e-05, "epoch": 6.881143878462913, "percentage": 68.81, "elapsed_time": "3:11:43", "remaining_time": "1:26:53", "throughput": 2316.38, "total_tokens": 26646696} {"current_steps": 46205, "total_steps": 67140, "loss": 0.463, "lr": 1.3404147538590595e-05, "epoch": 6.8818885910038725, "percentage": 68.82, "elapsed_time": "3:11:44", "remaining_time": "1:26:52", "throughput": 2316.41, "total_tokens": 26649640} {"current_steps": 46210, "total_steps": 67140, "loss": 0.8409, "lr": 1.3398390462037002e-05, "epoch": 6.882633303544832, "percentage": 68.83, "elapsed_time": "3:11:45", "remaining_time": "1:26:51", "throughput": 2316.43, "total_tokens": 26652456} {"current_steps": 46215, "total_steps": 67140, "loss": 0.6772, "lr": 1.3392634169473018e-05, "epoch": 6.883378016085791, "percentage": 68.83, "elapsed_time": "3:11:46", "remaining_time": "1:26:50", "throughput": 2316.44, "total_tokens": 26655176} {"current_steps": 46220, "total_steps": 67140, "loss": 0.7072, "lr": 1.338687866128763e-05, "epoch": 6.88412272862675, "percentage": 68.84, "elapsed_time": "3:11:48", "remaining_time": "1:26:48", "throughput": 2316.46, "total_tokens": 26658088} {"current_steps": 46225, "total_steps": 67140, "loss": 0.5968, "lr": 1.3381123937869758e-05, "epoch": 6.884867441167709, "percentage": 68.85, "elapsed_time": "3:11:49", "remaining_time": "1:26:47", "throughput": 2316.49, "total_tokens": 26660936} {"current_steps": 46230, "total_steps": 67140, "loss": 0.6089, "lr": 1.33753699996083e-05, "epoch": 6.885612153708668, "percentage": 68.86, "elapsed_time": "3:11:50", "remaining_time": "1:26:46", "throughput": 2316.5, "total_tokens": 26663656} {"current_steps": 46235, "total_steps": 67140, "loss": 0.771, "lr": 1.3369616846892069e-05, "epoch": 6.886356866249628, "percentage": 68.86, "elapsed_time": "3:11:51", "remaining_time": "1:26:44", "throughput": 2316.52, "total_tokens": 26666568} {"current_steps": 46240, "total_steps": 67140, "loss": 0.5645, "lr": 1.3363864480109842e-05, "epoch": 6.8871015787905865, "percentage": 68.87, "elapsed_time": "3:11:52", "remaining_time": "1:26:43", "throughput": 2316.55, "total_tokens": 26669672} {"current_steps": 46245, "total_steps": 67140, "loss": 0.676, "lr": 1.3358112899650345e-05, "epoch": 6.887846291331546, "percentage": 68.88, "elapsed_time": "3:11:53", "remaining_time": "1:26:42", "throughput": 2316.58, "total_tokens": 26672648} {"current_steps": 46250, "total_steps": 67140, "loss": 0.6482, "lr": 1.3352362105902246e-05, "epoch": 6.888591003872505, "percentage": 68.89, "elapsed_time": "3:11:54", "remaining_time": "1:26:41", "throughput": 2316.61, "total_tokens": 26675656} {"current_steps": 46255, "total_steps": 67140, "loss": 0.6119, "lr": 1.3346612099254172e-05, "epoch": 6.8893357164134645, "percentage": 68.89, "elapsed_time": "3:11:56", "remaining_time": "1:26:39", "throughput": 2316.63, "total_tokens": 26678568} {"current_steps": 46260, "total_steps": 67140, "loss": 0.5689, "lr": 1.3340862880094661e-05, "epoch": 6.890080428954423, "percentage": 68.9, "elapsed_time": "3:11:57", "remaining_time": "1:26:38", "throughput": 2316.64, "total_tokens": 26681224} {"current_steps": 46265, "total_steps": 67140, "loss": 0.5794, "lr": 1.3335114448812235e-05, "epoch": 6.890825141495383, "percentage": 68.91, "elapsed_time": "3:11:58", "remaining_time": "1:26:37", "throughput": 2316.67, "total_tokens": 26684232} {"current_steps": 46270, "total_steps": 67140, "loss": 0.618, "lr": 1.3329366805795357e-05, "epoch": 6.891569854036342, "percentage": 68.92, "elapsed_time": "3:11:59", "remaining_time": "1:26:35", "throughput": 2316.68, "total_tokens": 26686984} {"current_steps": 46275, "total_steps": 67140, "loss": 0.5355, "lr": 1.3323619951432415e-05, "epoch": 6.892314566577301, "percentage": 68.92, "elapsed_time": "3:12:00", "remaining_time": "1:26:34", "throughput": 2316.7, "total_tokens": 26689800} {"current_steps": 46280, "total_steps": 67140, "loss": 0.6992, "lr": 1.3317873886111759e-05, "epoch": 6.89305927911826, "percentage": 68.93, "elapsed_time": "3:12:01", "remaining_time": "1:26:33", "throughput": 2316.73, "total_tokens": 26692808} {"current_steps": 46285, "total_steps": 67140, "loss": 0.7803, "lr": 1.331212861022169e-05, "epoch": 6.89380399165922, "percentage": 68.94, "elapsed_time": "3:12:02", "remaining_time": "1:26:31", "throughput": 2316.74, "total_tokens": 26695432} {"current_steps": 46290, "total_steps": 67140, "loss": 0.585, "lr": 1.3306384124150464e-05, "epoch": 6.8945487042001785, "percentage": 68.95, "elapsed_time": "3:12:04", "remaining_time": "1:26:30", "throughput": 2316.76, "total_tokens": 26698376} {"current_steps": 46295, "total_steps": 67140, "loss": 0.6341, "lr": 1.3300640428286244e-05, "epoch": 6.895293416741138, "percentage": 68.95, "elapsed_time": "3:12:05", "remaining_time": "1:26:29", "throughput": 2316.77, "total_tokens": 26701128} {"current_steps": 46300, "total_steps": 67140, "loss": 0.602, "lr": 1.3294897523017177e-05, "epoch": 6.896038129282097, "percentage": 68.96, "elapsed_time": "3:12:06", "remaining_time": "1:26:28", "throughput": 2316.79, "total_tokens": 26703912} {"current_steps": 46305, "total_steps": 67140, "loss": 0.5515, "lr": 1.3289155408731346e-05, "epoch": 6.896782841823057, "percentage": 68.97, "elapsed_time": "3:12:07", "remaining_time": "1:26:26", "throughput": 2316.83, "total_tokens": 26707080} {"current_steps": 46310, "total_steps": 67140, "loss": 0.7254, "lr": 1.3283414085816793e-05, "epoch": 6.897527554364015, "percentage": 68.98, "elapsed_time": "3:12:08", "remaining_time": "1:26:25", "throughput": 2316.84, "total_tokens": 26709768} {"current_steps": 46315, "total_steps": 67140, "loss": 0.6495, "lr": 1.3277673554661466e-05, "epoch": 6.898272266904975, "percentage": 68.98, "elapsed_time": "3:12:09", "remaining_time": "1:26:24", "throughput": 2316.87, "total_tokens": 26712840} {"current_steps": 46320, "total_steps": 67140, "loss": 0.616, "lr": 1.3271933815653303e-05, "epoch": 6.899016979445934, "percentage": 68.99, "elapsed_time": "3:12:10", "remaining_time": "1:26:22", "throughput": 2316.9, "total_tokens": 26715752} {"current_steps": 46325, "total_steps": 67140, "loss": 0.673, "lr": 1.3266194869180176e-05, "epoch": 6.899761691986893, "percentage": 69.0, "elapsed_time": "3:12:11", "remaining_time": "1:26:21", "throughput": 2316.93, "total_tokens": 26718760} {"current_steps": 46330, "total_steps": 67140, "loss": 0.5556, "lr": 1.3260456715629888e-05, "epoch": 6.900506404527852, "percentage": 69.01, "elapsed_time": "3:12:13", "remaining_time": "1:26:20", "throughput": 2316.97, "total_tokens": 26722120} {"current_steps": 46335, "total_steps": 67140, "loss": 0.619, "lr": 1.3254719355390206e-05, "epoch": 6.901251117068812, "percentage": 69.01, "elapsed_time": "3:12:14", "remaining_time": "1:26:19", "throughput": 2316.99, "total_tokens": 26724936} {"current_steps": 46340, "total_steps": 67140, "loss": 0.5657, "lr": 1.3248982788848832e-05, "epoch": 6.9019958296097705, "percentage": 69.02, "elapsed_time": "3:12:15", "remaining_time": "1:26:17", "throughput": 2317.01, "total_tokens": 26727720} {"current_steps": 46345, "total_steps": 67140, "loss": 0.5462, "lr": 1.3243247016393429e-05, "epoch": 6.90274054215073, "percentage": 69.03, "elapsed_time": "3:12:16", "remaining_time": "1:26:16", "throughput": 2317.02, "total_tokens": 26730536} {"current_steps": 46350, "total_steps": 67140, "loss": 0.5031, "lr": 1.3237512038411604e-05, "epoch": 6.903485254691689, "percentage": 69.03, "elapsed_time": "3:12:17", "remaining_time": "1:26:15", "throughput": 2317.05, "total_tokens": 26733448} {"current_steps": 46355, "total_steps": 67140, "loss": 0.5321, "lr": 1.3231777855290878e-05, "epoch": 6.904229967232649, "percentage": 69.04, "elapsed_time": "3:12:19", "remaining_time": "1:26:13", "throughput": 2317.13, "total_tokens": 26737608} {"current_steps": 46360, "total_steps": 67140, "loss": 0.5289, "lr": 1.3226044467418771e-05, "epoch": 6.904974679773607, "percentage": 69.05, "elapsed_time": "3:12:20", "remaining_time": "1:26:12", "throughput": 2317.14, "total_tokens": 26740360} {"current_steps": 46365, "total_steps": 67140, "loss": 0.5697, "lr": 1.3220311875182701e-05, "epoch": 6.905719392314566, "percentage": 69.06, "elapsed_time": "3:12:21", "remaining_time": "1:26:11", "throughput": 2317.17, "total_tokens": 26743240} {"current_steps": 46370, "total_steps": 67140, "loss": 0.5976, "lr": 1.3214580078970063e-05, "epoch": 6.906464104855526, "percentage": 69.06, "elapsed_time": "3:12:22", "remaining_time": "1:26:10", "throughput": 2317.19, "total_tokens": 26746216} {"current_steps": 46375, "total_steps": 67140, "loss": 0.7559, "lr": 1.3208849079168184e-05, "epoch": 6.907208817396485, "percentage": 69.07, "elapsed_time": "3:12:23", "remaining_time": "1:26:08", "throughput": 2317.23, "total_tokens": 26749576} {"current_steps": 46380, "total_steps": 67140, "loss": 0.625, "lr": 1.3203118876164345e-05, "epoch": 6.907953529937444, "percentage": 69.08, "elapsed_time": "3:12:24", "remaining_time": "1:26:07", "throughput": 2317.27, "total_tokens": 26752648} {"current_steps": 46385, "total_steps": 67140, "loss": 0.4475, "lr": 1.3197389470345778e-05, "epoch": 6.908698242478403, "percentage": 69.09, "elapsed_time": "3:12:26", "remaining_time": "1:26:06", "throughput": 2317.28, "total_tokens": 26755272} {"current_steps": 46390, "total_steps": 67140, "loss": 0.507, "lr": 1.3191660862099647e-05, "epoch": 6.909442955019363, "percentage": 69.09, "elapsed_time": "3:12:27", "remaining_time": "1:26:04", "throughput": 2317.28, "total_tokens": 26757768} {"current_steps": 46395, "total_steps": 67140, "loss": 0.5491, "lr": 1.3185933051813057e-05, "epoch": 6.910187667560322, "percentage": 69.1, "elapsed_time": "3:12:28", "remaining_time": "1:26:03", "throughput": 2317.29, "total_tokens": 26760488} {"current_steps": 46400, "total_steps": 67140, "loss": 0.5447, "lr": 1.3180206039873078e-05, "epoch": 6.910932380101281, "percentage": 69.11, "elapsed_time": "3:12:29", "remaining_time": "1:26:02", "throughput": 2317.32, "total_tokens": 26763464} {"current_steps": 46405, "total_steps": 67140, "loss": 0.6588, "lr": 1.317447982666672e-05, "epoch": 6.91167709264224, "percentage": 69.12, "elapsed_time": "3:12:30", "remaining_time": "1:26:01", "throughput": 2317.34, "total_tokens": 26766472} {"current_steps": 46410, "total_steps": 67140, "loss": 0.5082, "lr": 1.3168754412580934e-05, "epoch": 6.912421805183199, "percentage": 69.12, "elapsed_time": "3:12:31", "remaining_time": "1:25:59", "throughput": 2317.37, "total_tokens": 26769416} {"current_steps": 46415, "total_steps": 67140, "loss": 0.747, "lr": 1.3163029798002625e-05, "epoch": 6.913166517724158, "percentage": 69.13, "elapsed_time": "3:12:32", "remaining_time": "1:25:58", "throughput": 2317.39, "total_tokens": 26772232} {"current_steps": 46420, "total_steps": 67140, "loss": 0.6379, "lr": 1.3157305983318643e-05, "epoch": 6.913911230265118, "percentage": 69.14, "elapsed_time": "3:12:33", "remaining_time": "1:25:57", "throughput": 2317.41, "total_tokens": 26775080} {"current_steps": 46425, "total_steps": 67140, "loss": 0.4169, "lr": 1.3151582968915766e-05, "epoch": 6.9146559428060765, "percentage": 69.15, "elapsed_time": "3:12:35", "remaining_time": "1:25:55", "throughput": 2317.42, "total_tokens": 26777832} {"current_steps": 46430, "total_steps": 67140, "loss": 0.7428, "lr": 1.314586075518075e-05, "epoch": 6.915400655347036, "percentage": 69.15, "elapsed_time": "3:12:36", "remaining_time": "1:25:54", "throughput": 2317.44, "total_tokens": 26780584} {"current_steps": 46435, "total_steps": 67140, "loss": 0.5511, "lr": 1.3140139342500257e-05, "epoch": 6.916145367887995, "percentage": 69.16, "elapsed_time": "3:12:37", "remaining_time": "1:25:53", "throughput": 2317.46, "total_tokens": 26783400} {"current_steps": 46440, "total_steps": 67140, "loss": 0.6267, "lr": 1.3134418731260931e-05, "epoch": 6.916890080428955, "percentage": 69.17, "elapsed_time": "3:12:38", "remaining_time": "1:25:51", "throughput": 2317.49, "total_tokens": 26786472} {"current_steps": 46445, "total_steps": 67140, "loss": 0.6645, "lr": 1.3128698921849344e-05, "epoch": 6.917634792969913, "percentage": 69.18, "elapsed_time": "3:12:39", "remaining_time": "1:25:50", "throughput": 2317.51, "total_tokens": 26789192} {"current_steps": 46450, "total_steps": 67140, "loss": 0.3681, "lr": 1.3122979914652016e-05, "epoch": 6.918379505510873, "percentage": 69.18, "elapsed_time": "3:12:40", "remaining_time": "1:25:49", "throughput": 2317.55, "total_tokens": 26792488} {"current_steps": 46455, "total_steps": 67140, "loss": 0.5401, "lr": 1.3117261710055433e-05, "epoch": 6.919124218051832, "percentage": 69.19, "elapsed_time": "3:12:41", "remaining_time": "1:25:48", "throughput": 2317.57, "total_tokens": 26795336} {"current_steps": 46460, "total_steps": 67140, "loss": 0.6885, "lr": 1.3111544308445977e-05, "epoch": 6.919868930592791, "percentage": 69.2, "elapsed_time": "3:12:42", "remaining_time": "1:25:46", "throughput": 2317.59, "total_tokens": 26798248} {"current_steps": 46465, "total_steps": 67140, "loss": 0.6632, "lr": 1.3105827710210026e-05, "epoch": 6.92061364313375, "percentage": 69.21, "elapsed_time": "3:12:44", "remaining_time": "1:25:45", "throughput": 2317.6, "total_tokens": 26800872} {"current_steps": 46470, "total_steps": 67140, "loss": 0.6865, "lr": 1.3100111915733887e-05, "epoch": 6.92135835567471, "percentage": 69.21, "elapsed_time": "3:12:45", "remaining_time": "1:25:44", "throughput": 2317.62, "total_tokens": 26803720} {"current_steps": 46475, "total_steps": 67140, "loss": 0.6445, "lr": 1.3094396925403793e-05, "epoch": 6.922103068215669, "percentage": 69.22, "elapsed_time": "3:12:46", "remaining_time": "1:25:42", "throughput": 2317.65, "total_tokens": 26806728} {"current_steps": 46480, "total_steps": 67140, "loss": 0.5229, "lr": 1.308868273960595e-05, "epoch": 6.922847780756628, "percentage": 69.23, "elapsed_time": "3:12:47", "remaining_time": "1:25:41", "throughput": 2317.65, "total_tokens": 26809320} {"current_steps": 46485, "total_steps": 67140, "loss": 0.5005, "lr": 1.3082969358726502e-05, "epoch": 6.923592493297587, "percentage": 69.24, "elapsed_time": "3:12:48", "remaining_time": "1:25:40", "throughput": 2317.67, "total_tokens": 26812072} {"current_steps": 46490, "total_steps": 67140, "loss": 0.7128, "lr": 1.3077256783151542e-05, "epoch": 6.924337205838547, "percentage": 69.24, "elapsed_time": "3:12:49", "remaining_time": "1:25:39", "throughput": 2317.69, "total_tokens": 26815048} {"current_steps": 46495, "total_steps": 67140, "loss": 0.8139, "lr": 1.3071545013267084e-05, "epoch": 6.925081918379505, "percentage": 69.25, "elapsed_time": "3:12:50", "remaining_time": "1:25:37", "throughput": 2317.73, "total_tokens": 26818248} {"current_steps": 46500, "total_steps": 67140, "loss": 0.5726, "lr": 1.3065834049459117e-05, "epoch": 6.925826630920465, "percentage": 69.26, "elapsed_time": "3:12:52", "remaining_time": "1:25:36", "throughput": 2317.74, "total_tokens": 26820968} {"current_steps": 46505, "total_steps": 67140, "loss": 0.4148, "lr": 1.3060123892113562e-05, "epoch": 6.926571343461424, "percentage": 69.27, "elapsed_time": "3:12:53", "remaining_time": "1:25:35", "throughput": 2317.77, "total_tokens": 26823912} {"current_steps": 46510, "total_steps": 67140, "loss": 0.6855, "lr": 1.3054414541616305e-05, "epoch": 6.927316056002383, "percentage": 69.27, "elapsed_time": "3:12:54", "remaining_time": "1:25:33", "throughput": 2317.78, "total_tokens": 26826632} {"current_steps": 46515, "total_steps": 67140, "loss": 0.5658, "lr": 1.3048705998353133e-05, "epoch": 6.928060768543342, "percentage": 69.28, "elapsed_time": "3:12:55", "remaining_time": "1:25:32", "throughput": 2317.8, "total_tokens": 26829480} {"current_steps": 46520, "total_steps": 67140, "loss": 0.6819, "lr": 1.3042998262709821e-05, "epoch": 6.928805481084302, "percentage": 69.29, "elapsed_time": "3:12:56", "remaining_time": "1:25:31", "throughput": 2317.81, "total_tokens": 26832168} {"current_steps": 46525, "total_steps": 67140, "loss": 0.645, "lr": 1.303729133507208e-05, "epoch": 6.929550193625261, "percentage": 69.3, "elapsed_time": "3:12:57", "remaining_time": "1:25:29", "throughput": 2317.84, "total_tokens": 26835080} {"current_steps": 46530, "total_steps": 67140, "loss": 0.7366, "lr": 1.3031585215825545e-05, "epoch": 6.930294906166219, "percentage": 69.3, "elapsed_time": "3:12:58", "remaining_time": "1:25:28", "throughput": 2317.87, "total_tokens": 26838088} {"current_steps": 46535, "total_steps": 67140, "loss": 0.6105, "lr": 1.302587990535582e-05, "epoch": 6.931039618707179, "percentage": 69.31, "elapsed_time": "3:12:59", "remaining_time": "1:25:27", "throughput": 2317.88, "total_tokens": 26840872} {"current_steps": 46540, "total_steps": 67140, "loss": 0.6974, "lr": 1.302017540404845e-05, "epoch": 6.931784331248139, "percentage": 69.32, "elapsed_time": "3:13:01", "remaining_time": "1:25:26", "throughput": 2317.91, "total_tokens": 26843880} {"current_steps": 46545, "total_steps": 67140, "loss": 0.576, "lr": 1.3014471712288917e-05, "epoch": 6.932529043789097, "percentage": 69.33, "elapsed_time": "3:13:02", "remaining_time": "1:25:24", "throughput": 2317.94, "total_tokens": 26846856} {"current_steps": 46550, "total_steps": 67140, "loss": 0.5715, "lr": 1.300876883046267e-05, "epoch": 6.933273756330056, "percentage": 69.33, "elapsed_time": "3:13:03", "remaining_time": "1:25:23", "throughput": 2317.95, "total_tokens": 26849640} {"current_steps": 46555, "total_steps": 67140, "loss": 0.4711, "lr": 1.3003066758955068e-05, "epoch": 6.934018468871016, "percentage": 69.34, "elapsed_time": "3:13:04", "remaining_time": "1:25:22", "throughput": 2317.98, "total_tokens": 26852648} {"current_steps": 46560, "total_steps": 67140, "loss": 0.6516, "lr": 1.2997365498151431e-05, "epoch": 6.9347631814119755, "percentage": 69.35, "elapsed_time": "3:13:05", "remaining_time": "1:25:20", "throughput": 2318.0, "total_tokens": 26855560} {"current_steps": 46565, "total_steps": 67140, "loss": 0.5855, "lr": 1.2991665048437036e-05, "epoch": 6.935507893952934, "percentage": 69.36, "elapsed_time": "3:13:06", "remaining_time": "1:25:19", "throughput": 2318.02, "total_tokens": 26858472} {"current_steps": 46570, "total_steps": 67140, "loss": 0.662, "lr": 1.2985965410197092e-05, "epoch": 6.936252606493893, "percentage": 69.36, "elapsed_time": "3:13:07", "remaining_time": "1:25:18", "throughput": 2318.03, "total_tokens": 26861096} {"current_steps": 46575, "total_steps": 67140, "loss": 0.5184, "lr": 1.2980266583816763e-05, "epoch": 6.936997319034853, "percentage": 69.37, "elapsed_time": "3:13:09", "remaining_time": "1:25:17", "throughput": 2318.06, "total_tokens": 26864008} {"current_steps": 46580, "total_steps": 67140, "loss": 0.5053, "lr": 1.2974568569681147e-05, "epoch": 6.937742031575811, "percentage": 69.38, "elapsed_time": "3:13:10", "remaining_time": "1:25:15", "throughput": 2318.07, "total_tokens": 26866760} {"current_steps": 46585, "total_steps": 67140, "loss": 0.5683, "lr": 1.2968871368175306e-05, "epoch": 6.938486744116771, "percentage": 69.38, "elapsed_time": "3:13:11", "remaining_time": "1:25:14", "throughput": 2318.08, "total_tokens": 26869416} {"current_steps": 46590, "total_steps": 67140, "loss": 0.6816, "lr": 1.2963174979684223e-05, "epoch": 6.93923145665773, "percentage": 69.39, "elapsed_time": "3:13:12", "remaining_time": "1:25:13", "throughput": 2318.1, "total_tokens": 26872296} {"current_steps": 46595, "total_steps": 67140, "loss": 0.5595, "lr": 1.2957479404592826e-05, "epoch": 6.939976169198689, "percentage": 69.4, "elapsed_time": "3:13:13", "remaining_time": "1:25:11", "throughput": 2318.13, "total_tokens": 26875336} {"current_steps": 46600, "total_steps": 67140, "loss": 0.7539, "lr": 1.2951784643286014e-05, "epoch": 6.940720881739648, "percentage": 69.41, "elapsed_time": "3:13:14", "remaining_time": "1:25:10", "throughput": 2318.14, "total_tokens": 26877896} {"current_steps": 46605, "total_steps": 67140, "loss": 0.665, "lr": 1.2946090696148606e-05, "epoch": 6.941465594280608, "percentage": 69.41, "elapsed_time": "3:13:15", "remaining_time": "1:25:09", "throughput": 2318.16, "total_tokens": 26880872} {"current_steps": 46610, "total_steps": 67140, "loss": 0.6743, "lr": 1.2940397563565381e-05, "epoch": 6.942210306821567, "percentage": 69.42, "elapsed_time": "3:13:16", "remaining_time": "1:25:08", "throughput": 2318.2, "total_tokens": 26883944} {"current_steps": 46615, "total_steps": 67140, "loss": 0.4977, "lr": 1.2934705245921058e-05, "epoch": 6.942955019362526, "percentage": 69.43, "elapsed_time": "3:13:18", "remaining_time": "1:25:06", "throughput": 2318.23, "total_tokens": 26887016} {"current_steps": 46620, "total_steps": 67140, "loss": 0.4151, "lr": 1.2929013743600316e-05, "epoch": 6.943699731903485, "percentage": 69.44, "elapsed_time": "3:13:19", "remaining_time": "1:25:05", "throughput": 2318.25, "total_tokens": 26889992} {"current_steps": 46625, "total_steps": 67140, "loss": 0.696, "lr": 1.2923323056987733e-05, "epoch": 6.944444444444445, "percentage": 69.44, "elapsed_time": "3:13:20", "remaining_time": "1:25:04", "throughput": 2318.27, "total_tokens": 26892744} {"current_steps": 46630, "total_steps": 67140, "loss": 0.6733, "lr": 1.2917633186467886e-05, "epoch": 6.945189156985403, "percentage": 69.45, "elapsed_time": "3:13:21", "remaining_time": "1:25:02", "throughput": 2318.28, "total_tokens": 26895400} {"current_steps": 46635, "total_steps": 67140, "loss": 0.5421, "lr": 1.2911944132425261e-05, "epoch": 6.945933869526363, "percentage": 69.46, "elapsed_time": "3:13:22", "remaining_time": "1:25:01", "throughput": 2318.29, "total_tokens": 26898152} {"current_steps": 46640, "total_steps": 67140, "loss": 0.6282, "lr": 1.2906255895244301e-05, "epoch": 6.946678582067322, "percentage": 69.47, "elapsed_time": "3:13:23", "remaining_time": "1:25:00", "throughput": 2318.3, "total_tokens": 26900840} {"current_steps": 46645, "total_steps": 67140, "loss": 0.5509, "lr": 1.29005684753094e-05, "epoch": 6.9474232946082815, "percentage": 69.47, "elapsed_time": "3:13:24", "remaining_time": "1:24:58", "throughput": 2318.32, "total_tokens": 26903688} {"current_steps": 46650, "total_steps": 67140, "loss": 0.7131, "lr": 1.2894881873004889e-05, "epoch": 6.94816800714924, "percentage": 69.48, "elapsed_time": "3:13:25", "remaining_time": "1:24:57", "throughput": 2318.35, "total_tokens": 26906760} {"current_steps": 46655, "total_steps": 67140, "loss": 0.5622, "lr": 1.288919608871505e-05, "epoch": 6.9489127196902, "percentage": 69.49, "elapsed_time": "3:13:27", "remaining_time": "1:24:56", "throughput": 2318.37, "total_tokens": 26909512} {"current_steps": 46660, "total_steps": 67140, "loss": 0.9223, "lr": 1.2883511122824093e-05, "epoch": 6.949657432231159, "percentage": 69.5, "elapsed_time": "3:13:28", "remaining_time": "1:24:55", "throughput": 2318.38, "total_tokens": 26912296} {"current_steps": 46665, "total_steps": 67140, "loss": 0.5301, "lr": 1.2877826975716195e-05, "epoch": 6.950402144772118, "percentage": 69.5, "elapsed_time": "3:13:29", "remaining_time": "1:24:53", "throughput": 2318.38, "total_tokens": 26914888} {"current_steps": 46670, "total_steps": 67140, "loss": 0.5877, "lr": 1.2872143647775476e-05, "epoch": 6.951146857313077, "percentage": 69.51, "elapsed_time": "3:13:30", "remaining_time": "1:24:52", "throughput": 2318.42, "total_tokens": 26918120} {"current_steps": 46675, "total_steps": 67140, "loss": 0.5355, "lr": 1.2866461139385966e-05, "epoch": 6.951891569854037, "percentage": 69.52, "elapsed_time": "3:13:31", "remaining_time": "1:24:51", "throughput": 2318.44, "total_tokens": 26920968} {"current_steps": 46680, "total_steps": 67140, "loss": 0.6567, "lr": 1.2860779450931684e-05, "epoch": 6.952636282394995, "percentage": 69.53, "elapsed_time": "3:13:32", "remaining_time": "1:24:49", "throughput": 2318.47, "total_tokens": 26924072} {"current_steps": 46685, "total_steps": 67140, "loss": 0.4678, "lr": 1.285509858279657e-05, "epoch": 6.953380994935955, "percentage": 69.53, "elapsed_time": "3:13:33", "remaining_time": "1:24:48", "throughput": 2318.49, "total_tokens": 26926920} {"current_steps": 46690, "total_steps": 67140, "loss": 0.556, "lr": 1.2849418535364527e-05, "epoch": 6.954125707476914, "percentage": 69.54, "elapsed_time": "3:13:35", "remaining_time": "1:24:47", "throughput": 2318.5, "total_tokens": 26929640} {"current_steps": 46695, "total_steps": 67140, "loss": 0.7635, "lr": 1.284373930901937e-05, "epoch": 6.9548704200178735, "percentage": 69.55, "elapsed_time": "3:13:36", "remaining_time": "1:24:46", "throughput": 2318.52, "total_tokens": 26932424} {"current_steps": 46700, "total_steps": 67140, "loss": 0.5964, "lr": 1.2838060904144888e-05, "epoch": 6.955615132558832, "percentage": 69.56, "elapsed_time": "3:13:37", "remaining_time": "1:24:44", "throughput": 2318.53, "total_tokens": 26935272} {"current_steps": 46705, "total_steps": 67140, "loss": 0.6381, "lr": 1.28323833211248e-05, "epoch": 6.956359845099792, "percentage": 69.56, "elapsed_time": "3:13:38", "remaining_time": "1:24:43", "throughput": 2318.56, "total_tokens": 26938216} {"current_steps": 46710, "total_steps": 67140, "loss": 0.5788, "lr": 1.2826706560342788e-05, "epoch": 6.957104557640751, "percentage": 69.57, "elapsed_time": "3:13:39", "remaining_time": "1:24:42", "throughput": 2318.58, "total_tokens": 26941192} {"current_steps": 46715, "total_steps": 67140, "loss": 0.6141, "lr": 1.2821030622182444e-05, "epoch": 6.957849270181709, "percentage": 69.58, "elapsed_time": "3:13:40", "remaining_time": "1:24:40", "throughput": 2318.6, "total_tokens": 26944040} {"current_steps": 46720, "total_steps": 67140, "loss": 0.6017, "lr": 1.2815355507027344e-05, "epoch": 6.958593982722669, "percentage": 69.59, "elapsed_time": "3:13:41", "remaining_time": "1:24:39", "throughput": 2318.6, "total_tokens": 26946536} {"current_steps": 46725, "total_steps": 67140, "loss": 0.4768, "lr": 1.280968121526097e-05, "epoch": 6.959338695263629, "percentage": 69.59, "elapsed_time": "3:13:43", "remaining_time": "1:24:38", "throughput": 2318.62, "total_tokens": 26949320} {"current_steps": 46730, "total_steps": 67140, "loss": 0.7256, "lr": 1.2804007747266778e-05, "epoch": 6.9600834078045875, "percentage": 69.6, "elapsed_time": "3:13:44", "remaining_time": "1:24:37", "throughput": 2318.64, "total_tokens": 26952264} {"current_steps": 46735, "total_steps": 67140, "loss": 0.5688, "lr": 1.2798335103428157e-05, "epoch": 6.960828120345546, "percentage": 69.61, "elapsed_time": "3:13:45", "remaining_time": "1:24:35", "throughput": 2318.66, "total_tokens": 26955080} {"current_steps": 46740, "total_steps": 67140, "loss": 0.7386, "lr": 1.2792663284128443e-05, "epoch": 6.961572832886506, "percentage": 69.62, "elapsed_time": "3:13:46", "remaining_time": "1:24:34", "throughput": 2318.67, "total_tokens": 26957768} {"current_steps": 46745, "total_steps": 67140, "loss": 0.584, "lr": 1.2786992289750909e-05, "epoch": 6.962317545427465, "percentage": 69.62, "elapsed_time": "3:13:47", "remaining_time": "1:24:33", "throughput": 2318.71, "total_tokens": 26960936} {"current_steps": 46750, "total_steps": 67140, "loss": 0.5813, "lr": 1.2781322120678796e-05, "epoch": 6.963062257968424, "percentage": 69.63, "elapsed_time": "3:13:48", "remaining_time": "1:24:31", "throughput": 2318.74, "total_tokens": 26963944} {"current_steps": 46755, "total_steps": 67140, "loss": 0.5732, "lr": 1.2775652777295252e-05, "epoch": 6.963806970509383, "percentage": 69.64, "elapsed_time": "3:13:49", "remaining_time": "1:24:30", "throughput": 2318.76, "total_tokens": 26966920} {"current_steps": 46760, "total_steps": 67140, "loss": 0.65, "lr": 1.2769984259983386e-05, "epoch": 6.964551683050343, "percentage": 69.65, "elapsed_time": "3:13:51", "remaining_time": "1:24:29", "throughput": 2318.8, "total_tokens": 26970088} {"current_steps": 46765, "total_steps": 67140, "loss": 0.5753, "lr": 1.2764316569126258e-05, "epoch": 6.965296395591301, "percentage": 69.65, "elapsed_time": "3:13:52", "remaining_time": "1:24:28", "throughput": 2318.82, "total_tokens": 26972968} {"current_steps": 46770, "total_steps": 67140, "loss": 0.4484, "lr": 1.275864970510687e-05, "epoch": 6.966041108132261, "percentage": 69.66, "elapsed_time": "3:13:53", "remaining_time": "1:24:26", "throughput": 2318.83, "total_tokens": 26975752} {"current_steps": 46775, "total_steps": 67140, "loss": 0.7117, "lr": 1.2752983668308167e-05, "epoch": 6.96678582067322, "percentage": 69.67, "elapsed_time": "3:13:54", "remaining_time": "1:24:25", "throughput": 2318.87, "total_tokens": 26978856} {"current_steps": 46780, "total_steps": 67140, "loss": 0.5734, "lr": 1.2747318459113033e-05, "epoch": 6.9675305332141795, "percentage": 69.68, "elapsed_time": "3:13:55", "remaining_time": "1:24:24", "throughput": 2318.88, "total_tokens": 26981608} {"current_steps": 46785, "total_steps": 67140, "loss": 0.6452, "lr": 1.2741654077904313e-05, "epoch": 6.968275245755138, "percentage": 69.68, "elapsed_time": "3:13:56", "remaining_time": "1:24:22", "throughput": 2318.9, "total_tokens": 26984456} {"current_steps": 46790, "total_steps": 67140, "loss": 0.6161, "lr": 1.273599052506476e-05, "epoch": 6.969019958296098, "percentage": 69.69, "elapsed_time": "3:13:57", "remaining_time": "1:24:21", "throughput": 2318.91, "total_tokens": 26987208} {"current_steps": 46795, "total_steps": 67140, "loss": 0.5574, "lr": 1.2730327800977116e-05, "epoch": 6.969764670837057, "percentage": 69.7, "elapsed_time": "3:13:59", "remaining_time": "1:24:20", "throughput": 2318.93, "total_tokens": 26990184} {"current_steps": 46800, "total_steps": 67140, "loss": 0.5346, "lr": 1.2724665906024025e-05, "epoch": 6.970509383378016, "percentage": 69.71, "elapsed_time": "3:14:00", "remaining_time": "1:24:18", "throughput": 2318.95, "total_tokens": 26992872} {"current_steps": 46805, "total_steps": 67140, "loss": 0.5957, "lr": 1.2719004840588106e-05, "epoch": 6.971254095918975, "percentage": 69.71, "elapsed_time": "3:14:01", "remaining_time": "1:24:17", "throughput": 2318.96, "total_tokens": 26995624} {"current_steps": 46810, "total_steps": 67140, "loss": 0.6635, "lr": 1.2713344605051905e-05, "epoch": 6.971998808459935, "percentage": 69.72, "elapsed_time": "3:14:02", "remaining_time": "1:24:16", "throughput": 2319.0, "total_tokens": 26998760} {"current_steps": 46815, "total_steps": 67140, "loss": 0.379, "lr": 1.2707685199797926e-05, "epoch": 6.9727435210008935, "percentage": 69.73, "elapsed_time": "3:14:03", "remaining_time": "1:24:15", "throughput": 2319.01, "total_tokens": 27001448} {"current_steps": 46820, "total_steps": 67140, "loss": 0.6719, "lr": 1.270202662520861e-05, "epoch": 6.973488233541853, "percentage": 69.73, "elapsed_time": "3:14:04", "remaining_time": "1:24:13", "throughput": 2319.03, "total_tokens": 27004264} {"current_steps": 46825, "total_steps": 67140, "loss": 0.5, "lr": 1.2696368881666325e-05, "epoch": 6.974232946082812, "percentage": 69.74, "elapsed_time": "3:14:05", "remaining_time": "1:24:12", "throughput": 2319.05, "total_tokens": 27007176} {"current_steps": 46830, "total_steps": 67140, "loss": 0.7683, "lr": 1.2690711969553412e-05, "epoch": 6.9749776586237715, "percentage": 69.75, "elapsed_time": "3:14:06", "remaining_time": "1:24:11", "throughput": 2319.07, "total_tokens": 27010088} {"current_steps": 46835, "total_steps": 67140, "loss": 0.4409, "lr": 1.2685055889252146e-05, "epoch": 6.97572237116473, "percentage": 69.76, "elapsed_time": "3:14:08", "remaining_time": "1:24:09", "throughput": 2319.08, "total_tokens": 27012776} {"current_steps": 46840, "total_steps": 67140, "loss": 0.7243, "lr": 1.2679400641144723e-05, "epoch": 6.97646708370569, "percentage": 69.76, "elapsed_time": "3:14:09", "remaining_time": "1:24:08", "throughput": 2319.11, "total_tokens": 27015688} {"current_steps": 46845, "total_steps": 67140, "loss": 0.6147, "lr": 1.2673746225613315e-05, "epoch": 6.977211796246649, "percentage": 69.77, "elapsed_time": "3:14:10", "remaining_time": "1:24:07", "throughput": 2319.13, "total_tokens": 27018568} {"current_steps": 46850, "total_steps": 67140, "loss": 0.557, "lr": 1.2668092643040018e-05, "epoch": 6.977956508787608, "percentage": 69.78, "elapsed_time": "3:14:11", "remaining_time": "1:24:06", "throughput": 2319.14, "total_tokens": 27021288} {"current_steps": 46855, "total_steps": 67140, "loss": 0.6256, "lr": 1.2662439893806899e-05, "epoch": 6.978701221328567, "percentage": 69.79, "elapsed_time": "3:14:12", "remaining_time": "1:24:04", "throughput": 2319.16, "total_tokens": 27024200} {"current_steps": 46860, "total_steps": 67140, "loss": 0.6093, "lr": 1.2656787978295913e-05, "epoch": 6.979445933869527, "percentage": 69.79, "elapsed_time": "3:14:13", "remaining_time": "1:24:03", "throughput": 2319.18, "total_tokens": 27027048} {"current_steps": 46865, "total_steps": 67140, "loss": 0.4445, "lr": 1.265113689688902e-05, "epoch": 6.9801906464104855, "percentage": 69.8, "elapsed_time": "3:14:14", "remaining_time": "1:24:02", "throughput": 2319.2, "total_tokens": 27029896} {"current_steps": 46870, "total_steps": 67140, "loss": 0.5451, "lr": 1.2645486649968085e-05, "epoch": 6.980935358951445, "percentage": 69.81, "elapsed_time": "3:14:15", "remaining_time": "1:24:00", "throughput": 2319.21, "total_tokens": 27032616} {"current_steps": 46875, "total_steps": 67140, "loss": 0.4719, "lr": 1.2639837237914943e-05, "epoch": 6.981680071492404, "percentage": 69.82, "elapsed_time": "3:14:17", "remaining_time": "1:23:59", "throughput": 2319.22, "total_tokens": 27035304} {"current_steps": 46880, "total_steps": 67140, "loss": 0.4706, "lr": 1.2634188661111335e-05, "epoch": 6.982424784033363, "percentage": 69.82, "elapsed_time": "3:14:18", "remaining_time": "1:23:58", "throughput": 2319.24, "total_tokens": 27038184} {"current_steps": 46885, "total_steps": 67140, "loss": 0.8694, "lr": 1.2628540919938991e-05, "epoch": 6.983169496574322, "percentage": 69.83, "elapsed_time": "3:14:19", "remaining_time": "1:23:56", "throughput": 2319.26, "total_tokens": 27040904} {"current_steps": 46890, "total_steps": 67140, "loss": 0.5119, "lr": 1.2622894014779547e-05, "epoch": 6.983914209115282, "percentage": 69.84, "elapsed_time": "3:14:20", "remaining_time": "1:23:55", "throughput": 2319.27, "total_tokens": 27043720} {"current_steps": 46895, "total_steps": 67140, "loss": 0.6231, "lr": 1.2617247946014604e-05, "epoch": 6.984658921656241, "percentage": 69.85, "elapsed_time": "3:14:21", "remaining_time": "1:23:54", "throughput": 2319.31, "total_tokens": 27046984} {"current_steps": 46900, "total_steps": 67140, "loss": 0.5453, "lr": 1.2611602714025696e-05, "epoch": 6.9854036341971995, "percentage": 69.85, "elapsed_time": "3:14:22", "remaining_time": "1:23:53", "throughput": 2319.33, "total_tokens": 27049800} {"current_steps": 46905, "total_steps": 67140, "loss": 0.5977, "lr": 1.2605958319194311e-05, "epoch": 6.986148346738159, "percentage": 69.86, "elapsed_time": "3:14:23", "remaining_time": "1:23:51", "throughput": 2319.38, "total_tokens": 27053064} {"current_steps": 46910, "total_steps": 67140, "loss": 0.5847, "lr": 1.2600314761901874e-05, "epoch": 6.986893059279119, "percentage": 69.87, "elapsed_time": "3:14:25", "remaining_time": "1:23:50", "throughput": 2319.39, "total_tokens": 27055816} {"current_steps": 46915, "total_steps": 67140, "loss": 0.6032, "lr": 1.259467204252976e-05, "epoch": 6.9876377718200775, "percentage": 69.88, "elapsed_time": "3:14:26", "remaining_time": "1:23:49", "throughput": 2319.4, "total_tokens": 27058632} {"current_steps": 46920, "total_steps": 67140, "loss": 0.6647, "lr": 1.2589030161459275e-05, "epoch": 6.988382484361036, "percentage": 69.88, "elapsed_time": "3:14:27", "remaining_time": "1:23:47", "throughput": 2319.42, "total_tokens": 27061480} {"current_steps": 46925, "total_steps": 67140, "loss": 0.5072, "lr": 1.2583389119071659e-05, "epoch": 6.989127196901996, "percentage": 69.89, "elapsed_time": "3:14:28", "remaining_time": "1:23:46", "throughput": 2319.44, "total_tokens": 27064328} {"current_steps": 46930, "total_steps": 67140, "loss": 0.5646, "lr": 1.2577748915748127e-05, "epoch": 6.989871909442955, "percentage": 69.9, "elapsed_time": "3:14:29", "remaining_time": "1:23:45", "throughput": 2319.47, "total_tokens": 27067336} {"current_steps": 46935, "total_steps": 67140, "loss": 0.7531, "lr": 1.2572109551869815e-05, "epoch": 6.990616621983914, "percentage": 69.91, "elapsed_time": "3:14:30", "remaining_time": "1:23:44", "throughput": 2319.49, "total_tokens": 27070120} {"current_steps": 46940, "total_steps": 67140, "loss": 0.6499, "lr": 1.2566471027817817e-05, "epoch": 6.991361334524873, "percentage": 69.91, "elapsed_time": "3:14:31", "remaining_time": "1:23:42", "throughput": 2319.51, "total_tokens": 27073064} {"current_steps": 46945, "total_steps": 67140, "loss": 0.5034, "lr": 1.256083334397315e-05, "epoch": 6.992106047065833, "percentage": 69.92, "elapsed_time": "3:14:32", "remaining_time": "1:23:41", "throughput": 2319.53, "total_tokens": 27075784} {"current_steps": 46950, "total_steps": 67140, "loss": 0.7518, "lr": 1.2555196500716803e-05, "epoch": 6.9928507596067915, "percentage": 69.93, "elapsed_time": "3:14:34", "remaining_time": "1:23:40", "throughput": 2319.56, "total_tokens": 27078856} {"current_steps": 46955, "total_steps": 67140, "loss": 0.5071, "lr": 1.2549560498429683e-05, "epoch": 6.993595472147751, "percentage": 69.94, "elapsed_time": "3:14:35", "remaining_time": "1:23:38", "throughput": 2319.59, "total_tokens": 27081992} {"current_steps": 46960, "total_steps": 67140, "loss": 0.5957, "lr": 1.2543925337492631e-05, "epoch": 6.99434018468871, "percentage": 69.94, "elapsed_time": "3:14:36", "remaining_time": "1:23:37", "throughput": 2319.61, "total_tokens": 27084840} {"current_steps": 46965, "total_steps": 67140, "loss": 0.5566, "lr": 1.2538291018286462e-05, "epoch": 6.9950848972296695, "percentage": 69.95, "elapsed_time": "3:14:37", "remaining_time": "1:23:36", "throughput": 2319.63, "total_tokens": 27087688} {"current_steps": 46970, "total_steps": 67140, "loss": 0.6397, "lr": 1.2532657541191922e-05, "epoch": 6.995829609770628, "percentage": 69.96, "elapsed_time": "3:14:38", "remaining_time": "1:23:35", "throughput": 2319.66, "total_tokens": 27090760} {"current_steps": 46975, "total_steps": 67140, "loss": 0.5122, "lr": 1.2527024906589698e-05, "epoch": 6.996574322311588, "percentage": 69.97, "elapsed_time": "3:14:39", "remaining_time": "1:23:33", "throughput": 2319.68, "total_tokens": 27093640} {"current_steps": 46980, "total_steps": 67140, "loss": 0.5139, "lr": 1.252139311486042e-05, "epoch": 6.997319034852547, "percentage": 69.97, "elapsed_time": "3:14:41", "remaining_time": "1:23:32", "throughput": 2319.72, "total_tokens": 27096840} {"current_steps": 46985, "total_steps": 67140, "loss": 0.5692, "lr": 1.2515762166384668e-05, "epoch": 6.998063747393506, "percentage": 69.98, "elapsed_time": "3:14:42", "remaining_time": "1:23:31", "throughput": 2319.76, "total_tokens": 27099976} {"current_steps": 46990, "total_steps": 67140, "loss": 0.6966, "lr": 1.2510132061542939e-05, "epoch": 6.998808459934465, "percentage": 69.99, "elapsed_time": "3:14:43", "remaining_time": "1:23:30", "throughput": 2319.79, "total_tokens": 27103112} {"current_steps": 46995, "total_steps": 67140, "loss": 0.6635, "lr": 1.2504502800715723e-05, "epoch": 6.999553172475425, "percentage": 70.0, "elapsed_time": "3:14:44", "remaining_time": "1:23:28", "throughput": 2319.82, "total_tokens": 27106056} {"current_steps": 46998, "total_steps": 67140, "eval_loss": 0.6671453714370728, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "3:15:59", "remaining_time": "1:23:59", "throughput": 2305.16, "total_tokens": 27107328} {"current_steps": 47000, "total_steps": 67140, "loss": 0.7574, "lr": 1.2498874384283389e-05, "epoch": 7.0002978850163835, "percentage": 70.0, "elapsed_time": "3:16:01", "remaining_time": "1:24:00", "throughput": 2304.81, "total_tokens": 27108544} {"current_steps": 47005, "total_steps": 67140, "loss": 0.6061, "lr": 1.24932468126263e-05, "epoch": 7.001042597557343, "percentage": 70.01, "elapsed_time": "3:16:02", "remaining_time": "1:23:58", "throughput": 2304.83, "total_tokens": 27111360} {"current_steps": 47010, "total_steps": 67140, "loss": 0.5041, "lr": 1.248762008612474e-05, "epoch": 7.001787310098302, "percentage": 70.02, "elapsed_time": "3:16:03", "remaining_time": "1:23:57", "throughput": 2304.84, "total_tokens": 27114080} {"current_steps": 47015, "total_steps": 67140, "loss": 0.5633, "lr": 1.2481994205158948e-05, "epoch": 7.0025320226392616, "percentage": 70.03, "elapsed_time": "3:16:05", "remaining_time": "1:23:56", "throughput": 2304.88, "total_tokens": 27117216} {"current_steps": 47020, "total_steps": 67140, "loss": 0.579, "lr": 1.2476369170109098e-05, "epoch": 7.00327673518022, "percentage": 70.03, "elapsed_time": "3:16:06", "remaining_time": "1:23:54", "throughput": 2304.88, "total_tokens": 27119840} {"current_steps": 47025, "total_steps": 67140, "loss": 0.4027, "lr": 1.2470744981355296e-05, "epoch": 7.00402144772118, "percentage": 70.04, "elapsed_time": "3:16:07", "remaining_time": "1:23:53", "throughput": 2304.89, "total_tokens": 27122528} {"current_steps": 47030, "total_steps": 67140, "loss": 0.5654, "lr": 1.2465121639277605e-05, "epoch": 7.004766160262139, "percentage": 70.05, "elapsed_time": "3:16:08", "remaining_time": "1:23:52", "throughput": 2304.92, "total_tokens": 27125472} {"current_steps": 47035, "total_steps": 67140, "loss": 0.7079, "lr": 1.2459499144256042e-05, "epoch": 7.005510872803098, "percentage": 70.06, "elapsed_time": "3:16:09", "remaining_time": "1:23:50", "throughput": 2304.96, "total_tokens": 27128704} {"current_steps": 47040, "total_steps": 67140, "loss": 0.5557, "lr": 1.2453877496670532e-05, "epoch": 7.006255585344057, "percentage": 70.06, "elapsed_time": "3:16:10", "remaining_time": "1:23:49", "throughput": 2304.99, "total_tokens": 27131712} {"current_steps": 47045, "total_steps": 67140, "loss": 0.5275, "lr": 1.244825669690097e-05, "epoch": 7.007000297885017, "percentage": 70.07, "elapsed_time": "3:16:12", "remaining_time": "1:23:48", "throughput": 2305.02, "total_tokens": 27134688} {"current_steps": 47050, "total_steps": 67140, "loss": 0.6447, "lr": 1.24426367453272e-05, "epoch": 7.0077450104259755, "percentage": 70.08, "elapsed_time": "3:16:13", "remaining_time": "1:23:47", "throughput": 2305.04, "total_tokens": 27137632} {"current_steps": 47055, "total_steps": 67140, "loss": 0.7815, "lr": 1.2437017642328971e-05, "epoch": 7.008489722966935, "percentage": 70.08, "elapsed_time": "3:16:14", "remaining_time": "1:23:45", "throughput": 2305.06, "total_tokens": 27140448} {"current_steps": 47060, "total_steps": 67140, "loss": 0.6217, "lr": 1.2431399388286017e-05, "epoch": 7.009234435507894, "percentage": 70.09, "elapsed_time": "3:16:15", "remaining_time": "1:23:44", "throughput": 2305.08, "total_tokens": 27143328} {"current_steps": 47065, "total_steps": 67140, "loss": 0.5499, "lr": 1.242578198357799e-05, "epoch": 7.009979148048854, "percentage": 70.1, "elapsed_time": "3:16:16", "remaining_time": "1:23:43", "throughput": 2305.1, "total_tokens": 27146144} {"current_steps": 47070, "total_steps": 67140, "loss": 0.5463, "lr": 1.2420165428584493e-05, "epoch": 7.010723860589812, "percentage": 70.11, "elapsed_time": "3:16:17", "remaining_time": "1:23:41", "throughput": 2305.12, "total_tokens": 27148864} {"current_steps": 47075, "total_steps": 67140, "loss": 0.6384, "lr": 1.2414549723685082e-05, "epoch": 7.011468573130771, "percentage": 70.11, "elapsed_time": "3:16:18", "remaining_time": "1:23:40", "throughput": 2305.17, "total_tokens": 27152288} {"current_steps": 47080, "total_steps": 67140, "loss": 0.8501, "lr": 1.240893486925922e-05, "epoch": 7.012213285671731, "percentage": 70.12, "elapsed_time": "3:16:20", "remaining_time": "1:23:39", "throughput": 2305.2, "total_tokens": 27155264} {"current_steps": 47085, "total_steps": 67140, "loss": 0.6273, "lr": 1.2403320865686361e-05, "epoch": 7.0129579982126895, "percentage": 70.13, "elapsed_time": "3:16:21", "remaining_time": "1:23:37", "throughput": 2305.21, "total_tokens": 27157920} {"current_steps": 47090, "total_steps": 67140, "loss": 0.6466, "lr": 1.239770771334585e-05, "epoch": 7.013702710753649, "percentage": 70.14, "elapsed_time": "3:16:22", "remaining_time": "1:23:36", "throughput": 2305.25, "total_tokens": 27161216} {"current_steps": 47095, "total_steps": 67140, "loss": 0.3434, "lr": 1.2392095412617017e-05, "epoch": 7.014447423294608, "percentage": 70.14, "elapsed_time": "3:16:23", "remaining_time": "1:23:35", "throughput": 2305.28, "total_tokens": 27164256} {"current_steps": 47100, "total_steps": 67140, "loss": 0.6365, "lr": 1.2386483963879114e-05, "epoch": 7.0151921358355676, "percentage": 70.15, "elapsed_time": "3:16:24", "remaining_time": "1:23:34", "throughput": 2305.3, "total_tokens": 27167168} {"current_steps": 47105, "total_steps": 67140, "loss": 0.5574, "lr": 1.2380873367511344e-05, "epoch": 7.015936848376526, "percentage": 70.16, "elapsed_time": "3:16:25", "remaining_time": "1:23:32", "throughput": 2305.31, "total_tokens": 27169824} {"current_steps": 47110, "total_steps": 67140, "loss": 0.5547, "lr": 1.2375263623892846e-05, "epoch": 7.016681560917486, "percentage": 70.17, "elapsed_time": "3:16:26", "remaining_time": "1:23:31", "throughput": 2305.33, "total_tokens": 27172544} {"current_steps": 47115, "total_steps": 67140, "loss": 0.5239, "lr": 1.2369654733402714e-05, "epoch": 7.017426273458445, "percentage": 70.17, "elapsed_time": "3:16:28", "remaining_time": "1:23:30", "throughput": 2305.36, "total_tokens": 27175712} {"current_steps": 47120, "total_steps": 67140, "loss": 0.4587, "lr": 1.2364046696419962e-05, "epoch": 7.018170985999404, "percentage": 70.18, "elapsed_time": "3:16:29", "remaining_time": "1:23:28", "throughput": 2305.37, "total_tokens": 27178368} {"current_steps": 47125, "total_steps": 67140, "loss": 0.5632, "lr": 1.235843951332355e-05, "epoch": 7.018915698540363, "percentage": 70.19, "elapsed_time": "3:16:30", "remaining_time": "1:23:27", "throughput": 2305.38, "total_tokens": 27181120} {"current_steps": 47130, "total_steps": 67140, "loss": 0.6324, "lr": 1.2352833184492402e-05, "epoch": 7.019660411081323, "percentage": 70.2, "elapsed_time": "3:16:31", "remaining_time": "1:23:26", "throughput": 2305.39, "total_tokens": 27183744} {"current_steps": 47135, "total_steps": 67140, "loss": 0.5748, "lr": 1.2347227710305365e-05, "epoch": 7.0204051236222815, "percentage": 70.2, "elapsed_time": "3:16:32", "remaining_time": "1:23:24", "throughput": 2305.42, "total_tokens": 27186784} {"current_steps": 47140, "total_steps": 67140, "loss": 0.4788, "lr": 1.2341623091141238e-05, "epoch": 7.021149836163241, "percentage": 70.21, "elapsed_time": "3:16:33", "remaining_time": "1:23:23", "throughput": 2305.44, "total_tokens": 27189600} {"current_steps": 47145, "total_steps": 67140, "loss": 0.7464, "lr": 1.2336019327378756e-05, "epoch": 7.0218945487042, "percentage": 70.22, "elapsed_time": "3:16:34", "remaining_time": "1:23:22", "throughput": 2305.46, "total_tokens": 27192480} {"current_steps": 47150, "total_steps": 67140, "loss": 0.4004, "lr": 1.2330416419396612e-05, "epoch": 7.02263926124516, "percentage": 70.23, "elapsed_time": "3:16:35", "remaining_time": "1:23:21", "throughput": 2305.48, "total_tokens": 27195296} {"current_steps": 47155, "total_steps": 67140, "loss": 0.5901, "lr": 1.2324814367573411e-05, "epoch": 7.023383973786118, "percentage": 70.23, "elapsed_time": "3:16:37", "remaining_time": "1:23:19", "throughput": 2305.52, "total_tokens": 27198592} {"current_steps": 47160, "total_steps": 67140, "loss": 0.484, "lr": 1.2319213172287716e-05, "epoch": 7.024128686327078, "percentage": 70.24, "elapsed_time": "3:16:38", "remaining_time": "1:23:18", "throughput": 2305.56, "total_tokens": 27201824} {"current_steps": 47165, "total_steps": 67140, "loss": 0.6545, "lr": 1.231361283391804e-05, "epoch": 7.024873398868037, "percentage": 70.25, "elapsed_time": "3:16:39", "remaining_time": "1:23:17", "throughput": 2305.58, "total_tokens": 27204576} {"current_steps": 47170, "total_steps": 67140, "loss": 0.6098, "lr": 1.2308013352842826e-05, "epoch": 7.025618111408996, "percentage": 70.26, "elapsed_time": "3:16:40", "remaining_time": "1:23:15", "throughput": 2305.6, "total_tokens": 27207488} {"current_steps": 47175, "total_steps": 67140, "loss": 0.6857, "lr": 1.230241472944047e-05, "epoch": 7.026362823949955, "percentage": 70.26, "elapsed_time": "3:16:41", "remaining_time": "1:23:14", "throughput": 2305.62, "total_tokens": 27210336} {"current_steps": 47180, "total_steps": 67140, "loss": 0.5825, "lr": 1.22968169640893e-05, "epoch": 7.027107536490915, "percentage": 70.27, "elapsed_time": "3:16:42", "remaining_time": "1:23:13", "throughput": 2305.66, "total_tokens": 27213536} {"current_steps": 47185, "total_steps": 67140, "loss": 0.7198, "lr": 1.2291220057167602e-05, "epoch": 7.0278522490318736, "percentage": 70.28, "elapsed_time": "3:16:44", "remaining_time": "1:23:12", "throughput": 2305.67, "total_tokens": 27216288} {"current_steps": 47190, "total_steps": 67140, "loss": 0.8069, "lr": 1.2285624009053573e-05, "epoch": 7.028596961572833, "percentage": 70.29, "elapsed_time": "3:16:45", "remaining_time": "1:23:10", "throughput": 2305.69, "total_tokens": 27219072} {"current_steps": 47195, "total_steps": 67140, "loss": 0.4916, "lr": 1.2280028820125391e-05, "epoch": 7.029341674113792, "percentage": 70.29, "elapsed_time": "3:16:46", "remaining_time": "1:23:09", "throughput": 2305.72, "total_tokens": 27222016} {"current_steps": 47200, "total_steps": 67140, "loss": 0.6295, "lr": 1.2274434490761135e-05, "epoch": 7.030086386654752, "percentage": 70.3, "elapsed_time": "3:16:47", "remaining_time": "1:23:08", "throughput": 2305.74, "total_tokens": 27224960} {"current_steps": 47205, "total_steps": 67140, "loss": 0.509, "lr": 1.226884102133886e-05, "epoch": 7.03083109919571, "percentage": 70.31, "elapsed_time": "3:16:48", "remaining_time": "1:23:06", "throughput": 2305.77, "total_tokens": 27228000} {"current_steps": 47210, "total_steps": 67140, "loss": 0.5151, "lr": 1.2263248412236547e-05, "epoch": 7.03157581173667, "percentage": 70.32, "elapsed_time": "3:16:49", "remaining_time": "1:23:05", "throughput": 2305.79, "total_tokens": 27230688} {"current_steps": 47215, "total_steps": 67140, "loss": 0.6981, "lr": 1.2257656663832129e-05, "epoch": 7.032320524277629, "percentage": 70.32, "elapsed_time": "3:16:50", "remaining_time": "1:23:04", "throughput": 2305.79, "total_tokens": 27233152} {"current_steps": 47220, "total_steps": 67140, "loss": 0.5449, "lr": 1.225206577650346e-05, "epoch": 7.033065236818588, "percentage": 70.33, "elapsed_time": "3:16:52", "remaining_time": "1:23:02", "throughput": 2305.84, "total_tokens": 27236576} {"current_steps": 47225, "total_steps": 67140, "loss": 0.3806, "lr": 1.2246475750628355e-05, "epoch": 7.033809949359547, "percentage": 70.34, "elapsed_time": "3:16:53", "remaining_time": "1:23:01", "throughput": 2305.85, "total_tokens": 27239232} {"current_steps": 47230, "total_steps": 67140, "loss": 0.5668, "lr": 1.2240886586584568e-05, "epoch": 7.034554661900507, "percentage": 70.35, "elapsed_time": "3:16:54", "remaining_time": "1:23:00", "throughput": 2305.87, "total_tokens": 27242048} {"current_steps": 47235, "total_steps": 67140, "loss": 0.617, "lr": 1.2235298284749803e-05, "epoch": 7.035299374441466, "percentage": 70.35, "elapsed_time": "3:16:55", "remaining_time": "1:22:59", "throughput": 2305.88, "total_tokens": 27244800} {"current_steps": 47240, "total_steps": 67140, "loss": 0.5339, "lr": 1.2229710845501669e-05, "epoch": 7.036044086982425, "percentage": 70.36, "elapsed_time": "3:16:56", "remaining_time": "1:22:57", "throughput": 2305.89, "total_tokens": 27247584} {"current_steps": 47245, "total_steps": 67140, "loss": 0.4686, "lr": 1.2224124269217756e-05, "epoch": 7.036788799523384, "percentage": 70.37, "elapsed_time": "3:16:57", "remaining_time": "1:22:56", "throughput": 2305.92, "total_tokens": 27250464} {"current_steps": 47250, "total_steps": 67140, "loss": 0.5598, "lr": 1.2218538556275594e-05, "epoch": 7.037533512064343, "percentage": 70.38, "elapsed_time": "3:16:58", "remaining_time": "1:22:55", "throughput": 2305.93, "total_tokens": 27253216} {"current_steps": 47255, "total_steps": 67140, "loss": 0.4215, "lr": 1.2212953707052619e-05, "epoch": 7.038278224605302, "percentage": 70.38, "elapsed_time": "3:16:59", "remaining_time": "1:22:53", "throughput": 2305.95, "total_tokens": 27256064} {"current_steps": 47260, "total_steps": 67140, "loss": 0.6144, "lr": 1.2207369721926243e-05, "epoch": 7.039022937146261, "percentage": 70.39, "elapsed_time": "3:17:01", "remaining_time": "1:22:52", "throughput": 2305.98, "total_tokens": 27259040} {"current_steps": 47265, "total_steps": 67140, "loss": 0.4105, "lr": 1.2201786601273813e-05, "epoch": 7.039767649687221, "percentage": 70.4, "elapsed_time": "3:17:02", "remaining_time": "1:22:51", "throughput": 2306.0, "total_tokens": 27261888} {"current_steps": 47270, "total_steps": 67140, "loss": 0.6548, "lr": 1.2196204345472609e-05, "epoch": 7.0405123622281796, "percentage": 70.41, "elapsed_time": "3:17:03", "remaining_time": "1:22:49", "throughput": 2306.01, "total_tokens": 27264544} {"current_steps": 47275, "total_steps": 67140, "loss": 0.9148, "lr": 1.2190622954899869e-05, "epoch": 7.041257074769139, "percentage": 70.41, "elapsed_time": "3:17:04", "remaining_time": "1:22:48", "throughput": 2306.03, "total_tokens": 27267392} {"current_steps": 47280, "total_steps": 67140, "loss": 0.4991, "lr": 1.218504242993274e-05, "epoch": 7.042001787310098, "percentage": 70.42, "elapsed_time": "3:17:05", "remaining_time": "1:22:47", "throughput": 2306.04, "total_tokens": 27270112} {"current_steps": 47285, "total_steps": 67140, "loss": 0.5842, "lr": 1.2179462770948355e-05, "epoch": 7.042746499851058, "percentage": 70.43, "elapsed_time": "3:17:06", "remaining_time": "1:22:46", "throughput": 2306.05, "total_tokens": 27272800} {"current_steps": 47290, "total_steps": 67140, "loss": 0.474, "lr": 1.2173883978323739e-05, "epoch": 7.043491212392016, "percentage": 70.43, "elapsed_time": "3:17:07", "remaining_time": "1:22:44", "throughput": 2306.06, "total_tokens": 27275424} {"current_steps": 47295, "total_steps": 67140, "loss": 0.6386, "lr": 1.2168306052435896e-05, "epoch": 7.044235924932976, "percentage": 70.44, "elapsed_time": "3:17:08", "remaining_time": "1:22:43", "throughput": 2306.09, "total_tokens": 27278592} {"current_steps": 47300, "total_steps": 67140, "loss": 0.4769, "lr": 1.216272899366176e-05, "epoch": 7.044980637473935, "percentage": 70.45, "elapsed_time": "3:17:10", "remaining_time": "1:22:42", "throughput": 2306.14, "total_tokens": 27281984} {"current_steps": 47305, "total_steps": 67140, "loss": 0.6989, "lr": 1.2157152802378207e-05, "epoch": 7.045725350014894, "percentage": 70.46, "elapsed_time": "3:17:11", "remaining_time": "1:22:40", "throughput": 2306.16, "total_tokens": 27284832} {"current_steps": 47310, "total_steps": 67140, "loss": 0.7008, "lr": 1.2151577478962054e-05, "epoch": 7.046470062555853, "percentage": 70.46, "elapsed_time": "3:17:12", "remaining_time": "1:22:39", "throughput": 2306.19, "total_tokens": 27287808} {"current_steps": 47315, "total_steps": 67140, "loss": 0.7541, "lr": 1.2146003023790064e-05, "epoch": 7.047214775096813, "percentage": 70.47, "elapsed_time": "3:17:13", "remaining_time": "1:22:38", "throughput": 2306.21, "total_tokens": 27290592} {"current_steps": 47320, "total_steps": 67140, "loss": 0.5134, "lr": 1.2140429437238932e-05, "epoch": 7.047959487637772, "percentage": 70.48, "elapsed_time": "3:17:14", "remaining_time": "1:22:36", "throughput": 2306.22, "total_tokens": 27293248} {"current_steps": 47325, "total_steps": 67140, "loss": 0.7908, "lr": 1.213485671968528e-05, "epoch": 7.048704200178731, "percentage": 70.49, "elapsed_time": "3:17:15", "remaining_time": "1:22:35", "throughput": 2306.26, "total_tokens": 27296512} {"current_steps": 47330, "total_steps": 67140, "loss": 0.6907, "lr": 1.2129284871505712e-05, "epoch": 7.04944891271969, "percentage": 70.49, "elapsed_time": "3:17:16", "remaining_time": "1:22:34", "throughput": 2306.28, "total_tokens": 27299360} {"current_steps": 47335, "total_steps": 67140, "loss": 0.707, "lr": 1.2123713893076741e-05, "epoch": 7.05019362526065, "percentage": 70.5, "elapsed_time": "3:17:18", "remaining_time": "1:22:33", "throughput": 2306.31, "total_tokens": 27302336} {"current_steps": 47340, "total_steps": 67140, "loss": 0.4242, "lr": 1.2118143784774832e-05, "epoch": 7.050938337801608, "percentage": 70.51, "elapsed_time": "3:17:19", "remaining_time": "1:22:31", "throughput": 2306.34, "total_tokens": 27305344} {"current_steps": 47345, "total_steps": 67140, "loss": 0.7087, "lr": 1.2112574546976397e-05, "epoch": 7.051683050342568, "percentage": 70.52, "elapsed_time": "3:17:20", "remaining_time": "1:22:30", "throughput": 2306.36, "total_tokens": 27308128} {"current_steps": 47350, "total_steps": 67140, "loss": 0.5685, "lr": 1.210700618005778e-05, "epoch": 7.052427762883527, "percentage": 70.52, "elapsed_time": "3:17:21", "remaining_time": "1:22:29", "throughput": 2306.37, "total_tokens": 27310784} {"current_steps": 47355, "total_steps": 67140, "loss": 0.3912, "lr": 1.2101438684395264e-05, "epoch": 7.053172475424486, "percentage": 70.53, "elapsed_time": "3:17:22", "remaining_time": "1:22:27", "throughput": 2306.38, "total_tokens": 27313536} {"current_steps": 47360, "total_steps": 67140, "loss": 0.6335, "lr": 1.2095872060365084e-05, "epoch": 7.053917187965445, "percentage": 70.54, "elapsed_time": "3:17:23", "remaining_time": "1:22:26", "throughput": 2306.4, "total_tokens": 27316416} {"current_steps": 47365, "total_steps": 67140, "loss": 0.6232, "lr": 1.20903063083434e-05, "epoch": 7.054661900506405, "percentage": 70.55, "elapsed_time": "3:17:24", "remaining_time": "1:22:25", "throughput": 2306.42, "total_tokens": 27319264} {"current_steps": 47370, "total_steps": 67140, "loss": 0.4663, "lr": 1.2084741428706328e-05, "epoch": 7.055406613047364, "percentage": 70.55, "elapsed_time": "3:17:25", "remaining_time": "1:22:23", "throughput": 2306.44, "total_tokens": 27322080} {"current_steps": 47375, "total_steps": 67140, "loss": 0.5462, "lr": 1.207917742182992e-05, "epoch": 7.056151325588323, "percentage": 70.56, "elapsed_time": "3:17:27", "remaining_time": "1:22:22", "throughput": 2306.47, "total_tokens": 27325056} {"current_steps": 47380, "total_steps": 67140, "loss": 0.688, "lr": 1.2073614288090179e-05, "epoch": 7.056896038129282, "percentage": 70.57, "elapsed_time": "3:17:28", "remaining_time": "1:22:21", "throughput": 2306.48, "total_tokens": 27327840} {"current_steps": 47385, "total_steps": 67140, "loss": 0.5486, "lr": 1.206805202786302e-05, "epoch": 7.057640750670242, "percentage": 70.58, "elapsed_time": "3:17:29", "remaining_time": "1:22:20", "throughput": 2306.51, "total_tokens": 27330720} {"current_steps": 47390, "total_steps": 67140, "loss": 0.7091, "lr": 1.2062490641524327e-05, "epoch": 7.0583854632112, "percentage": 70.58, "elapsed_time": "3:17:30", "remaining_time": "1:22:18", "throughput": 2306.52, "total_tokens": 27333536} {"current_steps": 47395, "total_steps": 67140, "loss": 0.3706, "lr": 1.2056930129449918e-05, "epoch": 7.05913017575216, "percentage": 70.59, "elapsed_time": "3:17:31", "remaining_time": "1:22:17", "throughput": 2306.55, "total_tokens": 27336416} {"current_steps": 47400, "total_steps": 67140, "loss": 0.4784, "lr": 1.2051370492015556e-05, "epoch": 7.059874888293119, "percentage": 70.6, "elapsed_time": "3:17:32", "remaining_time": "1:22:16", "throughput": 2306.55, "total_tokens": 27339040} {"current_steps": 47405, "total_steps": 67140, "loss": 0.5616, "lr": 1.2045811729596922e-05, "epoch": 7.0606196008340785, "percentage": 70.61, "elapsed_time": "3:17:33", "remaining_time": "1:22:14", "throughput": 2306.58, "total_tokens": 27342016} {"current_steps": 47410, "total_steps": 67140, "loss": 0.5593, "lr": 1.2040253842569665e-05, "epoch": 7.061364313375037, "percentage": 70.61, "elapsed_time": "3:17:35", "remaining_time": "1:22:13", "throughput": 2306.59, "total_tokens": 27344768} {"current_steps": 47415, "total_steps": 67140, "loss": 0.5489, "lr": 1.2034696831309369e-05, "epoch": 7.062109025915996, "percentage": 70.62, "elapsed_time": "3:17:36", "remaining_time": "1:22:12", "throughput": 2306.63, "total_tokens": 27347776} {"current_steps": 47420, "total_steps": 67140, "loss": 0.5417, "lr": 1.202914069619154e-05, "epoch": 7.062853738456956, "percentage": 70.63, "elapsed_time": "3:17:37", "remaining_time": "1:22:10", "throughput": 2306.65, "total_tokens": 27350752} {"current_steps": 47425, "total_steps": 67140, "loss": 0.6523, "lr": 1.202358543759165e-05, "epoch": 7.063598450997914, "percentage": 70.64, "elapsed_time": "3:17:38", "remaining_time": "1:22:09", "throughput": 2306.67, "total_tokens": 27353504} {"current_steps": 47430, "total_steps": 67140, "loss": 0.5954, "lr": 1.2018031055885093e-05, "epoch": 7.064343163538874, "percentage": 70.64, "elapsed_time": "3:17:39", "remaining_time": "1:22:08", "throughput": 2306.7, "total_tokens": 27356448} {"current_steps": 47435, "total_steps": 67140, "loss": 0.5034, "lr": 1.2012477551447222e-05, "epoch": 7.065087876079833, "percentage": 70.65, "elapsed_time": "3:17:40", "remaining_time": "1:22:07", "throughput": 2306.7, "total_tokens": 27359040} {"current_steps": 47440, "total_steps": 67140, "loss": 0.6112, "lr": 1.2006924924653318e-05, "epoch": 7.065832588620792, "percentage": 70.66, "elapsed_time": "3:17:41", "remaining_time": "1:22:05", "throughput": 2306.72, "total_tokens": 27361824} {"current_steps": 47445, "total_steps": 67140, "loss": 0.5048, "lr": 1.2001373175878597e-05, "epoch": 7.066577301161751, "percentage": 70.67, "elapsed_time": "3:17:42", "remaining_time": "1:22:04", "throughput": 2306.76, "total_tokens": 27364960} {"current_steps": 47450, "total_steps": 67140, "loss": 0.757, "lr": 1.1995822305498233e-05, "epoch": 7.067322013702711, "percentage": 70.67, "elapsed_time": "3:17:44", "remaining_time": "1:22:03", "throughput": 2306.78, "total_tokens": 27367840} {"current_steps": 47455, "total_steps": 67140, "loss": 0.5516, "lr": 1.1990272313887321e-05, "epoch": 7.06806672624367, "percentage": 70.68, "elapsed_time": "3:17:45", "remaining_time": "1:22:01", "throughput": 2306.78, "total_tokens": 27370368} {"current_steps": 47460, "total_steps": 67140, "loss": 0.7957, "lr": 1.1984723201420911e-05, "epoch": 7.068811438784629, "percentage": 70.69, "elapsed_time": "3:17:46", "remaining_time": "1:22:00", "throughput": 2306.8, "total_tokens": 27373216} {"current_steps": 47465, "total_steps": 67140, "loss": 0.4907, "lr": 1.1979174968473991e-05, "epoch": 7.069556151325588, "percentage": 70.7, "elapsed_time": "3:17:47", "remaining_time": "1:21:59", "throughput": 2306.82, "total_tokens": 27376160} {"current_steps": 47470, "total_steps": 67140, "loss": 0.5007, "lr": 1.1973627615421487e-05, "epoch": 7.070300863866548, "percentage": 70.7, "elapsed_time": "3:17:48", "remaining_time": "1:21:57", "throughput": 2306.87, "total_tokens": 27379424} {"current_steps": 47475, "total_steps": 67140, "loss": 0.4895, "lr": 1.1968081142638268e-05, "epoch": 7.071045576407506, "percentage": 70.71, "elapsed_time": "3:17:49", "remaining_time": "1:21:56", "throughput": 2306.88, "total_tokens": 27382240} {"current_steps": 47480, "total_steps": 67140, "loss": 0.6742, "lr": 1.1962535550499152e-05, "epoch": 7.071790288948466, "percentage": 70.72, "elapsed_time": "3:17:50", "remaining_time": "1:21:55", "throughput": 2306.92, "total_tokens": 27385312} {"current_steps": 47485, "total_steps": 67140, "loss": 0.5551, "lr": 1.1956990839378877e-05, "epoch": 7.072535001489425, "percentage": 70.73, "elapsed_time": "3:17:52", "remaining_time": "1:21:54", "throughput": 2306.93, "total_tokens": 27388064} {"current_steps": 47490, "total_steps": 67140, "loss": 0.5465, "lr": 1.1951447009652119e-05, "epoch": 7.0732797140303845, "percentage": 70.73, "elapsed_time": "3:17:53", "remaining_time": "1:21:52", "throughput": 2306.96, "total_tokens": 27391136} {"current_steps": 47495, "total_steps": 67140, "loss": 0.6061, "lr": 1.1945904061693524e-05, "epoch": 7.074024426571343, "percentage": 70.74, "elapsed_time": "3:17:54", "remaining_time": "1:21:51", "throughput": 2306.98, "total_tokens": 27393824} {"current_steps": 47500, "total_steps": 67140, "loss": 0.5006, "lr": 1.1940361995877658e-05, "epoch": 7.074769139112303, "percentage": 70.75, "elapsed_time": "3:17:55", "remaining_time": "1:21:50", "throughput": 2307.0, "total_tokens": 27396704} {"current_steps": 47505, "total_steps": 67140, "loss": 0.6376, "lr": 1.1934820812579031e-05, "epoch": 7.075513851653262, "percentage": 70.76, "elapsed_time": "3:17:56", "remaining_time": "1:21:48", "throughput": 2307.02, "total_tokens": 27399616} {"current_steps": 47510, "total_steps": 67140, "loss": 0.5219, "lr": 1.1929280512172095e-05, "epoch": 7.076258564194221, "percentage": 70.76, "elapsed_time": "3:17:57", "remaining_time": "1:21:47", "throughput": 2307.04, "total_tokens": 27402496} {"current_steps": 47515, "total_steps": 67140, "loss": 0.5641, "lr": 1.1923741095031248e-05, "epoch": 7.07700327673518, "percentage": 70.77, "elapsed_time": "3:17:58", "remaining_time": "1:21:46", "throughput": 2307.06, "total_tokens": 27405280} {"current_steps": 47520, "total_steps": 67140, "loss": 0.6617, "lr": 1.1918202561530813e-05, "epoch": 7.07774798927614, "percentage": 70.78, "elapsed_time": "3:18:00", "remaining_time": "1:21:45", "throughput": 2307.09, "total_tokens": 27408320} {"current_steps": 47525, "total_steps": 67140, "loss": 0.5139, "lr": 1.1912664912045057e-05, "epoch": 7.078492701817098, "percentage": 70.78, "elapsed_time": "3:18:01", "remaining_time": "1:21:43", "throughput": 2307.12, "total_tokens": 27411360} {"current_steps": 47530, "total_steps": 67140, "loss": 0.6156, "lr": 1.1907128146948193e-05, "epoch": 7.079237414358058, "percentage": 70.79, "elapsed_time": "3:18:02", "remaining_time": "1:21:42", "throughput": 2307.15, "total_tokens": 27414336} {"current_steps": 47535, "total_steps": 67140, "loss": 0.6039, "lr": 1.190159226661438e-05, "epoch": 7.079982126899017, "percentage": 70.8, "elapsed_time": "3:18:03", "remaining_time": "1:21:41", "throughput": 2307.17, "total_tokens": 27417088} {"current_steps": 47540, "total_steps": 67140, "loss": 0.3998, "lr": 1.1896057271417707e-05, "epoch": 7.0807268394399765, "percentage": 70.81, "elapsed_time": "3:18:04", "remaining_time": "1:21:39", "throughput": 2307.18, "total_tokens": 27419840} {"current_steps": 47545, "total_steps": 67140, "loss": 0.4436, "lr": 1.1890523161732214e-05, "epoch": 7.081471551980935, "percentage": 70.81, "elapsed_time": "3:18:05", "remaining_time": "1:21:38", "throughput": 2307.2, "total_tokens": 27422752} {"current_steps": 47550, "total_steps": 67140, "loss": 0.4339, "lr": 1.188498993793186e-05, "epoch": 7.082216264521895, "percentage": 70.82, "elapsed_time": "3:18:06", "remaining_time": "1:21:37", "throughput": 2307.22, "total_tokens": 27425568} {"current_steps": 47555, "total_steps": 67140, "loss": 0.5551, "lr": 1.187945760039056e-05, "epoch": 7.082960977062854, "percentage": 70.83, "elapsed_time": "3:18:08", "remaining_time": "1:21:35", "throughput": 2307.26, "total_tokens": 27428672} {"current_steps": 47560, "total_steps": 67140, "loss": 0.7793, "lr": 1.1873926149482183e-05, "epoch": 7.083705689603813, "percentage": 70.84, "elapsed_time": "3:18:09", "remaining_time": "1:21:34", "throughput": 2307.26, "total_tokens": 27431232} {"current_steps": 47565, "total_steps": 67140, "loss": 0.6724, "lr": 1.1868395585580503e-05, "epoch": 7.084450402144772, "percentage": 70.84, "elapsed_time": "3:18:10", "remaining_time": "1:21:33", "throughput": 2307.28, "total_tokens": 27434144} {"current_steps": 47570, "total_steps": 67140, "loss": 0.5534, "lr": 1.186286590905926e-05, "epoch": 7.085195114685732, "percentage": 70.85, "elapsed_time": "3:18:11", "remaining_time": "1:21:32", "throughput": 2307.33, "total_tokens": 27437408} {"current_steps": 47575, "total_steps": 67140, "loss": 0.6297, "lr": 1.1857337120292123e-05, "epoch": 7.0859398272266905, "percentage": 70.86, "elapsed_time": "3:18:12", "remaining_time": "1:21:30", "throughput": 2307.35, "total_tokens": 27440256} {"current_steps": 47580, "total_steps": 67140, "loss": 0.6122, "lr": 1.1851809219652721e-05, "epoch": 7.08668453976765, "percentage": 70.87, "elapsed_time": "3:18:13", "remaining_time": "1:21:29", "throughput": 2307.36, "total_tokens": 27443008} {"current_steps": 47585, "total_steps": 67140, "loss": 0.6894, "lr": 1.1846282207514586e-05, "epoch": 7.087429252308609, "percentage": 70.87, "elapsed_time": "3:18:14", "remaining_time": "1:21:28", "throughput": 2307.39, "total_tokens": 27445952} {"current_steps": 47590, "total_steps": 67140, "loss": 0.6325, "lr": 1.184075608425122e-05, "epoch": 7.088173964849568, "percentage": 70.88, "elapsed_time": "3:18:15", "remaining_time": "1:21:26", "throughput": 2307.41, "total_tokens": 27448864} {"current_steps": 47595, "total_steps": 67140, "loss": 0.6508, "lr": 1.1835230850236057e-05, "epoch": 7.088918677390527, "percentage": 70.89, "elapsed_time": "3:18:17", "remaining_time": "1:21:25", "throughput": 2307.43, "total_tokens": 27451648} {"current_steps": 47600, "total_steps": 67140, "loss": 0.4723, "lr": 1.1829706505842478e-05, "epoch": 7.089663389931486, "percentage": 70.9, "elapsed_time": "3:18:18", "remaining_time": "1:21:24", "throughput": 2307.48, "total_tokens": 27455072} {"current_steps": 47605, "total_steps": 67140, "loss": 0.8043, "lr": 1.1824183051443776e-05, "epoch": 7.090408102472446, "percentage": 70.9, "elapsed_time": "3:18:19", "remaining_time": "1:21:22", "throughput": 2307.49, "total_tokens": 27457760} {"current_steps": 47610, "total_steps": 67140, "loss": 0.5291, "lr": 1.1818660487413217e-05, "epoch": 7.091152815013404, "percentage": 70.91, "elapsed_time": "3:18:20", "remaining_time": "1:21:21", "throughput": 2307.51, "total_tokens": 27460480} {"current_steps": 47615, "total_steps": 67140, "loss": 0.5575, "lr": 1.1813138814123997e-05, "epoch": 7.091897527554364, "percentage": 70.92, "elapsed_time": "3:18:21", "remaining_time": "1:21:20", "throughput": 2307.54, "total_tokens": 27463584} {"current_steps": 47620, "total_steps": 67140, "loss": 0.5843, "lr": 1.1807618031949235e-05, "epoch": 7.092642240095323, "percentage": 70.93, "elapsed_time": "3:18:22", "remaining_time": "1:21:19", "throughput": 2307.57, "total_tokens": 27466528} {"current_steps": 47625, "total_steps": 67140, "loss": 0.4793, "lr": 1.1802098141262008e-05, "epoch": 7.0933869526362825, "percentage": 70.93, "elapsed_time": "3:18:23", "remaining_time": "1:21:17", "throughput": 2307.58, "total_tokens": 27469280} {"current_steps": 47630, "total_steps": 67140, "loss": 0.5483, "lr": 1.1796579142435332e-05, "epoch": 7.094131665177241, "percentage": 70.94, "elapsed_time": "3:18:25", "remaining_time": "1:21:16", "throughput": 2307.61, "total_tokens": 27472192} {"current_steps": 47635, "total_steps": 67140, "loss": 0.6358, "lr": 1.1791061035842158e-05, "epoch": 7.094876377718201, "percentage": 70.95, "elapsed_time": "3:18:26", "remaining_time": "1:21:15", "throughput": 2307.63, "total_tokens": 27475136} {"current_steps": 47640, "total_steps": 67140, "loss": 0.6095, "lr": 1.178554382185538e-05, "epoch": 7.09562109025916, "percentage": 70.96, "elapsed_time": "3:18:27", "remaining_time": "1:21:13", "throughput": 2307.65, "total_tokens": 27477984} {"current_steps": 47645, "total_steps": 67140, "loss": 0.4956, "lr": 1.1780027500847818e-05, "epoch": 7.096365802800119, "percentage": 70.96, "elapsed_time": "3:18:28", "remaining_time": "1:21:12", "throughput": 2307.68, "total_tokens": 27480864} {"current_steps": 47650, "total_steps": 67140, "loss": 0.4231, "lr": 1.177451207319226e-05, "epoch": 7.097110515341078, "percentage": 70.97, "elapsed_time": "3:18:29", "remaining_time": "1:21:11", "throughput": 2307.7, "total_tokens": 27483744} {"current_steps": 47655, "total_steps": 67140, "loss": 0.5116, "lr": 1.1768997539261392e-05, "epoch": 7.097855227882038, "percentage": 70.98, "elapsed_time": "3:18:30", "remaining_time": "1:21:10", "throughput": 2307.71, "total_tokens": 27486464} {"current_steps": 47660, "total_steps": 67140, "loss": 0.5022, "lr": 1.176348389942788e-05, "epoch": 7.0985999404229965, "percentage": 70.99, "elapsed_time": "3:18:31", "remaining_time": "1:21:08", "throughput": 2307.73, "total_tokens": 27489408} {"current_steps": 47665, "total_steps": 67140, "loss": 0.6304, "lr": 1.175797115406431e-05, "epoch": 7.099344652963956, "percentage": 70.99, "elapsed_time": "3:18:32", "remaining_time": "1:21:07", "throughput": 2307.75, "total_tokens": 27492160} {"current_steps": 47670, "total_steps": 67140, "loss": 0.6006, "lr": 1.1752459303543209e-05, "epoch": 7.100089365504915, "percentage": 71.0, "elapsed_time": "3:18:34", "remaining_time": "1:21:06", "throughput": 2307.78, "total_tokens": 27495296} {"current_steps": 47675, "total_steps": 67140, "loss": 0.6538, "lr": 1.174694834823705e-05, "epoch": 7.1008340780458745, "percentage": 71.01, "elapsed_time": "3:18:35", "remaining_time": "1:21:04", "throughput": 2307.8, "total_tokens": 27498176} {"current_steps": 47680, "total_steps": 67140, "loss": 0.4484, "lr": 1.1741438288518248e-05, "epoch": 7.101578790586833, "percentage": 71.02, "elapsed_time": "3:18:36", "remaining_time": "1:21:03", "throughput": 2307.81, "total_tokens": 27500864} {"current_steps": 47685, "total_steps": 67140, "loss": 0.6654, "lr": 1.173592912475914e-05, "epoch": 7.102323503127793, "percentage": 71.02, "elapsed_time": "3:18:37", "remaining_time": "1:21:02", "throughput": 2307.85, "total_tokens": 27504128} {"current_steps": 47690, "total_steps": 67140, "loss": 0.4782, "lr": 1.1730420857332002e-05, "epoch": 7.103068215668752, "percentage": 71.03, "elapsed_time": "3:18:38", "remaining_time": "1:21:00", "throughput": 2307.87, "total_tokens": 27506912} {"current_steps": 47695, "total_steps": 67140, "loss": 0.6898, "lr": 1.1724913486609077e-05, "epoch": 7.103812928209711, "percentage": 71.04, "elapsed_time": "3:18:39", "remaining_time": "1:20:59", "throughput": 2307.87, "total_tokens": 27509376} {"current_steps": 47700, "total_steps": 67140, "loss": 0.68, "lr": 1.1719407012962524e-05, "epoch": 7.10455764075067, "percentage": 71.05, "elapsed_time": "3:18:40", "remaining_time": "1:20:58", "throughput": 2307.9, "total_tokens": 27512384} {"current_steps": 47705, "total_steps": 67140, "loss": 0.7663, "lr": 1.1713901436764451e-05, "epoch": 7.10530235329163, "percentage": 71.05, "elapsed_time": "3:18:42", "remaining_time": "1:20:57", "throughput": 2307.93, "total_tokens": 27515360} {"current_steps": 47710, "total_steps": 67140, "loss": 0.5593, "lr": 1.1708396758386911e-05, "epoch": 7.1060470658325885, "percentage": 71.06, "elapsed_time": "3:18:43", "remaining_time": "1:20:55", "throughput": 2307.95, "total_tokens": 27518208} {"current_steps": 47715, "total_steps": 67140, "loss": 0.6879, "lr": 1.1702892978201868e-05, "epoch": 7.106791778373548, "percentage": 71.07, "elapsed_time": "3:18:44", "remaining_time": "1:20:54", "throughput": 2307.96, "total_tokens": 27520864} {"current_steps": 47720, "total_steps": 67140, "loss": 0.7284, "lr": 1.1697390096581265e-05, "epoch": 7.107536490914507, "percentage": 71.08, "elapsed_time": "3:18:45", "remaining_time": "1:20:53", "throughput": 2307.98, "total_tokens": 27523744} {"current_steps": 47725, "total_steps": 67140, "loss": 0.7318, "lr": 1.1691888113896945e-05, "epoch": 7.1082812034554665, "percentage": 71.08, "elapsed_time": "3:18:46", "remaining_time": "1:20:51", "throughput": 2308.02, "total_tokens": 27526976} {"current_steps": 47730, "total_steps": 67140, "loss": 0.5616, "lr": 1.1686387030520721e-05, "epoch": 7.109025915996425, "percentage": 71.09, "elapsed_time": "3:18:47", "remaining_time": "1:20:50", "throughput": 2308.03, "total_tokens": 27529664} {"current_steps": 47735, "total_steps": 67140, "loss": 0.5508, "lr": 1.168088684682433e-05, "epoch": 7.109770628537385, "percentage": 71.1, "elapsed_time": "3:18:48", "remaining_time": "1:20:49", "throughput": 2308.05, "total_tokens": 27532544} {"current_steps": 47740, "total_steps": 67140, "loss": 0.5312, "lr": 1.1675387563179455e-05, "epoch": 7.110515341078344, "percentage": 71.11, "elapsed_time": "3:18:50", "remaining_time": "1:20:47", "throughput": 2308.07, "total_tokens": 27535360} {"current_steps": 47745, "total_steps": 67140, "loss": 0.4188, "lr": 1.1669889179957725e-05, "epoch": 7.111260053619303, "percentage": 71.11, "elapsed_time": "3:18:51", "remaining_time": "1:20:46", "throughput": 2308.08, "total_tokens": 27538048} {"current_steps": 47750, "total_steps": 67140, "loss": 0.7124, "lr": 1.1664391697530677e-05, "epoch": 7.112004766160262, "percentage": 71.12, "elapsed_time": "3:18:52", "remaining_time": "1:20:45", "throughput": 2308.11, "total_tokens": 27541056} {"current_steps": 47755, "total_steps": 67140, "loss": 0.5547, "lr": 1.1658895116269821e-05, "epoch": 7.112749478701222, "percentage": 71.13, "elapsed_time": "3:18:53", "remaining_time": "1:20:44", "throughput": 2308.13, "total_tokens": 27544000} {"current_steps": 47760, "total_steps": 67140, "loss": 0.7941, "lr": 1.16533994365466e-05, "epoch": 7.1134941912421805, "percentage": 71.13, "elapsed_time": "3:18:54", "remaining_time": "1:20:42", "throughput": 2308.16, "total_tokens": 27546848} {"current_steps": 47765, "total_steps": 67140, "loss": 0.6176, "lr": 1.1647904658732373e-05, "epoch": 7.114238903783139, "percentage": 71.14, "elapsed_time": "3:18:55", "remaining_time": "1:20:41", "throughput": 2308.18, "total_tokens": 27549792} {"current_steps": 47770, "total_steps": 67140, "loss": 0.7843, "lr": 1.1642410783198465e-05, "epoch": 7.114983616324099, "percentage": 71.15, "elapsed_time": "3:18:56", "remaining_time": "1:20:40", "throughput": 2308.21, "total_tokens": 27552800} {"current_steps": 47775, "total_steps": 67140, "loss": 0.53, "lr": 1.1636917810316126e-05, "epoch": 7.115728328865058, "percentage": 71.16, "elapsed_time": "3:18:58", "remaining_time": "1:20:38", "throughput": 2308.25, "total_tokens": 27555968} {"current_steps": 47780, "total_steps": 67140, "loss": 0.4708, "lr": 1.1631425740456562e-05, "epoch": 7.116473041406017, "percentage": 71.16, "elapsed_time": "3:18:59", "remaining_time": "1:20:37", "throughput": 2308.26, "total_tokens": 27558688} {"current_steps": 47785, "total_steps": 67140, "loss": 0.7351, "lr": 1.1625934573990882e-05, "epoch": 7.117217753946976, "percentage": 71.17, "elapsed_time": "3:19:00", "remaining_time": "1:20:36", "throughput": 2308.3, "total_tokens": 27561888} {"current_steps": 47790, "total_steps": 67140, "loss": 0.7377, "lr": 1.1620444311290172e-05, "epoch": 7.117962466487936, "percentage": 71.18, "elapsed_time": "3:19:01", "remaining_time": "1:20:35", "throughput": 2308.33, "total_tokens": 27564896} {"current_steps": 47795, "total_steps": 67140, "loss": 0.6665, "lr": 1.1614954952725434e-05, "epoch": 7.1187071790288945, "percentage": 71.19, "elapsed_time": "3:19:02", "remaining_time": "1:20:33", "throughput": 2308.36, "total_tokens": 27568000} {"current_steps": 47800, "total_steps": 67140, "loss": 0.6711, "lr": 1.1609466498667634e-05, "epoch": 7.119451891569854, "percentage": 71.19, "elapsed_time": "3:19:03", "remaining_time": "1:20:32", "throughput": 2308.37, "total_tokens": 27570816} {"current_steps": 47805, "total_steps": 67140, "loss": 0.5913, "lr": 1.1603978949487634e-05, "epoch": 7.120196604110813, "percentage": 71.2, "elapsed_time": "3:19:04", "remaining_time": "1:20:31", "throughput": 2308.39, "total_tokens": 27573664} {"current_steps": 47810, "total_steps": 67140, "loss": 0.6809, "lr": 1.1598492305556274e-05, "epoch": 7.1209413166517725, "percentage": 71.21, "elapsed_time": "3:19:06", "remaining_time": "1:20:29", "throughput": 2308.41, "total_tokens": 27576512} {"current_steps": 47815, "total_steps": 67140, "loss": 0.5294, "lr": 1.1593006567244328e-05, "epoch": 7.121686029192731, "percentage": 71.22, "elapsed_time": "3:19:07", "remaining_time": "1:20:28", "throughput": 2308.44, "total_tokens": 27579424} {"current_steps": 47820, "total_steps": 67140, "loss": 0.4628, "lr": 1.1587521734922476e-05, "epoch": 7.122430741733691, "percentage": 71.22, "elapsed_time": "3:19:08", "remaining_time": "1:20:27", "throughput": 2308.45, "total_tokens": 27582240} {"current_steps": 47825, "total_steps": 67140, "loss": 0.5709, "lr": 1.1582037808961377e-05, "epoch": 7.12317545427465, "percentage": 71.23, "elapsed_time": "3:19:09", "remaining_time": "1:20:26", "throughput": 2308.47, "total_tokens": 27585056} {"current_steps": 47830, "total_steps": 67140, "loss": 0.5168, "lr": 1.1576554789731608e-05, "epoch": 7.123920166815609, "percentage": 71.24, "elapsed_time": "3:19:10", "remaining_time": "1:20:24", "throughput": 2308.48, "total_tokens": 27587744} {"current_steps": 47835, "total_steps": 67140, "loss": 0.4325, "lr": 1.1571072677603691e-05, "epoch": 7.124664879356568, "percentage": 71.25, "elapsed_time": "3:19:11", "remaining_time": "1:20:23", "throughput": 2308.5, "total_tokens": 27590496} {"current_steps": 47840, "total_steps": 67140, "loss": 0.4317, "lr": 1.1565591472948095e-05, "epoch": 7.125409591897528, "percentage": 71.25, "elapsed_time": "3:19:12", "remaining_time": "1:20:22", "throughput": 2308.52, "total_tokens": 27593408} {"current_steps": 47845, "total_steps": 67140, "loss": 0.4868, "lr": 1.1560111176135197e-05, "epoch": 7.1261543044384865, "percentage": 71.26, "elapsed_time": "3:19:13", "remaining_time": "1:20:20", "throughput": 2308.54, "total_tokens": 27596224} {"current_steps": 47850, "total_steps": 67140, "loss": 0.5606, "lr": 1.1554631787535353e-05, "epoch": 7.126899016979446, "percentage": 71.27, "elapsed_time": "3:19:15", "remaining_time": "1:20:19", "throughput": 2308.55, "total_tokens": 27598976} {"current_steps": 47855, "total_steps": 67140, "loss": 0.6866, "lr": 1.1549153307518817e-05, "epoch": 7.127643729520405, "percentage": 71.28, "elapsed_time": "3:19:16", "remaining_time": "1:20:18", "throughput": 2308.58, "total_tokens": 27601920} {"current_steps": 47860, "total_steps": 67140, "loss": 0.4733, "lr": 1.1543675736455814e-05, "epoch": 7.128388442061365, "percentage": 71.28, "elapsed_time": "3:19:17", "remaining_time": "1:20:16", "throughput": 2308.58, "total_tokens": 27604512} {"current_steps": 47865, "total_steps": 67140, "loss": 0.5445, "lr": 1.1538199074716493e-05, "epoch": 7.129133154602323, "percentage": 71.29, "elapsed_time": "3:19:18", "remaining_time": "1:20:15", "throughput": 2308.59, "total_tokens": 27607072} {"current_steps": 47870, "total_steps": 67140, "loss": 0.6862, "lr": 1.1532723322670952e-05, "epoch": 7.129877867143283, "percentage": 71.3, "elapsed_time": "3:19:19", "remaining_time": "1:20:14", "throughput": 2308.6, "total_tokens": 27609856} {"current_steps": 47875, "total_steps": 67140, "loss": 0.6008, "lr": 1.152724848068922e-05, "epoch": 7.130622579684242, "percentage": 71.31, "elapsed_time": "3:19:20", "remaining_time": "1:20:12", "throughput": 2308.62, "total_tokens": 27612640} {"current_steps": 47880, "total_steps": 67140, "loss": 0.5582, "lr": 1.152177454914125e-05, "epoch": 7.131367292225201, "percentage": 71.31, "elapsed_time": "3:19:21", "remaining_time": "1:20:11", "throughput": 2308.64, "total_tokens": 27615552} {"current_steps": 47885, "total_steps": 67140, "loss": 0.6423, "lr": 1.151630152839697e-05, "epoch": 7.13211200476616, "percentage": 71.32, "elapsed_time": "3:19:22", "remaining_time": "1:20:10", "throughput": 2308.67, "total_tokens": 27618560} {"current_steps": 47890, "total_steps": 67140, "loss": 0.649, "lr": 1.1510829418826199e-05, "epoch": 7.13285671730712, "percentage": 71.33, "elapsed_time": "3:19:24", "remaining_time": "1:20:09", "throughput": 2308.7, "total_tokens": 27621600} {"current_steps": 47895, "total_steps": 67140, "loss": 0.5568, "lr": 1.1505358220798736e-05, "epoch": 7.1336014298480785, "percentage": 71.34, "elapsed_time": "3:19:25", "remaining_time": "1:20:07", "throughput": 2308.72, "total_tokens": 27624448} {"current_steps": 47900, "total_steps": 67140, "loss": 0.6884, "lr": 1.1499887934684297e-05, "epoch": 7.134346142389038, "percentage": 71.34, "elapsed_time": "3:19:26", "remaining_time": "1:20:06", "throughput": 2308.73, "total_tokens": 27627104} {"current_steps": 47905, "total_steps": 67140, "loss": 0.4231, "lr": 1.1494418560852546e-05, "epoch": 7.135090854929997, "percentage": 71.35, "elapsed_time": "3:19:27", "remaining_time": "1:20:05", "throughput": 2308.74, "total_tokens": 27629856} {"current_steps": 47910, "total_steps": 67140, "loss": 0.7129, "lr": 1.1488950099673087e-05, "epoch": 7.135835567470957, "percentage": 71.36, "elapsed_time": "3:19:28", "remaining_time": "1:20:03", "throughput": 2308.77, "total_tokens": 27632896} {"current_steps": 47915, "total_steps": 67140, "loss": 0.5258, "lr": 1.148348255151544e-05, "epoch": 7.136580280011915, "percentage": 71.37, "elapsed_time": "3:19:29", "remaining_time": "1:20:02", "throughput": 2308.78, "total_tokens": 27635488} {"current_steps": 47920, "total_steps": 67140, "loss": 0.7527, "lr": 1.1478015916749089e-05, "epoch": 7.137324992552875, "percentage": 71.37, "elapsed_time": "3:19:30", "remaining_time": "1:20:01", "throughput": 2308.8, "total_tokens": 27638400} {"current_steps": 47925, "total_steps": 67140, "loss": 0.5606, "lr": 1.147255019574345e-05, "epoch": 7.138069705093834, "percentage": 71.38, "elapsed_time": "3:19:32", "remaining_time": "1:20:00", "throughput": 2308.84, "total_tokens": 27641504} {"current_steps": 47930, "total_steps": 67140, "loss": 0.413, "lr": 1.1467085388867866e-05, "epoch": 7.1388144176347925, "percentage": 71.39, "elapsed_time": "3:19:33", "remaining_time": "1:19:58", "throughput": 2308.86, "total_tokens": 27644480} {"current_steps": 47935, "total_steps": 67140, "loss": 0.4525, "lr": 1.1461621496491628e-05, "epoch": 7.139559130175752, "percentage": 71.4, "elapsed_time": "3:19:34", "remaining_time": "1:19:57", "throughput": 2308.9, "total_tokens": 27647552} {"current_steps": 47940, "total_steps": 67140, "loss": 0.7176, "lr": 1.1456158518983967e-05, "epoch": 7.140303842716711, "percentage": 71.4, "elapsed_time": "3:19:35", "remaining_time": "1:19:56", "throughput": 2308.92, "total_tokens": 27650464} {"current_steps": 47945, "total_steps": 67140, "loss": 0.4254, "lr": 1.1450696456714057e-05, "epoch": 7.141048555257671, "percentage": 71.41, "elapsed_time": "3:19:36", "remaining_time": "1:19:54", "throughput": 2308.94, "total_tokens": 27653376} {"current_steps": 47950, "total_steps": 67140, "loss": 0.4003, "lr": 1.1445235310050987e-05, "epoch": 7.141793267798629, "percentage": 71.42, "elapsed_time": "3:19:37", "remaining_time": "1:19:53", "throughput": 2308.97, "total_tokens": 27656288} {"current_steps": 47955, "total_steps": 67140, "loss": 0.4222, "lr": 1.14397750793638e-05, "epoch": 7.142537980339589, "percentage": 71.43, "elapsed_time": "3:19:38", "remaining_time": "1:19:52", "throughput": 2308.98, "total_tokens": 27658976} {"current_steps": 47960, "total_steps": 67140, "loss": 0.6034, "lr": 1.1434315765021485e-05, "epoch": 7.143282692880548, "percentage": 71.43, "elapsed_time": "3:19:39", "remaining_time": "1:19:50", "throughput": 2308.99, "total_tokens": 27661600} {"current_steps": 47965, "total_steps": 67140, "loss": 0.5514, "lr": 1.1428857367392964e-05, "epoch": 7.144027405421507, "percentage": 71.44, "elapsed_time": "3:19:41", "remaining_time": "1:19:49", "throughput": 2308.99, "total_tokens": 27664224} {"current_steps": 47970, "total_steps": 67140, "loss": 0.565, "lr": 1.1423399886847077e-05, "epoch": 7.144772117962466, "percentage": 71.45, "elapsed_time": "3:19:42", "remaining_time": "1:19:48", "throughput": 2309.01, "total_tokens": 27667040} {"current_steps": 47975, "total_steps": 67140, "loss": 0.4927, "lr": 1.1417943323752629e-05, "epoch": 7.145516830503426, "percentage": 71.46, "elapsed_time": "3:19:43", "remaining_time": "1:19:47", "throughput": 2309.04, "total_tokens": 27669952} {"current_steps": 47980, "total_steps": 67140, "loss": 0.6825, "lr": 1.1412487678478357e-05, "epoch": 7.1462615430443845, "percentage": 71.46, "elapsed_time": "3:19:44", "remaining_time": "1:19:45", "throughput": 2309.05, "total_tokens": 27672704} {"current_steps": 47985, "total_steps": 67140, "loss": 0.6143, "lr": 1.1407032951392916e-05, "epoch": 7.147006255585344, "percentage": 71.47, "elapsed_time": "3:19:45", "remaining_time": "1:19:44", "throughput": 2309.09, "total_tokens": 27675904} {"current_steps": 47990, "total_steps": 67140, "loss": 0.5925, "lr": 1.1401579142864924e-05, "epoch": 7.147750968126303, "percentage": 71.48, "elapsed_time": "3:19:46", "remaining_time": "1:19:43", "throughput": 2309.12, "total_tokens": 27679040} {"current_steps": 47995, "total_steps": 67140, "loss": 1.0727, "lr": 1.1396126253262926e-05, "epoch": 7.148495680667263, "percentage": 71.48, "elapsed_time": "3:19:47", "remaining_time": "1:19:41", "throughput": 2309.15, "total_tokens": 27682112} {"current_steps": 48000, "total_steps": 67140, "loss": 0.5863, "lr": 1.1390674282955408e-05, "epoch": 7.149240393208221, "percentage": 71.49, "elapsed_time": "3:19:49", "remaining_time": "1:19:40", "throughput": 2309.17, "total_tokens": 27684800} {"current_steps": 48005, "total_steps": 67140, "loss": 0.7333, "lr": 1.1385223232310799e-05, "epoch": 7.149985105749181, "percentage": 71.5, "elapsed_time": "3:19:50", "remaining_time": "1:19:39", "throughput": 2309.2, "total_tokens": 27687776} {"current_steps": 48010, "total_steps": 67140, "loss": 0.5663, "lr": 1.1379773101697439e-05, "epoch": 7.15072981829014, "percentage": 71.51, "elapsed_time": "3:19:51", "remaining_time": "1:19:38", "throughput": 2309.22, "total_tokens": 27690656} {"current_steps": 48015, "total_steps": 67140, "loss": 0.6865, "lr": 1.1374323891483649e-05, "epoch": 7.151474530831099, "percentage": 71.51, "elapsed_time": "3:19:52", "remaining_time": "1:19:36", "throughput": 2309.25, "total_tokens": 27693856} {"current_steps": 48020, "total_steps": 67140, "loss": 0.5372, "lr": 1.136887560203764e-05, "epoch": 7.152219243372058, "percentage": 71.52, "elapsed_time": "3:19:53", "remaining_time": "1:19:35", "throughput": 2309.28, "total_tokens": 27696832} {"current_steps": 48025, "total_steps": 67140, "loss": 0.5149, "lr": 1.13634282337276e-05, "epoch": 7.152963955913018, "percentage": 71.53, "elapsed_time": "3:19:54", "remaining_time": "1:19:34", "throughput": 2309.29, "total_tokens": 27699584} {"current_steps": 48030, "total_steps": 67140, "loss": 0.4804, "lr": 1.1357981786921636e-05, "epoch": 7.153708668453977, "percentage": 71.54, "elapsed_time": "3:19:55", "remaining_time": "1:19:32", "throughput": 2309.29, "total_tokens": 27702016} {"current_steps": 48035, "total_steps": 67140, "loss": 0.3747, "lr": 1.13525362619878e-05, "epoch": 7.154453380994936, "percentage": 71.54, "elapsed_time": "3:19:57", "remaining_time": "1:19:31", "throughput": 2309.3, "total_tokens": 27704736} {"current_steps": 48040, "total_steps": 67140, "loss": 0.5222, "lr": 1.1347091659294087e-05, "epoch": 7.155198093535895, "percentage": 71.55, "elapsed_time": "3:19:58", "remaining_time": "1:19:30", "throughput": 2309.31, "total_tokens": 27707392} {"current_steps": 48045, "total_steps": 67140, "loss": 0.5186, "lr": 1.13416479792084e-05, "epoch": 7.155942806076855, "percentage": 71.56, "elapsed_time": "3:19:59", "remaining_time": "1:19:28", "throughput": 2309.32, "total_tokens": 27710048} {"current_steps": 48050, "total_steps": 67140, "loss": 0.7807, "lr": 1.1336205222098622e-05, "epoch": 7.156687518617813, "percentage": 71.57, "elapsed_time": "3:20:00", "remaining_time": "1:19:27", "throughput": 2309.34, "total_tokens": 27712992} {"current_steps": 48055, "total_steps": 67140, "loss": 0.4956, "lr": 1.1330763388332533e-05, "epoch": 7.157432231158773, "percentage": 71.57, "elapsed_time": "3:20:01", "remaining_time": "1:19:26", "throughput": 2309.36, "total_tokens": 27715808} {"current_steps": 48060, "total_steps": 67140, "loss": 0.6303, "lr": 1.1325322478277877e-05, "epoch": 7.158176943699732, "percentage": 71.58, "elapsed_time": "3:20:02", "remaining_time": "1:19:25", "throughput": 2309.37, "total_tokens": 27718528} {"current_steps": 48065, "total_steps": 67140, "loss": 0.5883, "lr": 1.1319882492302333e-05, "epoch": 7.158921656240691, "percentage": 71.59, "elapsed_time": "3:20:03", "remaining_time": "1:19:23", "throughput": 2309.4, "total_tokens": 27721568} {"current_steps": 48070, "total_steps": 67140, "loss": 0.603, "lr": 1.131444343077351e-05, "epoch": 7.15966636878165, "percentage": 71.6, "elapsed_time": "3:20:04", "remaining_time": "1:19:22", "throughput": 2309.42, "total_tokens": 27724416} {"current_steps": 48075, "total_steps": 67140, "loss": 0.6192, "lr": 1.1309005294058968e-05, "epoch": 7.16041108132261, "percentage": 71.6, "elapsed_time": "3:20:06", "remaining_time": "1:19:21", "throughput": 2309.45, "total_tokens": 27727392} {"current_steps": 48080, "total_steps": 67140, "loss": 0.6721, "lr": 1.1303568082526178e-05, "epoch": 7.161155793863569, "percentage": 71.61, "elapsed_time": "3:20:07", "remaining_time": "1:19:19", "throughput": 2309.47, "total_tokens": 27730304} {"current_steps": 48085, "total_steps": 67140, "loss": 0.5868, "lr": 1.1298131796542576e-05, "epoch": 7.161900506404528, "percentage": 71.62, "elapsed_time": "3:20:08", "remaining_time": "1:19:18", "throughput": 2309.49, "total_tokens": 27733056} {"current_steps": 48090, "total_steps": 67140, "loss": 0.6605, "lr": 1.1292696436475514e-05, "epoch": 7.162645218945487, "percentage": 71.63, "elapsed_time": "3:20:09", "remaining_time": "1:19:17", "throughput": 2309.5, "total_tokens": 27735776} {"current_steps": 48095, "total_steps": 67140, "loss": 0.7548, "lr": 1.1287262002692295e-05, "epoch": 7.163389931486447, "percentage": 71.63, "elapsed_time": "3:20:10", "remaining_time": "1:19:16", "throughput": 2309.52, "total_tokens": 27738624} {"current_steps": 48100, "total_steps": 67140, "loss": 0.445, "lr": 1.1281828495560157e-05, "epoch": 7.164134644027405, "percentage": 71.64, "elapsed_time": "3:20:11", "remaining_time": "1:19:14", "throughput": 2309.55, "total_tokens": 27741632} {"current_steps": 48105, "total_steps": 67140, "loss": 0.6318, "lr": 1.1276395915446278e-05, "epoch": 7.164879356568365, "percentage": 71.65, "elapsed_time": "3:20:12", "remaining_time": "1:19:13", "throughput": 2309.6, "total_tokens": 27745120} {"current_steps": 48110, "total_steps": 67140, "loss": 0.4206, "lr": 1.1270964262717773e-05, "epoch": 7.165624069109324, "percentage": 71.66, "elapsed_time": "3:20:14", "remaining_time": "1:19:12", "throughput": 2309.62, "total_tokens": 27747872} {"current_steps": 48115, "total_steps": 67140, "loss": 0.5118, "lr": 1.126553353774168e-05, "epoch": 7.166368781650283, "percentage": 71.66, "elapsed_time": "3:20:15", "remaining_time": "1:19:10", "throughput": 2309.62, "total_tokens": 27750464} {"current_steps": 48120, "total_steps": 67140, "loss": 0.5515, "lr": 1.1260103740884986e-05, "epoch": 7.167113494191242, "percentage": 71.67, "elapsed_time": "3:20:16", "remaining_time": "1:19:09", "throughput": 2309.64, "total_tokens": 27753344} {"current_steps": 48125, "total_steps": 67140, "loss": 0.5787, "lr": 1.1254674872514629e-05, "epoch": 7.167858206732201, "percentage": 71.68, "elapsed_time": "3:20:17", "remaining_time": "1:19:08", "throughput": 2309.65, "total_tokens": 27756000} {"current_steps": 48130, "total_steps": 67140, "loss": 0.6241, "lr": 1.124924693299745e-05, "epoch": 7.168602919273161, "percentage": 71.69, "elapsed_time": "3:20:18", "remaining_time": "1:19:06", "throughput": 2309.68, "total_tokens": 27758912} {"current_steps": 48135, "total_steps": 67140, "loss": 0.5931, "lr": 1.124381992270026e-05, "epoch": 7.169347631814119, "percentage": 71.69, "elapsed_time": "3:20:19", "remaining_time": "1:19:05", "throughput": 2309.69, "total_tokens": 27761664} {"current_steps": 48140, "total_steps": 67140, "loss": 0.5505, "lr": 1.123839384198979e-05, "epoch": 7.170092344355079, "percentage": 71.7, "elapsed_time": "3:20:20", "remaining_time": "1:19:04", "throughput": 2309.7, "total_tokens": 27764384} {"current_steps": 48145, "total_steps": 67140, "loss": 0.4597, "lr": 1.123296869123272e-05, "epoch": 7.170837056896038, "percentage": 71.71, "elapsed_time": "3:20:21", "remaining_time": "1:19:03", "throughput": 2309.74, "total_tokens": 27767488} {"current_steps": 48150, "total_steps": 67140, "loss": 0.6156, "lr": 1.1227544470795645e-05, "epoch": 7.171581769436997, "percentage": 71.72, "elapsed_time": "3:20:23", "remaining_time": "1:19:01", "throughput": 2309.77, "total_tokens": 27770560} {"current_steps": 48155, "total_steps": 67140, "loss": 0.4993, "lr": 1.122212118104512e-05, "epoch": 7.172326481977956, "percentage": 71.72, "elapsed_time": "3:20:24", "remaining_time": "1:19:00", "throughput": 2309.79, "total_tokens": 27773440} {"current_steps": 48160, "total_steps": 67140, "loss": 0.6402, "lr": 1.1216698822347629e-05, "epoch": 7.173071194518916, "percentage": 71.73, "elapsed_time": "3:20:25", "remaining_time": "1:18:59", "throughput": 2309.81, "total_tokens": 27776224} {"current_steps": 48165, "total_steps": 67140, "loss": 0.6258, "lr": 1.1211277395069603e-05, "epoch": 7.173815907059875, "percentage": 71.74, "elapsed_time": "3:20:26", "remaining_time": "1:18:57", "throughput": 2309.83, "total_tokens": 27779104} {"current_steps": 48170, "total_steps": 67140, "loss": 0.6351, "lr": 1.120585689957738e-05, "epoch": 7.174560619600834, "percentage": 71.75, "elapsed_time": "3:20:27", "remaining_time": "1:18:56", "throughput": 2309.84, "total_tokens": 27781792} {"current_steps": 48175, "total_steps": 67140, "loss": 0.5334, "lr": 1.1200437336237265e-05, "epoch": 7.175305332141793, "percentage": 71.75, "elapsed_time": "3:20:28", "remaining_time": "1:18:55", "throughput": 2309.85, "total_tokens": 27784576} {"current_steps": 48180, "total_steps": 67140, "loss": 0.5483, "lr": 1.11950187054155e-05, "epoch": 7.176050044682753, "percentage": 71.76, "elapsed_time": "3:20:29", "remaining_time": "1:18:54", "throughput": 2309.87, "total_tokens": 27787296} {"current_steps": 48185, "total_steps": 67140, "loss": 0.7014, "lr": 1.1189601007478233e-05, "epoch": 7.176794757223711, "percentage": 71.77, "elapsed_time": "3:20:30", "remaining_time": "1:18:52", "throughput": 2309.88, "total_tokens": 27790080} {"current_steps": 48190, "total_steps": 67140, "loss": 0.5014, "lr": 1.1184184242791581e-05, "epoch": 7.177539469764671, "percentage": 71.78, "elapsed_time": "3:20:32", "remaining_time": "1:18:51", "throughput": 2309.91, "total_tokens": 27793152} {"current_steps": 48195, "total_steps": 67140, "loss": 0.6742, "lr": 1.1178768411721589e-05, "epoch": 7.17828418230563, "percentage": 71.78, "elapsed_time": "3:20:33", "remaining_time": "1:18:50", "throughput": 2309.95, "total_tokens": 27796352} {"current_steps": 48200, "total_steps": 67140, "loss": 0.5916, "lr": 1.1173353514634232e-05, "epoch": 7.1790288948465895, "percentage": 71.79, "elapsed_time": "3:20:34", "remaining_time": "1:18:48", "throughput": 2309.96, "total_tokens": 27799040} {"current_steps": 48205, "total_steps": 67140, "loss": 0.7128, "lr": 1.116793955189544e-05, "epoch": 7.179773607387548, "percentage": 71.8, "elapsed_time": "3:20:35", "remaining_time": "1:18:47", "throughput": 2309.98, "total_tokens": 27801888} {"current_steps": 48210, "total_steps": 67140, "loss": 0.7468, "lr": 1.1162526523871048e-05, "epoch": 7.180518319928508, "percentage": 71.81, "elapsed_time": "3:20:36", "remaining_time": "1:18:46", "throughput": 2310.0, "total_tokens": 27804736} {"current_steps": 48215, "total_steps": 67140, "loss": 0.6666, "lr": 1.115711443092686e-05, "epoch": 7.181263032469467, "percentage": 71.81, "elapsed_time": "3:20:37", "remaining_time": "1:18:44", "throughput": 2310.02, "total_tokens": 27807488} {"current_steps": 48220, "total_steps": 67140, "loss": 0.6839, "lr": 1.115170327342859e-05, "epoch": 7.182007745010426, "percentage": 71.82, "elapsed_time": "3:20:38", "remaining_time": "1:18:43", "throughput": 2310.04, "total_tokens": 27810368} {"current_steps": 48225, "total_steps": 67140, "loss": 0.8166, "lr": 1.1146293051741913e-05, "epoch": 7.182752457551385, "percentage": 71.83, "elapsed_time": "3:20:40", "remaining_time": "1:18:42", "throughput": 2310.05, "total_tokens": 27813088} {"current_steps": 48230, "total_steps": 67140, "loss": 0.5511, "lr": 1.1140883766232422e-05, "epoch": 7.183497170092345, "percentage": 71.83, "elapsed_time": "3:20:41", "remaining_time": "1:18:41", "throughput": 2310.06, "total_tokens": 27815840} {"current_steps": 48235, "total_steps": 67140, "loss": 0.5753, "lr": 1.1135475417265662e-05, "epoch": 7.184241882633303, "percentage": 71.84, "elapsed_time": "3:20:42", "remaining_time": "1:18:39", "throughput": 2310.09, "total_tokens": 27818720} {"current_steps": 48240, "total_steps": 67140, "loss": 0.7426, "lr": 1.113006800520711e-05, "epoch": 7.184986595174263, "percentage": 71.85, "elapsed_time": "3:20:43", "remaining_time": "1:18:38", "throughput": 2310.11, "total_tokens": 27821632} {"current_steps": 48245, "total_steps": 67140, "loss": 0.5412, "lr": 1.1124661530422176e-05, "epoch": 7.185731307715222, "percentage": 71.86, "elapsed_time": "3:20:44", "remaining_time": "1:18:37", "throughput": 2310.13, "total_tokens": 27824448} {"current_steps": 48250, "total_steps": 67140, "loss": 0.5416, "lr": 1.111925599327619e-05, "epoch": 7.1864760202561815, "percentage": 71.86, "elapsed_time": "3:20:45", "remaining_time": "1:18:35", "throughput": 2310.16, "total_tokens": 27827552} {"current_steps": 48255, "total_steps": 67140, "loss": 0.5577, "lr": 1.111385139413445e-05, "epoch": 7.18722073279714, "percentage": 71.87, "elapsed_time": "3:20:46", "remaining_time": "1:18:34", "throughput": 2310.17, "total_tokens": 27830304} {"current_steps": 48260, "total_steps": 67140, "loss": 0.5761, "lr": 1.1108447733362177e-05, "epoch": 7.1879654453381, "percentage": 71.88, "elapsed_time": "3:20:47", "remaining_time": "1:18:33", "throughput": 2310.2, "total_tokens": 27833280} {"current_steps": 48265, "total_steps": 67140, "loss": 0.4004, "lr": 1.1103045011324526e-05, "epoch": 7.188710157879059, "percentage": 71.89, "elapsed_time": "3:20:49", "remaining_time": "1:18:32", "throughput": 2310.22, "total_tokens": 27836032} {"current_steps": 48270, "total_steps": 67140, "loss": 0.5935, "lr": 1.1097643228386593e-05, "epoch": 7.189454870420018, "percentage": 71.89, "elapsed_time": "3:20:50", "remaining_time": "1:18:30", "throughput": 2310.23, "total_tokens": 27838816} {"current_steps": 48275, "total_steps": 67140, "loss": 0.7627, "lr": 1.1092242384913415e-05, "epoch": 7.190199582960977, "percentage": 71.9, "elapsed_time": "3:20:51", "remaining_time": "1:18:29", "throughput": 2310.24, "total_tokens": 27841536} {"current_steps": 48280, "total_steps": 67140, "loss": 0.5298, "lr": 1.1086842481269943e-05, "epoch": 7.190944295501936, "percentage": 71.91, "elapsed_time": "3:20:52", "remaining_time": "1:18:28", "throughput": 2310.26, "total_tokens": 27844320} {"current_steps": 48285, "total_steps": 67140, "loss": 0.6114, "lr": 1.10814435178211e-05, "epoch": 7.1916890080428955, "percentage": 71.92, "elapsed_time": "3:20:53", "remaining_time": "1:18:26", "throughput": 2310.28, "total_tokens": 27847264} {"current_steps": 48290, "total_steps": 67140, "loss": 0.8372, "lr": 1.1076045494931705e-05, "epoch": 7.192433720583854, "percentage": 71.92, "elapsed_time": "3:20:54", "remaining_time": "1:18:25", "throughput": 2310.3, "total_tokens": 27850048} {"current_steps": 48295, "total_steps": 67140, "loss": 0.5906, "lr": 1.1070648412966548e-05, "epoch": 7.193178433124814, "percentage": 71.93, "elapsed_time": "3:20:55", "remaining_time": "1:18:24", "throughput": 2310.31, "total_tokens": 27852736} {"current_steps": 48300, "total_steps": 67140, "loss": 0.6266, "lr": 1.1065252272290333e-05, "epoch": 7.193923145665773, "percentage": 71.94, "elapsed_time": "3:20:57", "remaining_time": "1:18:22", "throughput": 2310.36, "total_tokens": 27856064} {"current_steps": 48305, "total_steps": 67140, "loss": 0.4257, "lr": 1.1059857073267718e-05, "epoch": 7.194667858206732, "percentage": 71.95, "elapsed_time": "3:20:58", "remaining_time": "1:18:21", "throughput": 2310.37, "total_tokens": 27858720} {"current_steps": 48310, "total_steps": 67140, "loss": 0.5568, "lr": 1.1054462816263295e-05, "epoch": 7.195412570747691, "percentage": 71.95, "elapsed_time": "3:20:59", "remaining_time": "1:18:20", "throughput": 2310.38, "total_tokens": 27861408} {"current_steps": 48315, "total_steps": 67140, "loss": 0.4868, "lr": 1.1049069501641567e-05, "epoch": 7.196157283288651, "percentage": 71.96, "elapsed_time": "3:21:00", "remaining_time": "1:18:19", "throughput": 2310.4, "total_tokens": 27864352} {"current_steps": 48320, "total_steps": 67140, "loss": 0.6128, "lr": 1.1043677129767002e-05, "epoch": 7.196901995829609, "percentage": 71.97, "elapsed_time": "3:21:01", "remaining_time": "1:18:17", "throughput": 2310.43, "total_tokens": 27867264} {"current_steps": 48325, "total_steps": 67140, "loss": 0.5911, "lr": 1.1038285701004003e-05, "epoch": 7.197646708370569, "percentage": 71.98, "elapsed_time": "3:21:02", "remaining_time": "1:18:16", "throughput": 2310.44, "total_tokens": 27869984} {"current_steps": 48330, "total_steps": 67140, "loss": 0.4814, "lr": 1.1032895215716881e-05, "epoch": 7.198391420911528, "percentage": 71.98, "elapsed_time": "3:21:03", "remaining_time": "1:18:15", "throughput": 2310.46, "total_tokens": 27872832} {"current_steps": 48335, "total_steps": 67140, "loss": 0.5209, "lr": 1.1027505674269916e-05, "epoch": 7.1991361334524875, "percentage": 71.99, "elapsed_time": "3:21:04", "remaining_time": "1:18:13", "throughput": 2310.48, "total_tokens": 27875744} {"current_steps": 48340, "total_steps": 67140, "loss": 0.8337, "lr": 1.102211707702731e-05, "epoch": 7.199880845993446, "percentage": 72.0, "elapsed_time": "3:21:06", "remaining_time": "1:18:12", "throughput": 2310.52, "total_tokens": 27878880} {"current_steps": 48345, "total_steps": 67140, "loss": 0.5124, "lr": 1.1016729424353212e-05, "epoch": 7.200625558534406, "percentage": 72.01, "elapsed_time": "3:21:07", "remaining_time": "1:18:11", "throughput": 2310.54, "total_tokens": 27881760} {"current_steps": 48350, "total_steps": 67140, "loss": 0.3849, "lr": 1.1011342716611678e-05, "epoch": 7.201370271075365, "percentage": 72.01, "elapsed_time": "3:21:08", "remaining_time": "1:18:10", "throughput": 2310.56, "total_tokens": 27884672} {"current_steps": 48355, "total_steps": 67140, "loss": 0.6155, "lr": 1.1005956954166729e-05, "epoch": 7.202114983616324, "percentage": 72.02, "elapsed_time": "3:21:09", "remaining_time": "1:18:08", "throughput": 2310.57, "total_tokens": 27887456} {"current_steps": 48360, "total_steps": 67140, "loss": 0.6346, "lr": 1.1000572137382314e-05, "epoch": 7.202859696157283, "percentage": 72.03, "elapsed_time": "3:21:10", "remaining_time": "1:18:07", "throughput": 2310.59, "total_tokens": 27890304} {"current_steps": 48365, "total_steps": 67140, "loss": 0.589, "lr": 1.0995188266622324e-05, "epoch": 7.203604408698243, "percentage": 72.04, "elapsed_time": "3:21:11", "remaining_time": "1:18:06", "throughput": 2310.63, "total_tokens": 27893472} {"current_steps": 48370, "total_steps": 67140, "loss": 0.7246, "lr": 1.0989805342250564e-05, "epoch": 7.2043491212392015, "percentage": 72.04, "elapsed_time": "3:21:12", "remaining_time": "1:18:04", "throughput": 2310.64, "total_tokens": 27896192} {"current_steps": 48375, "total_steps": 67140, "loss": 0.7803, "lr": 1.0984423364630796e-05, "epoch": 7.205093833780161, "percentage": 72.05, "elapsed_time": "3:21:14", "remaining_time": "1:18:03", "throughput": 2310.65, "total_tokens": 27898848} {"current_steps": 48380, "total_steps": 67140, "loss": 0.4602, "lr": 1.0979042334126724e-05, "epoch": 7.20583854632112, "percentage": 72.06, "elapsed_time": "3:21:15", "remaining_time": "1:18:02", "throughput": 2310.68, "total_tokens": 27901984} {"current_steps": 48385, "total_steps": 67140, "loss": 0.5741, "lr": 1.0973662251101957e-05, "epoch": 7.2065832588620795, "percentage": 72.07, "elapsed_time": "3:21:16", "remaining_time": "1:18:01", "throughput": 2310.69, "total_tokens": 27904640} {"current_steps": 48390, "total_steps": 67140, "loss": 0.5907, "lr": 1.0968283115920067e-05, "epoch": 7.207327971403038, "percentage": 72.07, "elapsed_time": "3:21:17", "remaining_time": "1:17:59", "throughput": 2310.7, "total_tokens": 27907232} {"current_steps": 48395, "total_steps": 67140, "loss": 0.498, "lr": 1.0962904928944556e-05, "epoch": 7.208072683943998, "percentage": 72.08, "elapsed_time": "3:21:18", "remaining_time": "1:17:58", "throughput": 2310.72, "total_tokens": 27910080} {"current_steps": 48400, "total_steps": 67140, "loss": 0.7021, "lr": 1.095752769053886e-05, "epoch": 7.208817396484957, "percentage": 72.09, "elapsed_time": "3:21:19", "remaining_time": "1:17:57", "throughput": 2310.74, "total_tokens": 27913024} {"current_steps": 48405, "total_steps": 67140, "loss": 0.6109, "lr": 1.0952151401066358e-05, "epoch": 7.209562109025916, "percentage": 72.1, "elapsed_time": "3:21:20", "remaining_time": "1:17:55", "throughput": 2310.75, "total_tokens": 27915616} {"current_steps": 48410, "total_steps": 67140, "loss": 0.8185, "lr": 1.0946776060890352e-05, "epoch": 7.210306821566875, "percentage": 72.1, "elapsed_time": "3:21:21", "remaining_time": "1:17:54", "throughput": 2310.77, "total_tokens": 27918432} {"current_steps": 48415, "total_steps": 67140, "loss": 0.6069, "lr": 1.0941401670374071e-05, "epoch": 7.211051534107835, "percentage": 72.11, "elapsed_time": "3:21:23", "remaining_time": "1:17:53", "throughput": 2310.78, "total_tokens": 27921184} {"current_steps": 48420, "total_steps": 67140, "loss": 0.5146, "lr": 1.093602822988071e-05, "epoch": 7.2117962466487935, "percentage": 72.12, "elapsed_time": "3:21:24", "remaining_time": "1:17:51", "throughput": 2310.8, "total_tokens": 27924000} {"current_steps": 48425, "total_steps": 67140, "loss": 0.5636, "lr": 1.0930655739773379e-05, "epoch": 7.212540959189753, "percentage": 72.13, "elapsed_time": "3:21:25", "remaining_time": "1:17:50", "throughput": 2310.83, "total_tokens": 27927104} {"current_steps": 48430, "total_steps": 67140, "loss": 0.5716, "lr": 1.0925284200415134e-05, "epoch": 7.213285671730712, "percentage": 72.13, "elapsed_time": "3:21:26", "remaining_time": "1:17:49", "throughput": 2310.84, "total_tokens": 27929728} {"current_steps": 48435, "total_steps": 67140, "loss": 0.6992, "lr": 1.0919913612168959e-05, "epoch": 7.2140303842716715, "percentage": 72.14, "elapsed_time": "3:21:27", "remaining_time": "1:17:48", "throughput": 2310.85, "total_tokens": 27932448} {"current_steps": 48440, "total_steps": 67140, "loss": 0.6993, "lr": 1.0914543975397785e-05, "epoch": 7.21477509681263, "percentage": 72.15, "elapsed_time": "3:21:28", "remaining_time": "1:17:46", "throughput": 2310.87, "total_tokens": 27935296} {"current_steps": 48445, "total_steps": 67140, "loss": 0.6614, "lr": 1.090917529046446e-05, "epoch": 7.21551980935359, "percentage": 72.16, "elapsed_time": "3:21:29", "remaining_time": "1:17:45", "throughput": 2310.89, "total_tokens": 27938240} {"current_steps": 48450, "total_steps": 67140, "loss": 0.4478, "lr": 1.0903807557731771e-05, "epoch": 7.216264521894549, "percentage": 72.16, "elapsed_time": "3:21:30", "remaining_time": "1:17:44", "throughput": 2310.91, "total_tokens": 27941088} {"current_steps": 48455, "total_steps": 67140, "loss": 0.5677, "lr": 1.0898440777562458e-05, "epoch": 7.217009234435508, "percentage": 72.17, "elapsed_time": "3:21:32", "remaining_time": "1:17:42", "throughput": 2310.93, "total_tokens": 27943936} {"current_steps": 48460, "total_steps": 67140, "loss": 0.391, "lr": 1.0893074950319182e-05, "epoch": 7.217753946976467, "percentage": 72.18, "elapsed_time": "3:21:33", "remaining_time": "1:17:41", "throughput": 2310.96, "total_tokens": 27946880} {"current_steps": 48465, "total_steps": 67140, "loss": 0.451, "lr": 1.0887710076364548e-05, "epoch": 7.218498659517426, "percentage": 72.18, "elapsed_time": "3:21:34", "remaining_time": "1:17:40", "throughput": 2310.97, "total_tokens": 27949600} {"current_steps": 48470, "total_steps": 67140, "loss": 0.8429, "lr": 1.088234615606109e-05, "epoch": 7.2192433720583855, "percentage": 72.19, "elapsed_time": "3:21:35", "remaining_time": "1:17:39", "throughput": 2310.99, "total_tokens": 27952480} {"current_steps": 48475, "total_steps": 67140, "loss": 0.6238, "lr": 1.0876983189771292e-05, "epoch": 7.219988084599344, "percentage": 72.2, "elapsed_time": "3:21:36", "remaining_time": "1:17:37", "throughput": 2311.0, "total_tokens": 27955232} {"current_steps": 48480, "total_steps": 67140, "loss": 0.6207, "lr": 1.0871621177857539e-05, "epoch": 7.220732797140304, "percentage": 72.21, "elapsed_time": "3:21:37", "remaining_time": "1:17:36", "throughput": 2311.01, "total_tokens": 27957952} {"current_steps": 48485, "total_steps": 67140, "loss": 0.5746, "lr": 1.0866260120682195e-05, "epoch": 7.221477509681263, "percentage": 72.21, "elapsed_time": "3:21:38", "remaining_time": "1:17:35", "throughput": 2311.03, "total_tokens": 27960704} {"current_steps": 48490, "total_steps": 67140, "loss": 0.6109, "lr": 1.0860900018607518e-05, "epoch": 7.222222222222222, "percentage": 72.22, "elapsed_time": "3:21:39", "remaining_time": "1:17:33", "throughput": 2311.05, "total_tokens": 27963552} {"current_steps": 48495, "total_steps": 67140, "loss": 0.6116, "lr": 1.0855540871995734e-05, "epoch": 7.222966934763181, "percentage": 72.23, "elapsed_time": "3:21:41", "remaining_time": "1:17:32", "throughput": 2311.07, "total_tokens": 27966464} {"current_steps": 48500, "total_steps": 67140, "loss": 0.5928, "lr": 1.085018268120899e-05, "epoch": 7.223711647304141, "percentage": 72.24, "elapsed_time": "3:21:42", "remaining_time": "1:17:31", "throughput": 2311.1, "total_tokens": 27969408} {"current_steps": 48505, "total_steps": 67140, "loss": 0.5799, "lr": 1.0844825446609368e-05, "epoch": 7.2244563598450995, "percentage": 72.24, "elapsed_time": "3:21:43", "remaining_time": "1:17:29", "throughput": 2311.12, "total_tokens": 27972288} {"current_steps": 48510, "total_steps": 67140, "loss": 0.5791, "lr": 1.0839469168558905e-05, "epoch": 7.225201072386059, "percentage": 72.25, "elapsed_time": "3:21:44", "remaining_time": "1:17:28", "throughput": 2311.15, "total_tokens": 27975296} {"current_steps": 48515, "total_steps": 67140, "loss": 0.6147, "lr": 1.0834113847419534e-05, "epoch": 7.225945784927018, "percentage": 72.26, "elapsed_time": "3:21:45", "remaining_time": "1:17:27", "throughput": 2311.17, "total_tokens": 27978176} {"current_steps": 48520, "total_steps": 67140, "loss": 0.5202, "lr": 1.0828759483553152e-05, "epoch": 7.2266904974679775, "percentage": 72.27, "elapsed_time": "3:21:46", "remaining_time": "1:17:26", "throughput": 2311.2, "total_tokens": 27981216} {"current_steps": 48525, "total_steps": 67140, "loss": 0.609, "lr": 1.082340607732159e-05, "epoch": 7.227435210008936, "percentage": 72.27, "elapsed_time": "3:21:47", "remaining_time": "1:17:24", "throughput": 2311.22, "total_tokens": 27984096} {"current_steps": 48530, "total_steps": 67140, "loss": 0.4941, "lr": 1.0818053629086617e-05, "epoch": 7.228179922549896, "percentage": 72.28, "elapsed_time": "3:21:49", "remaining_time": "1:17:23", "throughput": 2311.23, "total_tokens": 27986816} {"current_steps": 48535, "total_steps": 67140, "loss": 0.5164, "lr": 1.081270213920991e-05, "epoch": 7.228924635090855, "percentage": 72.29, "elapsed_time": "3:21:50", "remaining_time": "1:17:22", "throughput": 2311.25, "total_tokens": 27989632} {"current_steps": 48540, "total_steps": 67140, "loss": 0.5963, "lr": 1.0807351608053113e-05, "epoch": 7.229669347631814, "percentage": 72.3, "elapsed_time": "3:21:51", "remaining_time": "1:17:20", "throughput": 2311.27, "total_tokens": 27992512} {"current_steps": 48545, "total_steps": 67140, "loss": 0.614, "lr": 1.0802002035977799e-05, "epoch": 7.230414060172773, "percentage": 72.3, "elapsed_time": "3:21:52", "remaining_time": "1:17:19", "throughput": 2311.29, "total_tokens": 27995360} {"current_steps": 48550, "total_steps": 67140, "loss": 0.6305, "lr": 1.0796653423345452e-05, "epoch": 7.231158772713733, "percentage": 72.31, "elapsed_time": "3:21:53", "remaining_time": "1:17:18", "throughput": 2311.33, "total_tokens": 27998464} {"current_steps": 48555, "total_steps": 67140, "loss": 0.5168, "lr": 1.079130577051752e-05, "epoch": 7.2319034852546915, "percentage": 72.32, "elapsed_time": "3:21:54", "remaining_time": "1:17:17", "throughput": 2311.35, "total_tokens": 28001344} {"current_steps": 48560, "total_steps": 67140, "loss": 0.498, "lr": 1.0785959077855378e-05, "epoch": 7.232648197795651, "percentage": 72.33, "elapsed_time": "3:21:55", "remaining_time": "1:17:15", "throughput": 2311.37, "total_tokens": 28004224} {"current_steps": 48565, "total_steps": 67140, "loss": 0.5544, "lr": 1.0780613345720331e-05, "epoch": 7.23339291033661, "percentage": 72.33, "elapsed_time": "3:21:56", "remaining_time": "1:17:14", "throughput": 2311.38, "total_tokens": 28007008} {"current_steps": 48570, "total_steps": 67140, "loss": 0.5338, "lr": 1.077526857447363e-05, "epoch": 7.23413762287757, "percentage": 72.34, "elapsed_time": "3:21:58", "remaining_time": "1:17:13", "throughput": 2311.4, "total_tokens": 28009792} {"current_steps": 48575, "total_steps": 67140, "loss": 0.6372, "lr": 1.0769924764476446e-05, "epoch": 7.234882335418528, "percentage": 72.35, "elapsed_time": "3:21:59", "remaining_time": "1:17:11", "throughput": 2311.42, "total_tokens": 28012608} {"current_steps": 48580, "total_steps": 67140, "loss": 0.4677, "lr": 1.0764581916089883e-05, "epoch": 7.235627047959488, "percentage": 72.36, "elapsed_time": "3:22:00", "remaining_time": "1:17:10", "throughput": 2311.43, "total_tokens": 28015392} {"current_steps": 48585, "total_steps": 67140, "loss": 0.6498, "lr": 1.0759240029674994e-05, "epoch": 7.236371760500447, "percentage": 72.36, "elapsed_time": "3:22:01", "remaining_time": "1:17:09", "throughput": 2311.45, "total_tokens": 28018240} {"current_steps": 48590, "total_steps": 67140, "loss": 0.6464, "lr": 1.0753899105592768e-05, "epoch": 7.237116473041406, "percentage": 72.37, "elapsed_time": "3:22:02", "remaining_time": "1:17:08", "throughput": 2311.47, "total_tokens": 28021152} {"current_steps": 48595, "total_steps": 67140, "loss": 0.5172, "lr": 1.0748559144204117e-05, "epoch": 7.237861185582365, "percentage": 72.38, "elapsed_time": "3:22:03", "remaining_time": "1:17:06", "throughput": 2311.51, "total_tokens": 28024416} {"current_steps": 48600, "total_steps": 67140, "loss": 0.6592, "lr": 1.07432201458699e-05, "epoch": 7.238605898123325, "percentage": 72.39, "elapsed_time": "3:22:04", "remaining_time": "1:17:05", "throughput": 2311.54, "total_tokens": 28027360} {"current_steps": 48605, "total_steps": 67140, "loss": 0.5509, "lr": 1.0737882110950911e-05, "epoch": 7.2393506106642835, "percentage": 72.39, "elapsed_time": "3:22:06", "remaining_time": "1:17:04", "throughput": 2311.56, "total_tokens": 28030368} {"current_steps": 48610, "total_steps": 67140, "loss": 0.6623, "lr": 1.0732545039807862e-05, "epoch": 7.240095323205243, "percentage": 72.4, "elapsed_time": "3:22:07", "remaining_time": "1:17:02", "throughput": 2311.58, "total_tokens": 28033216} {"current_steps": 48615, "total_steps": 67140, "loss": 0.618, "lr": 1.0727208932801403e-05, "epoch": 7.240840035746202, "percentage": 72.41, "elapsed_time": "3:22:08", "remaining_time": "1:17:01", "throughput": 2311.61, "total_tokens": 28036096} {"current_steps": 48620, "total_steps": 67140, "loss": 0.4552, "lr": 1.0721873790292136e-05, "epoch": 7.241584748287162, "percentage": 72.42, "elapsed_time": "3:22:09", "remaining_time": "1:17:00", "throughput": 2311.62, "total_tokens": 28038816} {"current_steps": 48625, "total_steps": 67140, "loss": 0.6198, "lr": 1.0716539612640586e-05, "epoch": 7.24232946082812, "percentage": 72.42, "elapsed_time": "3:22:10", "remaining_time": "1:16:58", "throughput": 2311.64, "total_tokens": 28041632} {"current_steps": 48630, "total_steps": 67140, "loss": 0.6957, "lr": 1.071120640020722e-05, "epoch": 7.243074173369079, "percentage": 72.43, "elapsed_time": "3:22:11", "remaining_time": "1:16:57", "throughput": 2311.66, "total_tokens": 28044480} {"current_steps": 48635, "total_steps": 67140, "loss": 0.4895, "lr": 1.0705874153352428e-05, "epoch": 7.243818885910039, "percentage": 72.44, "elapsed_time": "3:22:12", "remaining_time": "1:16:56", "throughput": 2311.71, "total_tokens": 28047936} {"current_steps": 48640, "total_steps": 67140, "loss": 0.5729, "lr": 1.0700542872436557e-05, "epoch": 7.2445635984509975, "percentage": 72.45, "elapsed_time": "3:22:14", "remaining_time": "1:16:55", "throughput": 2311.73, "total_tokens": 28050944} {"current_steps": 48645, "total_steps": 67140, "loss": 0.4644, "lr": 1.0695212557819851e-05, "epoch": 7.245308310991957, "percentage": 72.45, "elapsed_time": "3:22:15", "remaining_time": "1:16:53", "throughput": 2311.78, "total_tokens": 28054240} {"current_steps": 48650, "total_steps": 67140, "loss": 0.4253, "lr": 1.0689883209862527e-05, "epoch": 7.246053023532916, "percentage": 72.46, "elapsed_time": "3:22:16", "remaining_time": "1:16:52", "throughput": 2311.8, "total_tokens": 28057088} {"current_steps": 48655, "total_steps": 67140, "loss": 0.7245, "lr": 1.0684554828924711e-05, "epoch": 7.246797736073876, "percentage": 72.47, "elapsed_time": "3:22:17", "remaining_time": "1:16:51", "throughput": 2311.83, "total_tokens": 28060256} {"current_steps": 48660, "total_steps": 67140, "loss": 0.4548, "lr": 1.0679227415366475e-05, "epoch": 7.247542448614834, "percentage": 72.48, "elapsed_time": "3:22:18", "remaining_time": "1:16:50", "throughput": 2311.86, "total_tokens": 28063264} {"current_steps": 48665, "total_steps": 67140, "loss": 0.4445, "lr": 1.0673900969547826e-05, "epoch": 7.248287161155794, "percentage": 72.48, "elapsed_time": "3:22:19", "remaining_time": "1:16:48", "throughput": 2311.89, "total_tokens": 28066240} {"current_steps": 48670, "total_steps": 67140, "loss": 0.4623, "lr": 1.0668575491828706e-05, "epoch": 7.249031873696753, "percentage": 72.49, "elapsed_time": "3:22:21", "remaining_time": "1:16:47", "throughput": 2311.9, "total_tokens": 28068992} {"current_steps": 48675, "total_steps": 67140, "loss": 0.5648, "lr": 1.0663250982568993e-05, "epoch": 7.249776586237712, "percentage": 72.5, "elapsed_time": "3:22:22", "remaining_time": "1:16:46", "throughput": 2311.92, "total_tokens": 28071872} {"current_steps": 48680, "total_steps": 67140, "loss": 0.5139, "lr": 1.0657927442128482e-05, "epoch": 7.250521298778671, "percentage": 72.51, "elapsed_time": "3:22:23", "remaining_time": "1:16:44", "throughput": 2311.95, "total_tokens": 28074944} {"current_steps": 48685, "total_steps": 67140, "loss": 0.4777, "lr": 1.0652604870866923e-05, "epoch": 7.251266011319631, "percentage": 72.51, "elapsed_time": "3:22:24", "remaining_time": "1:16:43", "throughput": 2311.97, "total_tokens": 28077824} {"current_steps": 48690, "total_steps": 67140, "loss": 0.5082, "lr": 1.0647283269144003e-05, "epoch": 7.2520107238605895, "percentage": 72.52, "elapsed_time": "3:22:25", "remaining_time": "1:16:42", "throughput": 2311.99, "total_tokens": 28080672} {"current_steps": 48695, "total_steps": 67140, "loss": 0.5488, "lr": 1.064196263731932e-05, "epoch": 7.252755436401549, "percentage": 72.53, "elapsed_time": "3:22:26", "remaining_time": "1:16:41", "throughput": 2312.01, "total_tokens": 28083520} {"current_steps": 48700, "total_steps": 67140, "loss": 0.7136, "lr": 1.0636642975752423e-05, "epoch": 7.253500148942508, "percentage": 72.54, "elapsed_time": "3:22:27", "remaining_time": "1:16:39", "throughput": 2312.03, "total_tokens": 28086464} {"current_steps": 48705, "total_steps": 67140, "loss": 0.6003, "lr": 1.0631324284802799e-05, "epoch": 7.254244861483468, "percentage": 72.54, "elapsed_time": "3:22:29", "remaining_time": "1:16:38", "throughput": 2312.08, "total_tokens": 28089824} {"current_steps": 48710, "total_steps": 67140, "loss": 0.6823, "lr": 1.0626006564829868e-05, "epoch": 7.254989574024426, "percentage": 72.55, "elapsed_time": "3:22:30", "remaining_time": "1:16:37", "throughput": 2312.08, "total_tokens": 28092384} {"current_steps": 48715, "total_steps": 67140, "loss": 0.7507, "lr": 1.0620689816192967e-05, "epoch": 7.255734286565386, "percentage": 72.56, "elapsed_time": "3:22:31", "remaining_time": "1:16:35", "throughput": 2312.1, "total_tokens": 28095136} {"current_steps": 48720, "total_steps": 67140, "loss": 0.4593, "lr": 1.0615374039251382e-05, "epoch": 7.256478999106345, "percentage": 72.56, "elapsed_time": "3:22:32", "remaining_time": "1:16:34", "throughput": 2312.12, "total_tokens": 28098080} {"current_steps": 48725, "total_steps": 67140, "loss": 0.6152, "lr": 1.061005923436434e-05, "epoch": 7.257223711647304, "percentage": 72.57, "elapsed_time": "3:22:33", "remaining_time": "1:16:33", "throughput": 2312.15, "total_tokens": 28101088} {"current_steps": 48730, "total_steps": 67140, "loss": 0.5432, "lr": 1.0604745401890997e-05, "epoch": 7.257968424188263, "percentage": 72.58, "elapsed_time": "3:22:34", "remaining_time": "1:16:32", "throughput": 2312.16, "total_tokens": 28103744} {"current_steps": 48735, "total_steps": 67140, "loss": 0.6104, "lr": 1.0599432542190424e-05, "epoch": 7.258713136729223, "percentage": 72.59, "elapsed_time": "3:22:35", "remaining_time": "1:16:30", "throughput": 2312.17, "total_tokens": 28106400} {"current_steps": 48740, "total_steps": 67140, "loss": 0.5638, "lr": 1.0594120655621659e-05, "epoch": 7.259457849270182, "percentage": 72.59, "elapsed_time": "3:22:37", "remaining_time": "1:16:29", "throughput": 2312.19, "total_tokens": 28109280} {"current_steps": 48745, "total_steps": 67140, "loss": 0.5517, "lr": 1.0588809742543643e-05, "epoch": 7.260202561811141, "percentage": 72.6, "elapsed_time": "3:22:38", "remaining_time": "1:16:28", "throughput": 2312.2, "total_tokens": 28111968} {"current_steps": 48750, "total_steps": 67140, "loss": 0.4761, "lr": 1.0583499803315271e-05, "epoch": 7.2609472743521, "percentage": 72.61, "elapsed_time": "3:22:39", "remaining_time": "1:16:26", "throughput": 2312.23, "total_tokens": 28115040} {"current_steps": 48755, "total_steps": 67140, "loss": 0.3946, "lr": 1.0578190838295371e-05, "epoch": 7.26169198689306, "percentage": 72.62, "elapsed_time": "3:22:40", "remaining_time": "1:16:25", "throughput": 2312.25, "total_tokens": 28118016} {"current_steps": 48760, "total_steps": 67140, "loss": 0.5555, "lr": 1.0572882847842696e-05, "epoch": 7.262436699434018, "percentage": 72.62, "elapsed_time": "3:22:41", "remaining_time": "1:16:24", "throughput": 2312.28, "total_tokens": 28120896} {"current_steps": 48765, "total_steps": 67140, "loss": 0.5742, "lr": 1.0567575832315947e-05, "epoch": 7.263181411974978, "percentage": 72.63, "elapsed_time": "3:22:42", "remaining_time": "1:16:22", "throughput": 2312.29, "total_tokens": 28123648} {"current_steps": 48770, "total_steps": 67140, "loss": 0.6815, "lr": 1.056226979207375e-05, "epoch": 7.263926124515937, "percentage": 72.64, "elapsed_time": "3:22:43", "remaining_time": "1:16:21", "throughput": 2312.32, "total_tokens": 28126720} {"current_steps": 48775, "total_steps": 67140, "loss": 0.4423, "lr": 1.0556964727474664e-05, "epoch": 7.264670837056896, "percentage": 72.65, "elapsed_time": "3:22:45", "remaining_time": "1:16:20", "throughput": 2312.34, "total_tokens": 28129664} {"current_steps": 48780, "total_steps": 67140, "loss": 0.7016, "lr": 1.055166063887717e-05, "epoch": 7.265415549597855, "percentage": 72.65, "elapsed_time": "3:22:46", "remaining_time": "1:16:19", "throughput": 2312.38, "total_tokens": 28132768} {"current_steps": 48785, "total_steps": 67140, "loss": 0.5427, "lr": 1.0546357526639705e-05, "epoch": 7.266160262138815, "percentage": 72.66, "elapsed_time": "3:22:47", "remaining_time": "1:16:17", "throughput": 2312.43, "total_tokens": 28136352} {"current_steps": 48790, "total_steps": 67140, "loss": 0.4479, "lr": 1.0541055391120638e-05, "epoch": 7.266904974679774, "percentage": 72.67, "elapsed_time": "3:22:48", "remaining_time": "1:16:16", "throughput": 2312.46, "total_tokens": 28139232} {"current_steps": 48795, "total_steps": 67140, "loss": 0.5915, "lr": 1.053575423267826e-05, "epoch": 7.267649687220732, "percentage": 72.68, "elapsed_time": "3:22:49", "remaining_time": "1:16:15", "throughput": 2312.47, "total_tokens": 28141984} {"current_steps": 48800, "total_steps": 67140, "loss": 0.4553, "lr": 1.0530454051670805e-05, "epoch": 7.268394399761692, "percentage": 72.68, "elapsed_time": "3:22:50", "remaining_time": "1:16:14", "throughput": 2312.49, "total_tokens": 28144768} {"current_steps": 48805, "total_steps": 67140, "loss": 0.8078, "lr": 1.0525154848456442e-05, "epoch": 7.269139112302652, "percentage": 72.69, "elapsed_time": "3:22:51", "remaining_time": "1:16:12", "throughput": 2312.5, "total_tokens": 28147552} {"current_steps": 48810, "total_steps": 67140, "loss": 0.6139, "lr": 1.0519856623393268e-05, "epoch": 7.26988382484361, "percentage": 72.7, "elapsed_time": "3:22:53", "remaining_time": "1:16:11", "throughput": 2312.5, "total_tokens": 28150144} {"current_steps": 48815, "total_steps": 67140, "loss": 0.7577, "lr": 1.05145593768393e-05, "epoch": 7.270628537384569, "percentage": 72.71, "elapsed_time": "3:22:54", "remaining_time": "1:16:10", "throughput": 2312.53, "total_tokens": 28153088} {"current_steps": 48820, "total_steps": 67140, "loss": 0.4904, "lr": 1.0509263109152518e-05, "epoch": 7.271373249925529, "percentage": 72.71, "elapsed_time": "3:22:55", "remaining_time": "1:16:08", "throughput": 2312.56, "total_tokens": 28156096} {"current_steps": 48825, "total_steps": 67140, "loss": 0.645, "lr": 1.0503967820690817e-05, "epoch": 7.272117962466488, "percentage": 72.72, "elapsed_time": "3:22:56", "remaining_time": "1:16:07", "throughput": 2312.58, "total_tokens": 28159008} {"current_steps": 48830, "total_steps": 67140, "loss": 0.5725, "lr": 1.0498673511812035e-05, "epoch": 7.272862675007447, "percentage": 72.73, "elapsed_time": "3:22:57", "remaining_time": "1:16:06", "throughput": 2312.61, "total_tokens": 28161984} {"current_steps": 48835, "total_steps": 67140, "loss": 0.6437, "lr": 1.0493380182873941e-05, "epoch": 7.273607387548406, "percentage": 72.74, "elapsed_time": "3:22:58", "remaining_time": "1:16:04", "throughput": 2312.62, "total_tokens": 28164672} {"current_steps": 48840, "total_steps": 67140, "loss": 0.6739, "lr": 1.0488087834234242e-05, "epoch": 7.274352100089366, "percentage": 72.74, "elapsed_time": "3:22:59", "remaining_time": "1:16:03", "throughput": 2312.63, "total_tokens": 28167424} {"current_steps": 48845, "total_steps": 67140, "loss": 0.5679, "lr": 1.0482796466250554e-05, "epoch": 7.275096812630324, "percentage": 72.75, "elapsed_time": "3:23:00", "remaining_time": "1:16:02", "throughput": 2312.66, "total_tokens": 28170400} {"current_steps": 48850, "total_steps": 67140, "loss": 0.5251, "lr": 1.0477506079280472e-05, "epoch": 7.275841525171284, "percentage": 72.76, "elapsed_time": "3:23:02", "remaining_time": "1:16:01", "throughput": 2312.71, "total_tokens": 28173824} {"current_steps": 48855, "total_steps": 67140, "loss": 0.4671, "lr": 1.0472216673681476e-05, "epoch": 7.276586237712243, "percentage": 72.77, "elapsed_time": "3:23:03", "remaining_time": "1:15:59", "throughput": 2312.72, "total_tokens": 28176416} {"current_steps": 48860, "total_steps": 67140, "loss": 0.6552, "lr": 1.0466928249811009e-05, "epoch": 7.277330950253202, "percentage": 72.77, "elapsed_time": "3:23:04", "remaining_time": "1:15:58", "throughput": 2312.75, "total_tokens": 28179424} {"current_steps": 48865, "total_steps": 67140, "loss": 0.5292, "lr": 1.0461640808026444e-05, "epoch": 7.278075662794161, "percentage": 72.78, "elapsed_time": "3:23:05", "remaining_time": "1:15:57", "throughput": 2312.77, "total_tokens": 28182368} {"current_steps": 48870, "total_steps": 67140, "loss": 0.5971, "lr": 1.0456354348685085e-05, "epoch": 7.278820375335121, "percentage": 72.79, "elapsed_time": "3:23:06", "remaining_time": "1:15:55", "throughput": 2312.81, "total_tokens": 28185504} {"current_steps": 48875, "total_steps": 67140, "loss": 0.5955, "lr": 1.0451068872144179e-05, "epoch": 7.27956508787608, "percentage": 72.8, "elapsed_time": "3:23:07", "remaining_time": "1:15:54", "throughput": 2312.82, "total_tokens": 28188256} {"current_steps": 48880, "total_steps": 67140, "loss": 0.7898, "lr": 1.0445784378760876e-05, "epoch": 7.280309800417039, "percentage": 72.8, "elapsed_time": "3:23:08", "remaining_time": "1:15:53", "throughput": 2312.85, "total_tokens": 28191200} {"current_steps": 48885, "total_steps": 67140, "loss": 0.4693, "lr": 1.0440500868892294e-05, "epoch": 7.281054512957998, "percentage": 72.81, "elapsed_time": "3:23:10", "remaining_time": "1:15:52", "throughput": 2312.87, "total_tokens": 28194144} {"current_steps": 48890, "total_steps": 67140, "loss": 0.6992, "lr": 1.0435218342895475e-05, "epoch": 7.281799225498958, "percentage": 72.82, "elapsed_time": "3:23:11", "remaining_time": "1:15:50", "throughput": 2312.88, "total_tokens": 28196768} {"current_steps": 48895, "total_steps": 67140, "loss": 0.7536, "lr": 1.0429936801127377e-05, "epoch": 7.282543938039916, "percentage": 72.83, "elapsed_time": "3:23:12", "remaining_time": "1:15:49", "throughput": 2312.91, "total_tokens": 28199776} {"current_steps": 48900, "total_steps": 67140, "loss": 0.566, "lr": 1.0424656243944913e-05, "epoch": 7.283288650580876, "percentage": 72.83, "elapsed_time": "3:23:13", "remaining_time": "1:15:48", "throughput": 2312.92, "total_tokens": 28202560} {"current_steps": 48905, "total_steps": 67140, "loss": 0.781, "lr": 1.0419376671704928e-05, "epoch": 7.284033363121835, "percentage": 72.84, "elapsed_time": "3:23:14", "remaining_time": "1:15:46", "throughput": 2312.95, "total_tokens": 28205632} {"current_steps": 48910, "total_steps": 67140, "loss": 0.5349, "lr": 1.0414098084764178e-05, "epoch": 7.2847780756627944, "percentage": 72.85, "elapsed_time": "3:23:15", "remaining_time": "1:15:45", "throughput": 2312.96, "total_tokens": 28208320} {"current_steps": 48915, "total_steps": 67140, "loss": 0.498, "lr": 1.0408820483479382e-05, "epoch": 7.285522788203753, "percentage": 72.86, "elapsed_time": "3:23:16", "remaining_time": "1:15:44", "throughput": 2313.0, "total_tokens": 28211584} {"current_steps": 48920, "total_steps": 67140, "loss": 0.4459, "lr": 1.0403543868207169e-05, "epoch": 7.286267500744713, "percentage": 72.86, "elapsed_time": "3:23:18", "remaining_time": "1:15:43", "throughput": 2313.03, "total_tokens": 28214688} {"current_steps": 48925, "total_steps": 67140, "loss": 0.6002, "lr": 1.0398268239304118e-05, "epoch": 7.287012213285672, "percentage": 72.87, "elapsed_time": "3:23:19", "remaining_time": "1:15:41", "throughput": 2313.05, "total_tokens": 28217440} {"current_steps": 48930, "total_steps": 67140, "loss": 0.5919, "lr": 1.0392993597126743e-05, "epoch": 7.287756925826631, "percentage": 72.88, "elapsed_time": "3:23:20", "remaining_time": "1:15:40", "throughput": 2313.07, "total_tokens": 28220384} {"current_steps": 48935, "total_steps": 67140, "loss": 0.6672, "lr": 1.0387719942031462e-05, "epoch": 7.28850163836759, "percentage": 72.89, "elapsed_time": "3:23:21", "remaining_time": "1:15:39", "throughput": 2313.08, "total_tokens": 28223040} {"current_steps": 48940, "total_steps": 67140, "loss": 0.2418, "lr": 1.0382447274374667e-05, "epoch": 7.28924635090855, "percentage": 72.89, "elapsed_time": "3:23:22", "remaining_time": "1:15:37", "throughput": 2313.09, "total_tokens": 28225632} {"current_steps": 48945, "total_steps": 67140, "loss": 0.5681, "lr": 1.037717559451265e-05, "epoch": 7.289991063449508, "percentage": 72.9, "elapsed_time": "3:23:23", "remaining_time": "1:15:36", "throughput": 2313.11, "total_tokens": 28228640} {"current_steps": 48950, "total_steps": 67140, "loss": 0.5255, "lr": 1.0371904902801651e-05, "epoch": 7.290735775990468, "percentage": 72.91, "elapsed_time": "3:23:24", "remaining_time": "1:15:35", "throughput": 2313.13, "total_tokens": 28231520} {"current_steps": 48955, "total_steps": 67140, "loss": 0.5496, "lr": 1.0366635199597846e-05, "epoch": 7.291480488531427, "percentage": 72.91, "elapsed_time": "3:23:26", "remaining_time": "1:15:34", "throughput": 2313.16, "total_tokens": 28234496} {"current_steps": 48960, "total_steps": 67140, "loss": 0.6925, "lr": 1.0361366485257338e-05, "epoch": 7.292225201072386, "percentage": 72.92, "elapsed_time": "3:23:27", "remaining_time": "1:15:32", "throughput": 2313.19, "total_tokens": 28237568} {"current_steps": 48965, "total_steps": 67140, "loss": 0.6338, "lr": 1.0356098760136168e-05, "epoch": 7.292969913613345, "percentage": 72.93, "elapsed_time": "3:23:28", "remaining_time": "1:15:31", "throughput": 2313.22, "total_tokens": 28240640} {"current_steps": 48970, "total_steps": 67140, "loss": 0.6104, "lr": 1.0350832024590312e-05, "epoch": 7.293714626154305, "percentage": 72.94, "elapsed_time": "3:23:29", "remaining_time": "1:15:30", "throughput": 2313.25, "total_tokens": 28243616} {"current_steps": 48975, "total_steps": 67140, "loss": 0.4212, "lr": 1.0345566278975671e-05, "epoch": 7.294459338695264, "percentage": 72.94, "elapsed_time": "3:23:30", "remaining_time": "1:15:28", "throughput": 2313.29, "total_tokens": 28246848} {"current_steps": 48980, "total_steps": 67140, "loss": 0.5271, "lr": 1.0340301523648071e-05, "epoch": 7.295204051236222, "percentage": 72.95, "elapsed_time": "3:23:31", "remaining_time": "1:15:27", "throughput": 2313.3, "total_tokens": 28249600} {"current_steps": 48985, "total_steps": 67140, "loss": 0.4386, "lr": 1.0335037758963296e-05, "epoch": 7.295948763777182, "percentage": 72.96, "elapsed_time": "3:23:32", "remaining_time": "1:15:26", "throughput": 2313.32, "total_tokens": 28252448} {"current_steps": 48990, "total_steps": 67140, "loss": 0.5265, "lr": 1.0329774985277042e-05, "epoch": 7.296693476318141, "percentage": 72.97, "elapsed_time": "3:23:34", "remaining_time": "1:15:25", "throughput": 2313.36, "total_tokens": 28255616} {"current_steps": 48995, "total_steps": 67140, "loss": 0.5238, "lr": 1.0324513202944947e-05, "epoch": 7.2974381888591004, "percentage": 72.97, "elapsed_time": "3:23:35", "remaining_time": "1:15:23", "throughput": 2313.39, "total_tokens": 28258720} {"current_steps": 49000, "total_steps": 67140, "loss": 0.7234, "lr": 1.0319252412322586e-05, "epoch": 7.298182901400059, "percentage": 72.98, "elapsed_time": "3:23:36", "remaining_time": "1:15:22", "throughput": 2313.43, "total_tokens": 28262016} {"current_steps": 49005, "total_steps": 67140, "loss": 0.5698, "lr": 1.0313992613765469e-05, "epoch": 7.298927613941019, "percentage": 72.99, "elapsed_time": "3:23:37", "remaining_time": "1:15:21", "throughput": 2313.44, "total_tokens": 28264832} {"current_steps": 49010, "total_steps": 67140, "loss": 0.5396, "lr": 1.0308733807629022e-05, "epoch": 7.299672326481978, "percentage": 73.0, "elapsed_time": "3:23:38", "remaining_time": "1:15:20", "throughput": 2313.45, "total_tokens": 28267488} {"current_steps": 49015, "total_steps": 67140, "loss": 0.6935, "lr": 1.0303475994268606e-05, "epoch": 7.300417039022937, "percentage": 73.0, "elapsed_time": "3:23:39", "remaining_time": "1:15:18", "throughput": 2313.47, "total_tokens": 28270432} {"current_steps": 49020, "total_steps": 67140, "loss": 0.662, "lr": 1.029821917403953e-05, "epoch": 7.301161751563896, "percentage": 73.01, "elapsed_time": "3:23:41", "remaining_time": "1:15:17", "throughput": 2313.49, "total_tokens": 28273280} {"current_steps": 49025, "total_steps": 67140, "loss": 0.6163, "lr": 1.0292963347297027e-05, "epoch": 7.301906464104856, "percentage": 73.02, "elapsed_time": "3:23:42", "remaining_time": "1:15:16", "throughput": 2313.52, "total_tokens": 28276352} {"current_steps": 49030, "total_steps": 67140, "loss": 0.7067, "lr": 1.0287708514396268e-05, "epoch": 7.302651176645814, "percentage": 73.03, "elapsed_time": "3:23:43", "remaining_time": "1:15:14", "throughput": 2313.55, "total_tokens": 28279360} {"current_steps": 49035, "total_steps": 67140, "loss": 0.5038, "lr": 1.0282454675692354e-05, "epoch": 7.303395889186774, "percentage": 73.03, "elapsed_time": "3:23:44", "remaining_time": "1:15:13", "throughput": 2313.57, "total_tokens": 28282176} {"current_steps": 49040, "total_steps": 67140, "loss": 0.5562, "lr": 1.0277201831540323e-05, "epoch": 7.304140601727733, "percentage": 73.04, "elapsed_time": "3:23:45", "remaining_time": "1:15:12", "throughput": 2313.6, "total_tokens": 28285248} {"current_steps": 49045, "total_steps": 67140, "loss": 0.5182, "lr": 1.0271949982295123e-05, "epoch": 7.3048853142686925, "percentage": 73.05, "elapsed_time": "3:23:46", "remaining_time": "1:15:11", "throughput": 2313.61, "total_tokens": 28288032} {"current_steps": 49050, "total_steps": 67140, "loss": 0.5829, "lr": 1.0266699128311675e-05, "epoch": 7.305630026809651, "percentage": 73.06, "elapsed_time": "3:23:47", "remaining_time": "1:15:09", "throughput": 2313.64, "total_tokens": 28291072} {"current_steps": 49055, "total_steps": 67140, "loss": 0.3684, "lr": 1.0261449269944786e-05, "epoch": 7.306374739350611, "percentage": 73.06, "elapsed_time": "3:23:49", "remaining_time": "1:15:08", "throughput": 2313.66, "total_tokens": 28293856} {"current_steps": 49060, "total_steps": 67140, "loss": 0.503, "lr": 1.0256200407549239e-05, "epoch": 7.30711945189157, "percentage": 73.07, "elapsed_time": "3:23:50", "remaining_time": "1:15:07", "throughput": 2313.67, "total_tokens": 28296608} {"current_steps": 49065, "total_steps": 67140, "loss": 0.5796, "lr": 1.0250952541479719e-05, "epoch": 7.307864164432529, "percentage": 73.08, "elapsed_time": "3:23:51", "remaining_time": "1:15:05", "throughput": 2313.68, "total_tokens": 28299264} {"current_steps": 49070, "total_steps": 67140, "loss": 0.7759, "lr": 1.0245705672090872e-05, "epoch": 7.308608876973488, "percentage": 73.09, "elapsed_time": "3:23:52", "remaining_time": "1:15:04", "throughput": 2313.71, "total_tokens": 28302304} {"current_steps": 49075, "total_steps": 67140, "loss": 0.5656, "lr": 1.024045979973724e-05, "epoch": 7.309353589514448, "percentage": 73.09, "elapsed_time": "3:23:53", "remaining_time": "1:15:03", "throughput": 2313.72, "total_tokens": 28305024} {"current_steps": 49080, "total_steps": 67140, "loss": 0.5954, "lr": 1.0235214924773326e-05, "epoch": 7.3100983020554064, "percentage": 73.1, "elapsed_time": "3:23:54", "remaining_time": "1:15:02", "throughput": 2313.74, "total_tokens": 28307904} {"current_steps": 49085, "total_steps": 67140, "loss": 0.4362, "lr": 1.0229971047553557e-05, "epoch": 7.310843014596366, "percentage": 73.11, "elapsed_time": "3:23:55", "remaining_time": "1:15:00", "throughput": 2313.77, "total_tokens": 28310880} {"current_steps": 49090, "total_steps": 67140, "loss": 0.625, "lr": 1.0224728168432307e-05, "epoch": 7.311587727137325, "percentage": 73.12, "elapsed_time": "3:23:57", "remaining_time": "1:14:59", "throughput": 2313.81, "total_tokens": 28314112} {"current_steps": 49095, "total_steps": 67140, "loss": 0.5074, "lr": 1.0219486287763844e-05, "epoch": 7.3123324396782845, "percentage": 73.12, "elapsed_time": "3:23:58", "remaining_time": "1:14:58", "throughput": 2313.84, "total_tokens": 28317088} {"current_steps": 49100, "total_steps": 67140, "loss": 0.5877, "lr": 1.0214245405902406e-05, "epoch": 7.313077152219243, "percentage": 73.13, "elapsed_time": "3:23:59", "remaining_time": "1:14:56", "throughput": 2313.85, "total_tokens": 28319872} {"current_steps": 49105, "total_steps": 67140, "loss": 0.715, "lr": 1.0209005523202155e-05, "epoch": 7.313821864760203, "percentage": 73.14, "elapsed_time": "3:24:00", "remaining_time": "1:14:55", "throughput": 2313.87, "total_tokens": 28322784} {"current_steps": 49110, "total_steps": 67140, "loss": 0.653, "lr": 1.0203766640017167e-05, "epoch": 7.314566577301162, "percentage": 73.15, "elapsed_time": "3:24:01", "remaining_time": "1:14:54", "throughput": 2313.89, "total_tokens": 28325536} {"current_steps": 49115, "total_steps": 67140, "loss": 0.6899, "lr": 1.0198528756701475e-05, "epoch": 7.315311289842121, "percentage": 73.15, "elapsed_time": "3:24:02", "remaining_time": "1:14:53", "throughput": 2313.9, "total_tokens": 28328224} {"current_steps": 49120, "total_steps": 67140, "loss": 0.688, "lr": 1.019329187360903e-05, "epoch": 7.31605600238308, "percentage": 73.16, "elapsed_time": "3:24:03", "remaining_time": "1:14:51", "throughput": 2313.93, "total_tokens": 28331328} {"current_steps": 49125, "total_steps": 67140, "loss": 0.5729, "lr": 1.0188055991093717e-05, "epoch": 7.31680071492404, "percentage": 73.17, "elapsed_time": "3:24:04", "remaining_time": "1:14:50", "throughput": 2313.94, "total_tokens": 28334048} {"current_steps": 49130, "total_steps": 67140, "loss": 0.5789, "lr": 1.0182821109509364e-05, "epoch": 7.3175454274649985, "percentage": 73.18, "elapsed_time": "3:24:06", "remaining_time": "1:14:49", "throughput": 2313.98, "total_tokens": 28337152} {"current_steps": 49135, "total_steps": 67140, "loss": 0.6808, "lr": 1.0177587229209726e-05, "epoch": 7.318290140005958, "percentage": 73.18, "elapsed_time": "3:24:07", "remaining_time": "1:14:47", "throughput": 2313.98, "total_tokens": 28339776} {"current_steps": 49140, "total_steps": 67140, "loss": 0.4709, "lr": 1.0172354350548477e-05, "epoch": 7.319034852546917, "percentage": 73.19, "elapsed_time": "3:24:08", "remaining_time": "1:14:46", "throughput": 2314.02, "total_tokens": 28342848} {"current_steps": 49145, "total_steps": 67140, "loss": 0.6485, "lr": 1.0167122473879228e-05, "epoch": 7.319779565087876, "percentage": 73.2, "elapsed_time": "3:24:09", "remaining_time": "1:14:45", "throughput": 2314.05, "total_tokens": 28345920} {"current_steps": 49150, "total_steps": 67140, "loss": 0.565, "lr": 1.0161891599555536e-05, "epoch": 7.320524277628835, "percentage": 73.21, "elapsed_time": "3:24:10", "remaining_time": "1:14:44", "throughput": 2314.08, "total_tokens": 28348960} {"current_steps": 49155, "total_steps": 67140, "loss": 0.6475, "lr": 1.0156661727930886e-05, "epoch": 7.321268990169794, "percentage": 73.21, "elapsed_time": "3:24:11", "remaining_time": "1:14:42", "throughput": 2314.1, "total_tokens": 28351776} {"current_steps": 49160, "total_steps": 67140, "loss": 0.5768, "lr": 1.0151432859358684e-05, "epoch": 7.322013702710754, "percentage": 73.22, "elapsed_time": "3:24:12", "remaining_time": "1:14:41", "throughput": 2314.11, "total_tokens": 28354496} {"current_steps": 49165, "total_steps": 67140, "loss": 0.4679, "lr": 1.0146204994192283e-05, "epoch": 7.3227584152517124, "percentage": 73.23, "elapsed_time": "3:24:14", "remaining_time": "1:14:40", "throughput": 2314.14, "total_tokens": 28357472} {"current_steps": 49170, "total_steps": 67140, "loss": 0.7977, "lr": 1.0140978132784962e-05, "epoch": 7.323503127792672, "percentage": 73.24, "elapsed_time": "3:24:15", "remaining_time": "1:14:38", "throughput": 2314.17, "total_tokens": 28360640} {"current_steps": 49175, "total_steps": 67140, "loss": 0.514, "lr": 1.013575227548993e-05, "epoch": 7.324247840333631, "percentage": 73.24, "elapsed_time": "3:24:16", "remaining_time": "1:14:37", "throughput": 2314.19, "total_tokens": 28363552} {"current_steps": 49180, "total_steps": 67140, "loss": 0.6019, "lr": 1.0130527422660313e-05, "epoch": 7.3249925528745905, "percentage": 73.25, "elapsed_time": "3:24:17", "remaining_time": "1:14:36", "throughput": 2314.21, "total_tokens": 28366432} {"current_steps": 49185, "total_steps": 67140, "loss": 0.5309, "lr": 1.01253035746492e-05, "epoch": 7.325737265415549, "percentage": 73.26, "elapsed_time": "3:24:18", "remaining_time": "1:14:35", "throughput": 2314.24, "total_tokens": 28369408} {"current_steps": 49190, "total_steps": 67140, "loss": 0.6912, "lr": 1.0120080731809595e-05, "epoch": 7.326481977956509, "percentage": 73.26, "elapsed_time": "3:24:19", "remaining_time": "1:14:33", "throughput": 2314.27, "total_tokens": 28372416} {"current_steps": 49195, "total_steps": 67140, "loss": 0.5626, "lr": 1.0114858894494437e-05, "epoch": 7.327226690497468, "percentage": 73.27, "elapsed_time": "3:24:20", "remaining_time": "1:14:32", "throughput": 2314.29, "total_tokens": 28375360} {"current_steps": 49200, "total_steps": 67140, "loss": 0.706, "lr": 1.0109638063056595e-05, "epoch": 7.327971403038427, "percentage": 73.28, "elapsed_time": "3:24:22", "remaining_time": "1:14:31", "throughput": 2314.31, "total_tokens": 28378272} {"current_steps": 49205, "total_steps": 67140, "loss": 0.6185, "lr": 1.0104418237848883e-05, "epoch": 7.328716115579386, "percentage": 73.29, "elapsed_time": "3:24:23", "remaining_time": "1:14:29", "throughput": 2314.32, "total_tokens": 28380992} {"current_steps": 49210, "total_steps": 67140, "loss": 0.6297, "lr": 1.0099199419224018e-05, "epoch": 7.329460828120346, "percentage": 73.29, "elapsed_time": "3:24:24", "remaining_time": "1:14:28", "throughput": 2314.33, "total_tokens": 28383712} {"current_steps": 49215, "total_steps": 67140, "loss": 0.4725, "lr": 1.0093981607534683e-05, "epoch": 7.3302055406613045, "percentage": 73.3, "elapsed_time": "3:24:25", "remaining_time": "1:14:27", "throughput": 2314.35, "total_tokens": 28386496} {"current_steps": 49220, "total_steps": 67140, "loss": 0.567, "lr": 1.0088764803133454e-05, "epoch": 7.330950253202264, "percentage": 73.31, "elapsed_time": "3:24:26", "remaining_time": "1:14:25", "throughput": 2314.36, "total_tokens": 28389184} {"current_steps": 49225, "total_steps": 67140, "loss": 0.6352, "lr": 1.0083549006372881e-05, "epoch": 7.331694965743223, "percentage": 73.32, "elapsed_time": "3:24:27", "remaining_time": "1:14:24", "throughput": 2314.38, "total_tokens": 28391904} {"current_steps": 49230, "total_steps": 67140, "loss": 0.4303, "lr": 1.0078334217605418e-05, "epoch": 7.3324396782841825, "percentage": 73.32, "elapsed_time": "3:24:28", "remaining_time": "1:14:23", "throughput": 2314.39, "total_tokens": 28394720} {"current_steps": 49235, "total_steps": 67140, "loss": 0.4528, "lr": 1.007312043718347e-05, "epoch": 7.333184390825141, "percentage": 73.33, "elapsed_time": "3:24:29", "remaining_time": "1:14:22", "throughput": 2314.4, "total_tokens": 28397408} {"current_steps": 49240, "total_steps": 67140, "loss": 0.535, "lr": 1.0067907665459344e-05, "epoch": 7.333929103366101, "percentage": 73.34, "elapsed_time": "3:24:30", "remaining_time": "1:14:20", "throughput": 2314.42, "total_tokens": 28400192} {"current_steps": 49245, "total_steps": 67140, "loss": 0.8342, "lr": 1.006269590278531e-05, "epoch": 7.33467381590706, "percentage": 73.35, "elapsed_time": "3:24:32", "remaining_time": "1:14:19", "throughput": 2314.44, "total_tokens": 28403040} {"current_steps": 49250, "total_steps": 67140, "loss": 0.5306, "lr": 1.0057485149513557e-05, "epoch": 7.335418528448019, "percentage": 73.35, "elapsed_time": "3:24:33", "remaining_time": "1:14:18", "throughput": 2314.45, "total_tokens": 28405792} {"current_steps": 49255, "total_steps": 67140, "loss": 0.7045, "lr": 1.0052275405996214e-05, "epoch": 7.336163240988978, "percentage": 73.36, "elapsed_time": "3:24:34", "remaining_time": "1:14:16", "throughput": 2314.49, "total_tokens": 28408992} {"current_steps": 49260, "total_steps": 67140, "loss": 0.7897, "lr": 1.0047066672585317e-05, "epoch": 7.336907953529938, "percentage": 73.37, "elapsed_time": "3:24:35", "remaining_time": "1:14:15", "throughput": 2314.52, "total_tokens": 28411936} {"current_steps": 49265, "total_steps": 67140, "loss": 0.4985, "lr": 1.004185894963286e-05, "epoch": 7.3376526660708965, "percentage": 73.38, "elapsed_time": "3:24:36", "remaining_time": "1:14:14", "throughput": 2314.54, "total_tokens": 28414848} {"current_steps": 49270, "total_steps": 67140, "loss": 0.5536, "lr": 1.0036652237490768e-05, "epoch": 7.338397378611856, "percentage": 73.38, "elapsed_time": "3:24:37", "remaining_time": "1:14:13", "throughput": 2314.56, "total_tokens": 28417728} {"current_steps": 49275, "total_steps": 67140, "loss": 0.7974, "lr": 1.0031446536510875e-05, "epoch": 7.339142091152815, "percentage": 73.39, "elapsed_time": "3:24:38", "remaining_time": "1:14:11", "throughput": 2314.59, "total_tokens": 28420768} {"current_steps": 49280, "total_steps": 67140, "loss": 0.4627, "lr": 1.0026241847044964e-05, "epoch": 7.3398868036937746, "percentage": 73.4, "elapsed_time": "3:24:40", "remaining_time": "1:14:10", "throughput": 2314.62, "total_tokens": 28423808} {"current_steps": 49285, "total_steps": 67140, "loss": 0.5556, "lr": 1.0021038169444752e-05, "epoch": 7.340631516234733, "percentage": 73.41, "elapsed_time": "3:24:41", "remaining_time": "1:14:09", "throughput": 2314.63, "total_tokens": 28426560} {"current_steps": 49290, "total_steps": 67140, "loss": 0.7696, "lr": 1.0015835504061879e-05, "epoch": 7.341376228775693, "percentage": 73.41, "elapsed_time": "3:24:42", "remaining_time": "1:14:07", "throughput": 2314.64, "total_tokens": 28429184} {"current_steps": 49295, "total_steps": 67140, "loss": 0.6938, "lr": 1.0010633851247933e-05, "epoch": 7.342120941316652, "percentage": 73.42, "elapsed_time": "3:24:43", "remaining_time": "1:14:06", "throughput": 2314.65, "total_tokens": 28431808} {"current_steps": 49300, "total_steps": 67140, "loss": 0.5892, "lr": 1.0005433211354398e-05, "epoch": 7.342865653857611, "percentage": 73.43, "elapsed_time": "3:24:44", "remaining_time": "1:14:05", "throughput": 2314.66, "total_tokens": 28434624} {"current_steps": 49305, "total_steps": 67140, "loss": 0.7125, "lr": 1.0000233584732732e-05, "epoch": 7.34361036639857, "percentage": 73.44, "elapsed_time": "3:24:45", "remaining_time": "1:14:04", "throughput": 2314.67, "total_tokens": 28437344} {"current_steps": 49310, "total_steps": 67140, "loss": 0.651, "lr": 9.995034971734288e-06, "epoch": 7.344355078939529, "percentage": 73.44, "elapsed_time": "3:24:46", "remaining_time": "1:14:02", "throughput": 2314.69, "total_tokens": 28440224} {"current_steps": 49315, "total_steps": 67140, "loss": 0.6227, "lr": 9.989837372710374e-06, "epoch": 7.3450997914804885, "percentage": 73.45, "elapsed_time": "3:24:47", "remaining_time": "1:14:01", "throughput": 2314.71, "total_tokens": 28443008} {"current_steps": 49320, "total_steps": 67140, "loss": 0.6914, "lr": 9.984640788012222e-06, "epoch": 7.345844504021448, "percentage": 73.46, "elapsed_time": "3:24:49", "remaining_time": "1:14:00", "throughput": 2314.8, "total_tokens": 28447456} {"current_steps": 49325, "total_steps": 67140, "loss": 0.5872, "lr": 9.979445217991001e-06, "epoch": 7.346589216562407, "percentage": 73.47, "elapsed_time": "3:24:50", "remaining_time": "1:13:59", "throughput": 2314.83, "total_tokens": 28450464} {"current_steps": 49330, "total_steps": 67140, "loss": 0.6107, "lr": 9.9742506629978e-06, "epoch": 7.347333929103366, "percentage": 73.47, "elapsed_time": "3:24:51", "remaining_time": "1:13:57", "throughput": 2314.85, "total_tokens": 28453376} {"current_steps": 49335, "total_steps": 67140, "loss": 0.4916, "lr": 9.96905712338366e-06, "epoch": 7.348078641644325, "percentage": 73.48, "elapsed_time": "3:24:52", "remaining_time": "1:13:56", "throughput": 2314.87, "total_tokens": 28456160} {"current_steps": 49340, "total_steps": 67140, "loss": 0.5756, "lr": 9.963864599499528e-06, "epoch": 7.348823354185284, "percentage": 73.49, "elapsed_time": "3:24:53", "remaining_time": "1:13:55", "throughput": 2314.87, "total_tokens": 28458848} {"current_steps": 49345, "total_steps": 67140, "loss": 0.6365, "lr": 9.958673091696286e-06, "epoch": 7.349568066726244, "percentage": 73.5, "elapsed_time": "3:24:55", "remaining_time": "1:13:53", "throughput": 2314.92, "total_tokens": 28462080} {"current_steps": 49350, "total_steps": 67140, "loss": 0.7811, "lr": 9.95348260032476e-06, "epoch": 7.3503127792672025, "percentage": 73.5, "elapsed_time": "3:24:56", "remaining_time": "1:13:52", "throughput": 2314.93, "total_tokens": 28464864} {"current_steps": 49355, "total_steps": 67140, "loss": 0.6193, "lr": 9.948293125735705e-06, "epoch": 7.351057491808162, "percentage": 73.51, "elapsed_time": "3:24:57", "remaining_time": "1:13:51", "throughput": 2314.96, "total_tokens": 28467904} {"current_steps": 49360, "total_steps": 67140, "loss": 0.6014, "lr": 9.943104668279807e-06, "epoch": 7.351802204349121, "percentage": 73.52, "elapsed_time": "3:24:58", "remaining_time": "1:13:50", "throughput": 2315.0, "total_tokens": 28471072} {"current_steps": 49365, "total_steps": 67140, "loss": 0.4967, "lr": 9.937917228307678e-06, "epoch": 7.3525469168900806, "percentage": 73.53, "elapsed_time": "3:24:59", "remaining_time": "1:13:48", "throughput": 2315.01, "total_tokens": 28473856} {"current_steps": 49370, "total_steps": 67140, "loss": 0.7856, "lr": 9.932730806169873e-06, "epoch": 7.353291629431039, "percentage": 73.53, "elapsed_time": "3:25:00", "remaining_time": "1:13:47", "throughput": 2315.03, "total_tokens": 28476608} {"current_steps": 49375, "total_steps": 67140, "loss": 0.7222, "lr": 9.927545402216862e-06, "epoch": 7.354036341971999, "percentage": 73.54, "elapsed_time": "3:25:01", "remaining_time": "1:13:46", "throughput": 2315.06, "total_tokens": 28479808} {"current_steps": 49380, "total_steps": 67140, "loss": 0.5501, "lr": 9.922361016799045e-06, "epoch": 7.354781054512958, "percentage": 73.55, "elapsed_time": "3:25:03", "remaining_time": "1:13:44", "throughput": 2315.09, "total_tokens": 28482752} {"current_steps": 49385, "total_steps": 67140, "loss": 0.4952, "lr": 9.917177650266768e-06, "epoch": 7.355525767053917, "percentage": 73.56, "elapsed_time": "3:25:04", "remaining_time": "1:13:43", "throughput": 2315.1, "total_tokens": 28485536} {"current_steps": 49390, "total_steps": 67140, "loss": 0.5096, "lr": 9.911995302970301e-06, "epoch": 7.356270479594876, "percentage": 73.56, "elapsed_time": "3:25:05", "remaining_time": "1:13:42", "throughput": 2315.13, "total_tokens": 28488608} {"current_steps": 49395, "total_steps": 67140, "loss": 0.5167, "lr": 9.90681397525985e-06, "epoch": 7.357015192135836, "percentage": 73.57, "elapsed_time": "3:25:06", "remaining_time": "1:13:41", "throughput": 2315.14, "total_tokens": 28491328} {"current_steps": 49400, "total_steps": 67140, "loss": 0.4934, "lr": 9.901633667485554e-06, "epoch": 7.3577599046767945, "percentage": 73.58, "elapsed_time": "3:25:07", "remaining_time": "1:13:39", "throughput": 2315.16, "total_tokens": 28494176} {"current_steps": 49405, "total_steps": 67140, "loss": 0.5156, "lr": 9.89645437999746e-06, "epoch": 7.358504617217754, "percentage": 73.59, "elapsed_time": "3:25:08", "remaining_time": "1:13:38", "throughput": 2315.17, "total_tokens": 28496864} {"current_steps": 49410, "total_steps": 67140, "loss": 0.555, "lr": 9.891276113145576e-06, "epoch": 7.359249329758713, "percentage": 73.59, "elapsed_time": "3:25:09", "remaining_time": "1:13:37", "throughput": 2315.18, "total_tokens": 28499488} {"current_steps": 49415, "total_steps": 67140, "loss": 0.457, "lr": 9.886098867279831e-06, "epoch": 7.359994042299673, "percentage": 73.6, "elapsed_time": "3:25:10", "remaining_time": "1:13:35", "throughput": 2315.2, "total_tokens": 28502400} {"current_steps": 49420, "total_steps": 67140, "loss": 0.4785, "lr": 9.880922642750068e-06, "epoch": 7.360738754840631, "percentage": 73.61, "elapsed_time": "3:25:12", "remaining_time": "1:13:34", "throughput": 2315.21, "total_tokens": 28505088} {"current_steps": 49425, "total_steps": 67140, "loss": 0.539, "lr": 9.87574743990608e-06, "epoch": 7.361483467381591, "percentage": 73.61, "elapsed_time": "3:25:13", "remaining_time": "1:13:33", "throughput": 2315.23, "total_tokens": 28507936} {"current_steps": 49430, "total_steps": 67140, "loss": 0.5728, "lr": 9.870573259097593e-06, "epoch": 7.36222817992255, "percentage": 73.62, "elapsed_time": "3:25:14", "remaining_time": "1:13:32", "throughput": 2315.25, "total_tokens": 28510848} {"current_steps": 49435, "total_steps": 67140, "loss": 0.68, "lr": 9.86540010067426e-06, "epoch": 7.362972892463509, "percentage": 73.63, "elapsed_time": "3:25:15", "remaining_time": "1:13:30", "throughput": 2315.26, "total_tokens": 28513536} {"current_steps": 49440, "total_steps": 67140, "loss": 0.7743, "lr": 9.86022796498565e-06, "epoch": 7.363717605004468, "percentage": 73.64, "elapsed_time": "3:25:16", "remaining_time": "1:13:29", "throughput": 2315.28, "total_tokens": 28516416} {"current_steps": 49445, "total_steps": 67140, "loss": 0.6364, "lr": 9.855056852381275e-06, "epoch": 7.364462317545428, "percentage": 73.64, "elapsed_time": "3:25:17", "remaining_time": "1:13:28", "throughput": 2315.3, "total_tokens": 28519328} {"current_steps": 49450, "total_steps": 67140, "loss": 0.5589, "lr": 9.849886763210586e-06, "epoch": 7.3652070300863866, "percentage": 73.65, "elapsed_time": "3:25:18", "remaining_time": "1:13:26", "throughput": 2315.34, "total_tokens": 28522496} {"current_steps": 49455, "total_steps": 67140, "loss": 0.5914, "lr": 9.844717697822965e-06, "epoch": 7.365951742627346, "percentage": 73.66, "elapsed_time": "3:25:20", "remaining_time": "1:13:25", "throughput": 2315.36, "total_tokens": 28525440} {"current_steps": 49460, "total_steps": 67140, "loss": 0.609, "lr": 9.839549656567693e-06, "epoch": 7.366696455168305, "percentage": 73.67, "elapsed_time": "3:25:21", "remaining_time": "1:13:24", "throughput": 2315.37, "total_tokens": 28528224} {"current_steps": 49465, "total_steps": 67140, "loss": 0.4842, "lr": 9.834382639794015e-06, "epoch": 7.367441167709265, "percentage": 73.67, "elapsed_time": "3:25:22", "remaining_time": "1:13:23", "throughput": 2315.39, "total_tokens": 28531104} {"current_steps": 49470, "total_steps": 67140, "loss": 0.5337, "lr": 9.829216647851111e-06, "epoch": 7.368185880250223, "percentage": 73.68, "elapsed_time": "3:25:23", "remaining_time": "1:13:21", "throughput": 2315.4, "total_tokens": 28533696} {"current_steps": 49475, "total_steps": 67140, "loss": 0.6091, "lr": 9.824051681088058e-06, "epoch": 7.368930592791183, "percentage": 73.69, "elapsed_time": "3:25:24", "remaining_time": "1:13:20", "throughput": 2315.43, "total_tokens": 28536768} {"current_steps": 49480, "total_steps": 67140, "loss": 0.7003, "lr": 9.81888773985389e-06, "epoch": 7.369675305332142, "percentage": 73.7, "elapsed_time": "3:25:25", "remaining_time": "1:13:19", "throughput": 2315.44, "total_tokens": 28539392} {"current_steps": 49485, "total_steps": 67140, "loss": 0.5284, "lr": 9.81372482449757e-06, "epoch": 7.370420017873101, "percentage": 73.7, "elapsed_time": "3:25:26", "remaining_time": "1:13:17", "throughput": 2315.45, "total_tokens": 28542272} {"current_steps": 49490, "total_steps": 67140, "loss": 0.6048, "lr": 9.80856293536798e-06, "epoch": 7.37116473041406, "percentage": 73.71, "elapsed_time": "3:25:27", "remaining_time": "1:13:16", "throughput": 2315.46, "total_tokens": 28544928} {"current_steps": 49495, "total_steps": 67140, "loss": 0.6507, "lr": 9.803402072813953e-06, "epoch": 7.371909442955019, "percentage": 73.72, "elapsed_time": "3:25:29", "remaining_time": "1:13:15", "throughput": 2315.48, "total_tokens": 28547712} {"current_steps": 49500, "total_steps": 67140, "loss": 0.6032, "lr": 9.798242237184218e-06, "epoch": 7.372654155495979, "percentage": 73.73, "elapsed_time": "3:25:30", "remaining_time": "1:13:14", "throughput": 2315.51, "total_tokens": 28550752} {"current_steps": 49505, "total_steps": 67140, "loss": 0.4493, "lr": 9.793083428827477e-06, "epoch": 7.373398868036937, "percentage": 73.73, "elapsed_time": "3:25:31", "remaining_time": "1:13:12", "throughput": 2315.53, "total_tokens": 28553632} {"current_steps": 49510, "total_steps": 67140, "loss": 0.6027, "lr": 9.787925648092321e-06, "epoch": 7.374143580577897, "percentage": 73.74, "elapsed_time": "3:25:32", "remaining_time": "1:13:11", "throughput": 2315.56, "total_tokens": 28556608} {"current_steps": 49515, "total_steps": 67140, "loss": 0.7364, "lr": 9.782768895327305e-06, "epoch": 7.374888293118856, "percentage": 73.75, "elapsed_time": "3:25:33", "remaining_time": "1:13:10", "throughput": 2315.58, "total_tokens": 28559552} {"current_steps": 49520, "total_steps": 67140, "loss": 0.6936, "lr": 9.777613170880898e-06, "epoch": 7.375633005659815, "percentage": 73.76, "elapsed_time": "3:25:34", "remaining_time": "1:13:08", "throughput": 2315.59, "total_tokens": 28562272} {"current_steps": 49525, "total_steps": 67140, "loss": 0.6744, "lr": 9.7724584751015e-06, "epoch": 7.376377718200774, "percentage": 73.76, "elapsed_time": "3:25:35", "remaining_time": "1:13:07", "throughput": 2315.61, "total_tokens": 28565152} {"current_steps": 49530, "total_steps": 67140, "loss": 0.5843, "lr": 9.767304808337451e-06, "epoch": 7.377122430741734, "percentage": 73.77, "elapsed_time": "3:25:37", "remaining_time": "1:13:06", "throughput": 2315.63, "total_tokens": 28568096} {"current_steps": 49535, "total_steps": 67140, "loss": 0.5602, "lr": 9.76215217093702e-06, "epoch": 7.3778671432826926, "percentage": 73.78, "elapsed_time": "3:25:38", "remaining_time": "1:13:05", "throughput": 2315.64, "total_tokens": 28570688} {"current_steps": 49540, "total_steps": 67140, "loss": 0.5267, "lr": 9.757000563248389e-06, "epoch": 7.378611855823652, "percentage": 73.79, "elapsed_time": "3:25:39", "remaining_time": "1:13:03", "throughput": 2315.67, "total_tokens": 28573856} {"current_steps": 49545, "total_steps": 67140, "loss": 0.5329, "lr": 9.751849985619682e-06, "epoch": 7.379356568364611, "percentage": 73.79, "elapsed_time": "3:25:40", "remaining_time": "1:13:02", "throughput": 2315.69, "total_tokens": 28576768} {"current_steps": 49550, "total_steps": 67140, "loss": 0.6408, "lr": 9.746700438398957e-06, "epoch": 7.380101280905571, "percentage": 73.8, "elapsed_time": "3:25:41", "remaining_time": "1:13:01", "throughput": 2315.71, "total_tokens": 28579584} {"current_steps": 49555, "total_steps": 67140, "loss": 0.6429, "lr": 9.7415519219342e-06, "epoch": 7.380845993446529, "percentage": 73.81, "elapsed_time": "3:25:42", "remaining_time": "1:12:59", "throughput": 2315.72, "total_tokens": 28582336} {"current_steps": 49560, "total_steps": 67140, "loss": 0.5168, "lr": 9.736404436573327e-06, "epoch": 7.381590705987489, "percentage": 73.82, "elapsed_time": "3:25:43", "remaining_time": "1:12:58", "throughput": 2315.73, "total_tokens": 28585056} {"current_steps": 49565, "total_steps": 67140, "loss": 0.5407, "lr": 9.731257982664196e-06, "epoch": 7.382335418528448, "percentage": 73.82, "elapsed_time": "3:25:44", "remaining_time": "1:12:57", "throughput": 2315.74, "total_tokens": 28587680} {"current_steps": 49570, "total_steps": 67140, "loss": 0.4933, "lr": 9.726112560554562e-06, "epoch": 7.383080131069407, "percentage": 73.83, "elapsed_time": "3:25:46", "remaining_time": "1:12:56", "throughput": 2315.75, "total_tokens": 28590272} {"current_steps": 49575, "total_steps": 67140, "loss": 0.8296, "lr": 9.72096817059215e-06, "epoch": 7.383824843610366, "percentage": 73.84, "elapsed_time": "3:25:47", "remaining_time": "1:12:54", "throughput": 2315.75, "total_tokens": 28592832} {"current_steps": 49580, "total_steps": 67140, "loss": 0.6594, "lr": 9.715824813124582e-06, "epoch": 7.384569556151326, "percentage": 73.85, "elapsed_time": "3:25:48", "remaining_time": "1:12:53", "throughput": 2315.77, "total_tokens": 28595648} {"current_steps": 49585, "total_steps": 67140, "loss": 0.7283, "lr": 9.710682488499434e-06, "epoch": 7.385314268692285, "percentage": 73.85, "elapsed_time": "3:25:49", "remaining_time": "1:12:52", "throughput": 2315.8, "total_tokens": 28598688} {"current_steps": 49590, "total_steps": 67140, "loss": 0.5593, "lr": 9.7055411970642e-06, "epoch": 7.386058981233244, "percentage": 73.86, "elapsed_time": "3:25:50", "remaining_time": "1:12:50", "throughput": 2315.82, "total_tokens": 28601600} {"current_steps": 49595, "total_steps": 67140, "loss": 0.484, "lr": 9.700400939166308e-06, "epoch": 7.386803693774203, "percentage": 73.87, "elapsed_time": "3:25:51", "remaining_time": "1:12:49", "throughput": 2315.85, "total_tokens": 28604480} {"current_steps": 49600, "total_steps": 67140, "loss": 0.6994, "lr": 9.695261715153126e-06, "epoch": 7.387548406315163, "percentage": 73.88, "elapsed_time": "3:25:52", "remaining_time": "1:12:48", "throughput": 2315.87, "total_tokens": 28607328} {"current_steps": 49605, "total_steps": 67140, "loss": 0.3941, "lr": 9.690123525371925e-06, "epoch": 7.388293118856121, "percentage": 73.88, "elapsed_time": "3:25:53", "remaining_time": "1:12:47", "throughput": 2315.89, "total_tokens": 28610240} {"current_steps": 49610, "total_steps": 67140, "loss": 0.564, "lr": 9.68498637016993e-06, "epoch": 7.389037831397081, "percentage": 73.89, "elapsed_time": "3:25:55", "remaining_time": "1:12:45", "throughput": 2315.91, "total_tokens": 28613088} {"current_steps": 49615, "total_steps": 67140, "loss": 0.5793, "lr": 9.679850249894298e-06, "epoch": 7.38978254393804, "percentage": 73.9, "elapsed_time": "3:25:56", "remaining_time": "1:12:44", "throughput": 2315.94, "total_tokens": 28616192} {"current_steps": 49620, "total_steps": 67140, "loss": 0.5295, "lr": 9.67471516489209e-06, "epoch": 7.390527256478999, "percentage": 73.91, "elapsed_time": "3:25:57", "remaining_time": "1:12:43", "throughput": 2315.96, "total_tokens": 28619136} {"current_steps": 49625, "total_steps": 67140, "loss": 0.542, "lr": 9.669581115510323e-06, "epoch": 7.391271969019958, "percentage": 73.91, "elapsed_time": "3:25:58", "remaining_time": "1:12:41", "throughput": 2315.99, "total_tokens": 28622016} {"current_steps": 49630, "total_steps": 67140, "loss": 0.7411, "lr": 9.664448102095939e-06, "epoch": 7.392016681560918, "percentage": 73.92, "elapsed_time": "3:25:59", "remaining_time": "1:12:40", "throughput": 2316.01, "total_tokens": 28625088} {"current_steps": 49635, "total_steps": 67140, "loss": 0.6899, "lr": 9.659316124995806e-06, "epoch": 7.392761394101877, "percentage": 73.93, "elapsed_time": "3:26:00", "remaining_time": "1:12:39", "throughput": 2316.03, "total_tokens": 28627872} {"current_steps": 49640, "total_steps": 67140, "loss": 0.4667, "lr": 9.654185184556713e-06, "epoch": 7.393506106642836, "percentage": 73.94, "elapsed_time": "3:26:01", "remaining_time": "1:12:38", "throughput": 2316.04, "total_tokens": 28630656} {"current_steps": 49645, "total_steps": 67140, "loss": 0.4889, "lr": 9.649055281125394e-06, "epoch": 7.394250819183795, "percentage": 73.94, "elapsed_time": "3:26:03", "remaining_time": "1:12:36", "throughput": 2316.07, "total_tokens": 28633568} {"current_steps": 49650, "total_steps": 67140, "loss": 0.668, "lr": 9.643926415048504e-06, "epoch": 7.394995531724755, "percentage": 73.95, "elapsed_time": "3:26:04", "remaining_time": "1:12:35", "throughput": 2316.1, "total_tokens": 28636640} {"current_steps": 49655, "total_steps": 67140, "loss": 0.5584, "lr": 9.638798586672645e-06, "epoch": 7.395740244265713, "percentage": 73.96, "elapsed_time": "3:26:05", "remaining_time": "1:12:34", "throughput": 2316.1, "total_tokens": 28639264} {"current_steps": 49660, "total_steps": 67140, "loss": 0.5832, "lr": 9.633671796344312e-06, "epoch": 7.396484956806672, "percentage": 73.96, "elapsed_time": "3:26:06", "remaining_time": "1:12:32", "throughput": 2316.12, "total_tokens": 28642176} {"current_steps": 49665, "total_steps": 67140, "loss": 0.5321, "lr": 9.628546044409966e-06, "epoch": 7.397229669347632, "percentage": 73.97, "elapsed_time": "3:26:07", "remaining_time": "1:12:31", "throughput": 2316.15, "total_tokens": 28645088} {"current_steps": 49670, "total_steps": 67140, "loss": 0.6016, "lr": 9.623421331215992e-06, "epoch": 7.3979743818885915, "percentage": 73.98, "elapsed_time": "3:26:08", "remaining_time": "1:12:30", "throughput": 2316.16, "total_tokens": 28647904} {"current_steps": 49675, "total_steps": 67140, "loss": 0.6525, "lr": 9.618297657108676e-06, "epoch": 7.39871909442955, "percentage": 73.99, "elapsed_time": "3:26:09", "remaining_time": "1:12:29", "throughput": 2316.18, "total_tokens": 28650688} {"current_steps": 49680, "total_steps": 67140, "loss": 0.6407, "lr": 9.61317502243427e-06, "epoch": 7.399463806970509, "percentage": 73.99, "elapsed_time": "3:26:10", "remaining_time": "1:12:27", "throughput": 2316.2, "total_tokens": 28653536} {"current_steps": 49685, "total_steps": 67140, "loss": 0.5496, "lr": 9.608053427538938e-06, "epoch": 7.400208519511469, "percentage": 74.0, "elapsed_time": "3:26:12", "remaining_time": "1:12:26", "throughput": 2316.22, "total_tokens": 28656480} {"current_steps": 49690, "total_steps": 67140, "loss": 0.5474, "lr": 9.602932872768775e-06, "epoch": 7.400953232052427, "percentage": 74.01, "elapsed_time": "3:26:13", "remaining_time": "1:12:25", "throughput": 2316.24, "total_tokens": 28659264} {"current_steps": 49695, "total_steps": 67140, "loss": 0.6494, "lr": 9.597813358469817e-06, "epoch": 7.401697944593387, "percentage": 74.02, "elapsed_time": "3:26:14", "remaining_time": "1:12:23", "throughput": 2316.25, "total_tokens": 28661920} {"current_steps": 49700, "total_steps": 67140, "loss": 0.7131, "lr": 9.592694884988001e-06, "epoch": 7.402442657134346, "percentage": 74.02, "elapsed_time": "3:26:15", "remaining_time": "1:12:22", "throughput": 2316.28, "total_tokens": 28664928} {"current_steps": 49705, "total_steps": 67140, "loss": 0.4959, "lr": 9.587577452669235e-06, "epoch": 7.403187369675305, "percentage": 74.03, "elapsed_time": "3:26:16", "remaining_time": "1:12:21", "throughput": 2316.29, "total_tokens": 28667648} {"current_steps": 49710, "total_steps": 67140, "loss": 0.6214, "lr": 9.582461061859313e-06, "epoch": 7.403932082216264, "percentage": 74.04, "elapsed_time": "3:26:17", "remaining_time": "1:12:20", "throughput": 2316.32, "total_tokens": 28670752} {"current_steps": 49715, "total_steps": 67140, "loss": 0.6337, "lr": 9.577345712903988e-06, "epoch": 7.404676794757224, "percentage": 74.05, "elapsed_time": "3:26:18", "remaining_time": "1:12:18", "throughput": 2316.35, "total_tokens": 28673920} {"current_steps": 49720, "total_steps": 67140, "loss": 0.5418, "lr": 9.572231406148938e-06, "epoch": 7.405421507298183, "percentage": 74.05, "elapsed_time": "3:26:20", "remaining_time": "1:12:17", "throughput": 2316.38, "total_tokens": 28676928} {"current_steps": 49725, "total_steps": 67140, "loss": 0.445, "lr": 9.567118141939763e-06, "epoch": 7.406166219839142, "percentage": 74.06, "elapsed_time": "3:26:21", "remaining_time": "1:12:16", "throughput": 2316.39, "total_tokens": 28679712} {"current_steps": 49730, "total_steps": 67140, "loss": 0.5564, "lr": 9.562005920622009e-06, "epoch": 7.406910932380101, "percentage": 74.07, "elapsed_time": "3:26:22", "remaining_time": "1:12:14", "throughput": 2316.42, "total_tokens": 28682816} {"current_steps": 49735, "total_steps": 67140, "loss": 0.6525, "lr": 9.556894742541117e-06, "epoch": 7.407655644921061, "percentage": 74.08, "elapsed_time": "3:26:23", "remaining_time": "1:12:13", "throughput": 2316.45, "total_tokens": 28685792} {"current_steps": 49740, "total_steps": 67140, "loss": 0.7623, "lr": 9.551784608042501e-06, "epoch": 7.408400357462019, "percentage": 74.08, "elapsed_time": "3:26:24", "remaining_time": "1:12:12", "throughput": 2316.47, "total_tokens": 28688704} {"current_steps": 49745, "total_steps": 67140, "loss": 0.7269, "lr": 9.546675517471465e-06, "epoch": 7.409145070002979, "percentage": 74.09, "elapsed_time": "3:26:25", "remaining_time": "1:12:11", "throughput": 2316.48, "total_tokens": 28691296} {"current_steps": 49750, "total_steps": 67140, "loss": 0.5085, "lr": 9.541567471173268e-06, "epoch": 7.409889782543938, "percentage": 74.1, "elapsed_time": "3:26:26", "remaining_time": "1:12:09", "throughput": 2316.51, "total_tokens": 28694304} {"current_steps": 49755, "total_steps": 67140, "loss": 0.6291, "lr": 9.536460469493095e-06, "epoch": 7.4106344950848975, "percentage": 74.11, "elapsed_time": "3:26:28", "remaining_time": "1:12:08", "throughput": 2316.52, "total_tokens": 28697088} {"current_steps": 49760, "total_steps": 67140, "loss": 0.3379, "lr": 9.53135451277605e-06, "epoch": 7.411379207625856, "percentage": 74.11, "elapsed_time": "3:26:29", "remaining_time": "1:12:07", "throughput": 2316.54, "total_tokens": 28700032} {"current_steps": 49765, "total_steps": 67140, "loss": 0.5529, "lr": 9.526249601367185e-06, "epoch": 7.412123920166816, "percentage": 74.12, "elapsed_time": "3:26:30", "remaining_time": "1:12:05", "throughput": 2316.55, "total_tokens": 28702688} {"current_steps": 49770, "total_steps": 67140, "loss": 0.7426, "lr": 9.521145735611453e-06, "epoch": 7.412868632707775, "percentage": 74.13, "elapsed_time": "3:26:31", "remaining_time": "1:12:04", "throughput": 2316.57, "total_tokens": 28705536} {"current_steps": 49775, "total_steps": 67140, "loss": 0.4859, "lr": 9.51604291585376e-06, "epoch": 7.413613345248734, "percentage": 74.14, "elapsed_time": "3:26:32", "remaining_time": "1:12:03", "throughput": 2316.6, "total_tokens": 28708544} {"current_steps": 49780, "total_steps": 67140, "loss": 0.6789, "lr": 9.510941142438939e-06, "epoch": 7.414358057789693, "percentage": 74.14, "elapsed_time": "3:26:33", "remaining_time": "1:12:02", "throughput": 2316.62, "total_tokens": 28711424} {"current_steps": 49785, "total_steps": 67140, "loss": 0.522, "lr": 9.505840415711737e-06, "epoch": 7.415102770330653, "percentage": 74.15, "elapsed_time": "3:26:34", "remaining_time": "1:12:00", "throughput": 2316.64, "total_tokens": 28714400} {"current_steps": 49790, "total_steps": 67140, "loss": 0.5628, "lr": 9.500740736016845e-06, "epoch": 7.415847482871611, "percentage": 74.16, "elapsed_time": "3:26:35", "remaining_time": "1:11:59", "throughput": 2316.67, "total_tokens": 28717376} {"current_steps": 49795, "total_steps": 67140, "loss": 0.5006, "lr": 9.495642103698877e-06, "epoch": 7.416592195412571, "percentage": 74.17, "elapsed_time": "3:26:37", "remaining_time": "1:11:58", "throughput": 2316.69, "total_tokens": 28720224} {"current_steps": 49800, "total_steps": 67140, "loss": 0.6957, "lr": 9.490544519102387e-06, "epoch": 7.41733690795353, "percentage": 74.17, "elapsed_time": "3:26:38", "remaining_time": "1:11:56", "throughput": 2316.7, "total_tokens": 28723040} {"current_steps": 49805, "total_steps": 67140, "loss": 0.4733, "lr": 9.485447982571832e-06, "epoch": 7.4180816204944895, "percentage": 74.18, "elapsed_time": "3:26:39", "remaining_time": "1:11:55", "throughput": 2316.71, "total_tokens": 28725760} {"current_steps": 49810, "total_steps": 67140, "loss": 0.887, "lr": 9.480352494451628e-06, "epoch": 7.418826333035448, "percentage": 74.19, "elapsed_time": "3:26:40", "remaining_time": "1:11:54", "throughput": 2316.72, "total_tokens": 28728448} {"current_steps": 49815, "total_steps": 67140, "loss": 0.6405, "lr": 9.475258055086102e-06, "epoch": 7.419571045576408, "percentage": 74.2, "elapsed_time": "3:26:41", "remaining_time": "1:11:53", "throughput": 2316.74, "total_tokens": 28731264} {"current_steps": 49820, "total_steps": 67140, "loss": 0.7279, "lr": 9.470164664819527e-06, "epoch": 7.420315758117367, "percentage": 74.2, "elapsed_time": "3:26:42", "remaining_time": "1:11:51", "throughput": 2316.75, "total_tokens": 28734048} {"current_steps": 49825, "total_steps": 67140, "loss": 0.6698, "lr": 9.465072323996078e-06, "epoch": 7.421060470658326, "percentage": 74.21, "elapsed_time": "3:26:43", "remaining_time": "1:11:50", "throughput": 2316.78, "total_tokens": 28737184} {"current_steps": 49830, "total_steps": 67140, "loss": 0.5021, "lr": 9.459981032959877e-06, "epoch": 7.421805183199285, "percentage": 74.22, "elapsed_time": "3:26:45", "remaining_time": "1:11:49", "throughput": 2316.81, "total_tokens": 28740128} {"current_steps": 49835, "total_steps": 67140, "loss": 0.5417, "lr": 9.454890792054987e-06, "epoch": 7.422549895740245, "percentage": 74.23, "elapsed_time": "3:26:46", "remaining_time": "1:11:47", "throughput": 2316.81, "total_tokens": 28742784} {"current_steps": 49840, "total_steps": 67140, "loss": 0.4947, "lr": 9.44980160162537e-06, "epoch": 7.4232946082812035, "percentage": 74.23, "elapsed_time": "3:26:47", "remaining_time": "1:11:46", "throughput": 2316.84, "total_tokens": 28745792} {"current_steps": 49845, "total_steps": 67140, "loss": 0.6127, "lr": 9.444713462014934e-06, "epoch": 7.424039320822162, "percentage": 74.24, "elapsed_time": "3:26:48", "remaining_time": "1:11:45", "throughput": 2316.86, "total_tokens": 28748704} {"current_steps": 49850, "total_steps": 67140, "loss": 0.4843, "lr": 9.43962637356752e-06, "epoch": 7.424784033363122, "percentage": 74.25, "elapsed_time": "3:26:49", "remaining_time": "1:11:44", "throughput": 2316.88, "total_tokens": 28751552} {"current_steps": 49855, "total_steps": 67140, "loss": 0.4701, "lr": 9.434540336626892e-06, "epoch": 7.425528745904081, "percentage": 74.26, "elapsed_time": "3:26:50", "remaining_time": "1:11:42", "throughput": 2316.89, "total_tokens": 28754304} {"current_steps": 49860, "total_steps": 67140, "loss": 0.6421, "lr": 9.429455351536754e-06, "epoch": 7.42627345844504, "percentage": 74.26, "elapsed_time": "3:26:51", "remaining_time": "1:11:41", "throughput": 2316.92, "total_tokens": 28757248} {"current_steps": 49865, "total_steps": 67140, "loss": 0.6192, "lr": 9.424371418640706e-06, "epoch": 7.427018170985999, "percentage": 74.27, "elapsed_time": "3:26:52", "remaining_time": "1:11:40", "throughput": 2316.94, "total_tokens": 28760128} {"current_steps": 49870, "total_steps": 67140, "loss": 0.8782, "lr": 9.419288538282323e-06, "epoch": 7.427762883526959, "percentage": 74.28, "elapsed_time": "3:26:54", "remaining_time": "1:11:39", "throughput": 2316.97, "total_tokens": 28763264} {"current_steps": 49875, "total_steps": 67140, "loss": 0.4589, "lr": 9.414206710805062e-06, "epoch": 7.428507596067917, "percentage": 74.29, "elapsed_time": "3:26:55", "remaining_time": "1:11:37", "throughput": 2316.98, "total_tokens": 28765984} {"current_steps": 49880, "total_steps": 67140, "loss": 0.4857, "lr": 9.409125936552349e-06, "epoch": 7.429252308608877, "percentage": 74.29, "elapsed_time": "3:26:56", "remaining_time": "1:11:36", "throughput": 2316.99, "total_tokens": 28768576} {"current_steps": 49885, "total_steps": 67140, "loss": 0.5514, "lr": 9.404046215867515e-06, "epoch": 7.429997021149836, "percentage": 74.3, "elapsed_time": "3:26:57", "remaining_time": "1:11:35", "throughput": 2317.01, "total_tokens": 28771488} {"current_steps": 49890, "total_steps": 67140, "loss": 0.5126, "lr": 9.398967549093828e-06, "epoch": 7.4307417336907955, "percentage": 74.31, "elapsed_time": "3:26:58", "remaining_time": "1:11:33", "throughput": 2317.03, "total_tokens": 28774432} {"current_steps": 49895, "total_steps": 67140, "loss": 0.4204, "lr": 9.393889936574496e-06, "epoch": 7.431486446231754, "percentage": 74.31, "elapsed_time": "3:26:59", "remaining_time": "1:11:32", "throughput": 2317.04, "total_tokens": 28777184} {"current_steps": 49900, "total_steps": 67140, "loss": 0.44, "lr": 9.388813378652623e-06, "epoch": 7.432231158772714, "percentage": 74.32, "elapsed_time": "3:27:00", "remaining_time": "1:11:31", "throughput": 2317.06, "total_tokens": 28780032} {"current_steps": 49905, "total_steps": 67140, "loss": 0.7239, "lr": 9.383737875671278e-06, "epoch": 7.432975871313673, "percentage": 74.33, "elapsed_time": "3:27:02", "remaining_time": "1:11:30", "throughput": 2317.07, "total_tokens": 28782848} {"current_steps": 49910, "total_steps": 67140, "loss": 0.576, "lr": 9.378663427973428e-06, "epoch": 7.433720583854632, "percentage": 74.34, "elapsed_time": "3:27:03", "remaining_time": "1:11:28", "throughput": 2317.1, "total_tokens": 28785760} {"current_steps": 49915, "total_steps": 67140, "loss": 0.4503, "lr": 9.373590035901993e-06, "epoch": 7.434465296395591, "percentage": 74.34, "elapsed_time": "3:27:04", "remaining_time": "1:11:27", "throughput": 2317.13, "total_tokens": 28788896} {"current_steps": 49920, "total_steps": 67140, "loss": 0.6635, "lr": 9.368517699799812e-06, "epoch": 7.435210008936551, "percentage": 74.35, "elapsed_time": "3:27:05", "remaining_time": "1:11:26", "throughput": 2317.14, "total_tokens": 28791584} {"current_steps": 49925, "total_steps": 67140, "loss": 0.5683, "lr": 9.36344642000965e-06, "epoch": 7.4359547214775095, "percentage": 74.36, "elapsed_time": "3:27:06", "remaining_time": "1:11:24", "throughput": 2317.16, "total_tokens": 28794400} {"current_steps": 49930, "total_steps": 67140, "loss": 0.5228, "lr": 9.358376196874214e-06, "epoch": 7.436699434018469, "percentage": 74.37, "elapsed_time": "3:27:07", "remaining_time": "1:11:23", "throughput": 2317.19, "total_tokens": 28797536} {"current_steps": 49935, "total_steps": 67140, "loss": 0.5119, "lr": 9.353307030736113e-06, "epoch": 7.437444146559428, "percentage": 74.37, "elapsed_time": "3:27:08", "remaining_time": "1:11:22", "throughput": 2317.24, "total_tokens": 28800960} {"current_steps": 49940, "total_steps": 67140, "loss": 0.6107, "lr": 9.348238921937916e-06, "epoch": 7.4381888591003875, "percentage": 74.38, "elapsed_time": "3:27:10", "remaining_time": "1:11:21", "throughput": 2317.27, "total_tokens": 28804000} {"current_steps": 49945, "total_steps": 67140, "loss": 0.5609, "lr": 9.34317187082209e-06, "epoch": 7.438933571641346, "percentage": 74.39, "elapsed_time": "3:27:11", "remaining_time": "1:11:19", "throughput": 2317.28, "total_tokens": 28806784} {"current_steps": 49950, "total_steps": 67140, "loss": 0.4902, "lr": 9.338105877731051e-06, "epoch": 7.439678284182306, "percentage": 74.4, "elapsed_time": "3:27:12", "remaining_time": "1:11:18", "throughput": 2317.31, "total_tokens": 28809728} {"current_steps": 49955, "total_steps": 67140, "loss": 0.5454, "lr": 9.33304094300714e-06, "epoch": 7.440422996723265, "percentage": 74.4, "elapsed_time": "3:27:13", "remaining_time": "1:11:17", "throughput": 2317.32, "total_tokens": 28812608} {"current_steps": 49960, "total_steps": 67140, "loss": 0.5495, "lr": 9.327977066992627e-06, "epoch": 7.441167709264224, "percentage": 74.41, "elapsed_time": "3:27:14", "remaining_time": "1:11:15", "throughput": 2317.35, "total_tokens": 28815648} {"current_steps": 49965, "total_steps": 67140, "loss": 0.4988, "lr": 9.322914250029713e-06, "epoch": 7.441912421805183, "percentage": 74.42, "elapsed_time": "3:27:15", "remaining_time": "1:11:14", "throughput": 2317.36, "total_tokens": 28818336} {"current_steps": 49970, "total_steps": 67140, "loss": 0.6966, "lr": 9.317852492460508e-06, "epoch": 7.442657134346143, "percentage": 74.43, "elapsed_time": "3:27:16", "remaining_time": "1:11:13", "throughput": 2317.37, "total_tokens": 28821056} {"current_steps": 49975, "total_steps": 67140, "loss": 0.568, "lr": 9.312791794627072e-06, "epoch": 7.4434018468871015, "percentage": 74.43, "elapsed_time": "3:27:18", "remaining_time": "1:11:12", "throughput": 2317.4, "total_tokens": 28824032} {"current_steps": 49980, "total_steps": 67140, "loss": 0.6713, "lr": 9.307732156871393e-06, "epoch": 7.444146559428061, "percentage": 74.44, "elapsed_time": "3:27:19", "remaining_time": "1:11:10", "throughput": 2317.42, "total_tokens": 28827072} {"current_steps": 49985, "total_steps": 67140, "loss": 0.3706, "lr": 9.30267357953537e-06, "epoch": 7.44489127196902, "percentage": 74.45, "elapsed_time": "3:27:20", "remaining_time": "1:11:09", "throughput": 2317.45, "total_tokens": 28830048} {"current_steps": 49990, "total_steps": 67140, "loss": 0.6611, "lr": 9.297616062960843e-06, "epoch": 7.4456359845099795, "percentage": 74.46, "elapsed_time": "3:27:21", "remaining_time": "1:11:08", "throughput": 2317.47, "total_tokens": 28832928} {"current_steps": 49995, "total_steps": 67140, "loss": 0.6918, "lr": 9.292559607489585e-06, "epoch": 7.446380697050938, "percentage": 74.46, "elapsed_time": "3:27:22", "remaining_time": "1:11:07", "throughput": 2317.49, "total_tokens": 28835808} {"current_steps": 50000, "total_steps": 67140, "loss": 0.5482, "lr": 9.287504213463292e-06, "epoch": 7.447125409591898, "percentage": 74.47, "elapsed_time": "3:27:23", "remaining_time": "1:11:05", "throughput": 2317.51, "total_tokens": 28838656} {"current_steps": 50005, "total_steps": 67140, "loss": 0.5318, "lr": 9.282449881223573e-06, "epoch": 7.447870122132857, "percentage": 74.48, "elapsed_time": "3:27:24", "remaining_time": "1:11:04", "throughput": 2317.52, "total_tokens": 28841536} {"current_steps": 50010, "total_steps": 67140, "loss": 0.6093, "lr": 9.27739661111199e-06, "epoch": 7.4486148346738155, "percentage": 74.49, "elapsed_time": "3:27:26", "remaining_time": "1:11:03", "throughput": 2317.54, "total_tokens": 28844416} {"current_steps": 50015, "total_steps": 67140, "loss": 0.6848, "lr": 9.27234440347002e-06, "epoch": 7.449359547214775, "percentage": 74.49, "elapsed_time": "3:27:27", "remaining_time": "1:11:01", "throughput": 2317.56, "total_tokens": 28847328} {"current_steps": 50020, "total_steps": 67140, "loss": 0.6685, "lr": 9.267293258639082e-06, "epoch": 7.450104259755734, "percentage": 74.5, "elapsed_time": "3:27:28", "remaining_time": "1:11:00", "throughput": 2317.6, "total_tokens": 28850528} {"current_steps": 50025, "total_steps": 67140, "loss": 0.5826, "lr": 9.262243176960489e-06, "epoch": 7.4508489722966935, "percentage": 74.51, "elapsed_time": "3:27:29", "remaining_time": "1:10:59", "throughput": 2317.62, "total_tokens": 28853376} {"current_steps": 50030, "total_steps": 67140, "loss": 0.4762, "lr": 9.257194158775517e-06, "epoch": 7.451593684837652, "percentage": 74.52, "elapsed_time": "3:27:30", "remaining_time": "1:10:58", "throughput": 2317.64, "total_tokens": 28856384} {"current_steps": 50035, "total_steps": 67140, "loss": 0.5721, "lr": 9.252146204425369e-06, "epoch": 7.452338397378612, "percentage": 74.52, "elapsed_time": "3:27:31", "remaining_time": "1:10:56", "throughput": 2317.67, "total_tokens": 28859360} {"current_steps": 50040, "total_steps": 67140, "loss": 0.2575, "lr": 9.247099314251145e-06, "epoch": 7.453083109919571, "percentage": 74.53, "elapsed_time": "3:27:32", "remaining_time": "1:10:55", "throughput": 2317.68, "total_tokens": 28862016} {"current_steps": 50045, "total_steps": 67140, "loss": 0.4489, "lr": 9.242053488593902e-06, "epoch": 7.45382782246053, "percentage": 74.54, "elapsed_time": "3:27:34", "remaining_time": "1:10:54", "throughput": 2317.7, "total_tokens": 28864832} {"current_steps": 50050, "total_steps": 67140, "loss": 0.4982, "lr": 9.237008727794618e-06, "epoch": 7.454572535001489, "percentage": 74.55, "elapsed_time": "3:27:35", "remaining_time": "1:10:52", "throughput": 2317.7, "total_tokens": 28867424} {"current_steps": 50055, "total_steps": 67140, "loss": 0.5702, "lr": 9.231965032194198e-06, "epoch": 7.455317247542449, "percentage": 74.55, "elapsed_time": "3:27:36", "remaining_time": "1:10:51", "throughput": 2317.73, "total_tokens": 28870464} {"current_steps": 50060, "total_steps": 67140, "loss": 0.6578, "lr": 9.226922402133477e-06, "epoch": 7.4560619600834075, "percentage": 74.56, "elapsed_time": "3:27:37", "remaining_time": "1:10:50", "throughput": 2317.74, "total_tokens": 28873216} {"current_steps": 50065, "total_steps": 67140, "loss": 0.7241, "lr": 9.221880837953209e-06, "epoch": 7.456806672624367, "percentage": 74.57, "elapsed_time": "3:27:38", "remaining_time": "1:10:49", "throughput": 2317.75, "total_tokens": 28875968} {"current_steps": 50070, "total_steps": 67140, "loss": 0.4486, "lr": 9.21684033999409e-06, "epoch": 7.457551385165326, "percentage": 74.58, "elapsed_time": "3:27:39", "remaining_time": "1:10:47", "throughput": 2317.78, "total_tokens": 28878880} {"current_steps": 50075, "total_steps": 67140, "loss": 0.4904, "lr": 9.21180090859672e-06, "epoch": 7.4582960977062855, "percentage": 74.58, "elapsed_time": "3:27:40", "remaining_time": "1:10:46", "throughput": 2317.79, "total_tokens": 28881568} {"current_steps": 50080, "total_steps": 67140, "loss": 0.782, "lr": 9.20676254410166e-06, "epoch": 7.459040810247244, "percentage": 74.59, "elapsed_time": "3:27:41", "remaining_time": "1:10:45", "throughput": 2317.81, "total_tokens": 28884448} {"current_steps": 50085, "total_steps": 67140, "loss": 0.4921, "lr": 9.201725246849374e-06, "epoch": 7.459785522788204, "percentage": 74.6, "elapsed_time": "3:27:43", "remaining_time": "1:10:43", "throughput": 2317.82, "total_tokens": 28887136} {"current_steps": 50090, "total_steps": 67140, "loss": 0.5414, "lr": 9.196689017180262e-06, "epoch": 7.460530235329163, "percentage": 74.61, "elapsed_time": "3:27:44", "remaining_time": "1:10:42", "throughput": 2317.83, "total_tokens": 28889888} {"current_steps": 50095, "total_steps": 67140, "loss": 0.8671, "lr": 9.191653855434667e-06, "epoch": 7.461274947870122, "percentage": 74.61, "elapsed_time": "3:27:45", "remaining_time": "1:10:41", "throughput": 2317.85, "total_tokens": 28892736} {"current_steps": 50100, "total_steps": 67140, "loss": 0.6326, "lr": 9.186619761952831e-06, "epoch": 7.462019660411081, "percentage": 74.62, "elapsed_time": "3:27:46", "remaining_time": "1:10:40", "throughput": 2317.89, "total_tokens": 28896000} {"current_steps": 50105, "total_steps": 67140, "loss": 0.7398, "lr": 9.181586737074932e-06, "epoch": 7.462764372952041, "percentage": 74.63, "elapsed_time": "3:27:47", "remaining_time": "1:10:38", "throughput": 2317.91, "total_tokens": 28898880} {"current_steps": 50110, "total_steps": 67140, "loss": 0.5434, "lr": 9.176554781141086e-06, "epoch": 7.4635090854929995, "percentage": 74.64, "elapsed_time": "3:27:48", "remaining_time": "1:10:37", "throughput": 2317.92, "total_tokens": 28901632} {"current_steps": 50115, "total_steps": 67140, "loss": 0.6938, "lr": 9.171523894491336e-06, "epoch": 7.464253798033959, "percentage": 74.64, "elapsed_time": "3:27:49", "remaining_time": "1:10:36", "throughput": 2317.95, "total_tokens": 28904608} {"current_steps": 50120, "total_steps": 67140, "loss": 0.3978, "lr": 9.166494077465645e-06, "epoch": 7.464998510574918, "percentage": 74.65, "elapsed_time": "3:27:51", "remaining_time": "1:10:34", "throughput": 2317.97, "total_tokens": 28907456} {"current_steps": 50125, "total_steps": 67140, "loss": 0.3362, "lr": 9.161465330403912e-06, "epoch": 7.465743223115878, "percentage": 74.66, "elapsed_time": "3:27:52", "remaining_time": "1:10:33", "throughput": 2317.99, "total_tokens": 28910400} {"current_steps": 50130, "total_steps": 67140, "loss": 0.6463, "lr": 9.156437653645966e-06, "epoch": 7.466487935656836, "percentage": 74.66, "elapsed_time": "3:27:53", "remaining_time": "1:10:32", "throughput": 2318.01, "total_tokens": 28913280} {"current_steps": 50135, "total_steps": 67140, "loss": 0.5569, "lr": 9.151411047531539e-06, "epoch": 7.467232648197796, "percentage": 74.67, "elapsed_time": "3:27:54", "remaining_time": "1:10:31", "throughput": 2318.04, "total_tokens": 28916320} {"current_steps": 50140, "total_steps": 67140, "loss": 0.6023, "lr": 9.146385512400323e-06, "epoch": 7.467977360738755, "percentage": 74.68, "elapsed_time": "3:27:55", "remaining_time": "1:10:29", "throughput": 2318.07, "total_tokens": 28919520} {"current_steps": 50145, "total_steps": 67140, "loss": 0.5011, "lr": 9.141361048591916e-06, "epoch": 7.468722073279714, "percentage": 74.69, "elapsed_time": "3:27:56", "remaining_time": "1:10:28", "throughput": 2318.1, "total_tokens": 28922624} {"current_steps": 50150, "total_steps": 67140, "loss": 0.5985, "lr": 9.136337656445849e-06, "epoch": 7.469466785820673, "percentage": 74.69, "elapsed_time": "3:27:57", "remaining_time": "1:10:27", "throughput": 2318.11, "total_tokens": 28925280} {"current_steps": 50155, "total_steps": 67140, "loss": 0.7221, "lr": 9.131315336301585e-06, "epoch": 7.470211498361633, "percentage": 74.7, "elapsed_time": "3:27:59", "remaining_time": "1:10:26", "throughput": 2318.14, "total_tokens": 28928320} {"current_steps": 50160, "total_steps": 67140, "loss": 0.641, "lr": 9.126294088498515e-06, "epoch": 7.4709562109025915, "percentage": 74.71, "elapsed_time": "3:28:00", "remaining_time": "1:10:24", "throughput": 2318.16, "total_tokens": 28931136} {"current_steps": 50165, "total_steps": 67140, "loss": 0.5976, "lr": 9.12127391337596e-06, "epoch": 7.471700923443551, "percentage": 74.72, "elapsed_time": "3:28:01", "remaining_time": "1:10:23", "throughput": 2318.19, "total_tokens": 28934240} {"current_steps": 50170, "total_steps": 67140, "loss": 0.441, "lr": 9.116254811273151e-06, "epoch": 7.47244563598451, "percentage": 74.72, "elapsed_time": "3:28:02", "remaining_time": "1:10:22", "throughput": 2318.2, "total_tokens": 28937024} {"current_steps": 50175, "total_steps": 67140, "loss": 0.4227, "lr": 9.111236782529259e-06, "epoch": 7.473190348525469, "percentage": 74.73, "elapsed_time": "3:28:03", "remaining_time": "1:10:20", "throughput": 2318.23, "total_tokens": 28940064} {"current_steps": 50180, "total_steps": 67140, "loss": 0.3836, "lr": 9.106219827483398e-06, "epoch": 7.473935061066428, "percentage": 74.74, "elapsed_time": "3:28:04", "remaining_time": "1:10:19", "throughput": 2318.25, "total_tokens": 28942976} {"current_steps": 50185, "total_steps": 67140, "loss": 0.5042, "lr": 9.101203946474571e-06, "epoch": 7.474679773607388, "percentage": 74.75, "elapsed_time": "3:28:05", "remaining_time": "1:10:18", "throughput": 2318.26, "total_tokens": 28945632} {"current_steps": 50190, "total_steps": 67140, "loss": 0.5347, "lr": 9.09618913984174e-06, "epoch": 7.475424486148347, "percentage": 74.75, "elapsed_time": "3:28:07", "remaining_time": "1:10:17", "throughput": 2318.27, "total_tokens": 28948256} {"current_steps": 50195, "total_steps": 67140, "loss": 0.7027, "lr": 9.091175407923788e-06, "epoch": 7.4761691986893055, "percentage": 74.76, "elapsed_time": "3:28:08", "remaining_time": "1:10:15", "throughput": 2318.29, "total_tokens": 28951168} {"current_steps": 50200, "total_steps": 67140, "loss": 0.3529, "lr": 9.086162751059532e-06, "epoch": 7.476913911230265, "percentage": 74.77, "elapsed_time": "3:28:09", "remaining_time": "1:10:14", "throughput": 2318.3, "total_tokens": 28953920} {"current_steps": 50205, "total_steps": 67140, "loss": 0.5721, "lr": 9.081151169587686e-06, "epoch": 7.477658623771224, "percentage": 74.78, "elapsed_time": "3:28:10", "remaining_time": "1:10:13", "throughput": 2318.31, "total_tokens": 28956608} {"current_steps": 50210, "total_steps": 67140, "loss": 0.7802, "lr": 9.076140663846925e-06, "epoch": 7.478403336312184, "percentage": 74.78, "elapsed_time": "3:28:11", "remaining_time": "1:10:11", "throughput": 2318.35, "total_tokens": 28959840} {"current_steps": 50215, "total_steps": 67140, "loss": 0.7839, "lr": 9.071131234175831e-06, "epoch": 7.479148048853142, "percentage": 74.79, "elapsed_time": "3:28:12", "remaining_time": "1:10:10", "throughput": 2318.37, "total_tokens": 28962624} {"current_steps": 50220, "total_steps": 67140, "loss": 0.4187, "lr": 9.066122880912938e-06, "epoch": 7.479892761394102, "percentage": 74.8, "elapsed_time": "3:28:13", "remaining_time": "1:10:09", "throughput": 2318.36, "total_tokens": 28965056} {"current_steps": 50225, "total_steps": 67140, "loss": 0.6593, "lr": 9.06111560439667e-06, "epoch": 7.480637473935061, "percentage": 74.81, "elapsed_time": "3:28:14", "remaining_time": "1:10:08", "throughput": 2318.38, "total_tokens": 28967936} {"current_steps": 50230, "total_steps": 67140, "loss": 0.3995, "lr": 9.056109404965408e-06, "epoch": 7.48138218647602, "percentage": 74.81, "elapsed_time": "3:28:16", "remaining_time": "1:10:06", "throughput": 2318.4, "total_tokens": 28970816} {"current_steps": 50235, "total_steps": 67140, "loss": 0.7477, "lr": 9.051104282957454e-06, "epoch": 7.482126899016979, "percentage": 74.82, "elapsed_time": "3:28:17", "remaining_time": "1:10:05", "throughput": 2318.41, "total_tokens": 28973568} {"current_steps": 50240, "total_steps": 67140, "loss": 0.5682, "lr": 9.046100238711021e-06, "epoch": 7.482871611557939, "percentage": 74.83, "elapsed_time": "3:28:18", "remaining_time": "1:10:04", "throughput": 2318.44, "total_tokens": 28976544} {"current_steps": 50245, "total_steps": 67140, "loss": 0.6528, "lr": 9.041097272564275e-06, "epoch": 7.4836163240988975, "percentage": 74.84, "elapsed_time": "3:28:19", "remaining_time": "1:10:02", "throughput": 2318.46, "total_tokens": 28979616} {"current_steps": 50250, "total_steps": 67140, "loss": 0.482, "lr": 9.036095384855287e-06, "epoch": 7.484361036639857, "percentage": 74.84, "elapsed_time": "3:28:20", "remaining_time": "1:10:01", "throughput": 2318.48, "total_tokens": 28982368} {"current_steps": 50255, "total_steps": 67140, "loss": 0.6512, "lr": 9.03109457592207e-06, "epoch": 7.485105749180816, "percentage": 74.85, "elapsed_time": "3:28:21", "remaining_time": "1:10:00", "throughput": 2318.5, "total_tokens": 28985216} {"current_steps": 50260, "total_steps": 67140, "loss": 0.5223, "lr": 9.026094846102565e-06, "epoch": 7.485850461721776, "percentage": 74.86, "elapsed_time": "3:28:22", "remaining_time": "1:09:59", "throughput": 2318.51, "total_tokens": 28988000} {"current_steps": 50265, "total_steps": 67140, "loss": 0.5425, "lr": 9.021096195734625e-06, "epoch": 7.486595174262734, "percentage": 74.87, "elapsed_time": "3:28:23", "remaining_time": "1:09:57", "throughput": 2318.52, "total_tokens": 28990752} {"current_steps": 50270, "total_steps": 67140, "loss": 0.389, "lr": 9.016098625156027e-06, "epoch": 7.487339886803694, "percentage": 74.87, "elapsed_time": "3:28:25", "remaining_time": "1:09:56", "throughput": 2318.57, "total_tokens": 28994080} {"current_steps": 50275, "total_steps": 67140, "loss": 0.6619, "lr": 9.011102134704501e-06, "epoch": 7.488084599344653, "percentage": 74.88, "elapsed_time": "3:28:26", "remaining_time": "1:09:55", "throughput": 2318.59, "total_tokens": 28997088} {"current_steps": 50280, "total_steps": 67140, "loss": 0.6193, "lr": 9.006106724717686e-06, "epoch": 7.488829311885612, "percentage": 74.89, "elapsed_time": "3:28:27", "remaining_time": "1:09:54", "throughput": 2318.62, "total_tokens": 29000128} {"current_steps": 50285, "total_steps": 67140, "loss": 0.4756, "lr": 9.001112395533153e-06, "epoch": 7.489574024426571, "percentage": 74.9, "elapsed_time": "3:28:28", "remaining_time": "1:09:52", "throughput": 2318.65, "total_tokens": 29003168} {"current_steps": 50290, "total_steps": 67140, "loss": 0.6722, "lr": 8.996119147488396e-06, "epoch": 7.490318736967531, "percentage": 74.9, "elapsed_time": "3:28:29", "remaining_time": "1:09:51", "throughput": 2318.67, "total_tokens": 29006240} {"current_steps": 50295, "total_steps": 67140, "loss": 0.5677, "lr": 8.99112698092085e-06, "epoch": 7.49106344950849, "percentage": 74.91, "elapsed_time": "3:28:31", "remaining_time": "1:09:50", "throughput": 2318.71, "total_tokens": 29009344} {"current_steps": 50300, "total_steps": 67140, "loss": 0.6546, "lr": 8.986135896167856e-06, "epoch": 7.491808162049449, "percentage": 74.92, "elapsed_time": "3:28:32", "remaining_time": "1:09:48", "throughput": 2318.73, "total_tokens": 29012224} {"current_steps": 50305, "total_steps": 67140, "loss": 0.4423, "lr": 8.98114589356668e-06, "epoch": 7.492552874590408, "percentage": 74.93, "elapsed_time": "3:28:33", "remaining_time": "1:09:47", "throughput": 2318.75, "total_tokens": 29015200} {"current_steps": 50310, "total_steps": 67140, "loss": 0.428, "lr": 8.97615697345454e-06, "epoch": 7.493297587131368, "percentage": 74.93, "elapsed_time": "3:28:34", "remaining_time": "1:09:46", "throughput": 2318.77, "total_tokens": 29018048} {"current_steps": 50315, "total_steps": 67140, "loss": 0.5294, "lr": 8.97116913616856e-06, "epoch": 7.494042299672326, "percentage": 74.94, "elapsed_time": "3:28:35", "remaining_time": "1:09:45", "throughput": 2318.78, "total_tokens": 29020736} {"current_steps": 50320, "total_steps": 67140, "loss": 0.4418, "lr": 8.966182382045801e-06, "epoch": 7.494787012213286, "percentage": 74.95, "elapsed_time": "3:28:36", "remaining_time": "1:09:43", "throughput": 2318.8, "total_tokens": 29023584} {"current_steps": 50325, "total_steps": 67140, "loss": 0.4237, "lr": 8.96119671142325e-06, "epoch": 7.495531724754245, "percentage": 74.96, "elapsed_time": "3:28:37", "remaining_time": "1:09:42", "throughput": 2318.81, "total_tokens": 29026336} {"current_steps": 50330, "total_steps": 67140, "loss": 0.7569, "lr": 8.956212124637822e-06, "epoch": 7.496276437295204, "percentage": 74.96, "elapsed_time": "3:28:38", "remaining_time": "1:09:41", "throughput": 2318.83, "total_tokens": 29029280} {"current_steps": 50335, "total_steps": 67140, "loss": 0.7508, "lr": 8.951228622026344e-06, "epoch": 7.497021149836163, "percentage": 74.97, "elapsed_time": "3:28:40", "remaining_time": "1:09:39", "throughput": 2318.87, "total_tokens": 29032416} {"current_steps": 50340, "total_steps": 67140, "loss": 0.6249, "lr": 8.946246203925584e-06, "epoch": 7.497765862377123, "percentage": 74.98, "elapsed_time": "3:28:41", "remaining_time": "1:09:38", "throughput": 2318.9, "total_tokens": 29035552} {"current_steps": 50345, "total_steps": 67140, "loss": 0.5562, "lr": 8.941264870672244e-06, "epoch": 7.498510574918082, "percentage": 74.99, "elapsed_time": "3:28:42", "remaining_time": "1:09:37", "throughput": 2318.92, "total_tokens": 29038400} {"current_steps": 50350, "total_steps": 67140, "loss": 0.7282, "lr": 8.936284622602927e-06, "epoch": 7.499255287459041, "percentage": 74.99, "elapsed_time": "3:28:43", "remaining_time": "1:09:36", "throughput": 2318.94, "total_tokens": 29041216} {"current_steps": 50355, "total_steps": 67140, "loss": 0.4657, "lr": 8.931305460054184e-06, "epoch": 7.5, "percentage": 75.0, "elapsed_time": "3:28:44", "remaining_time": "1:09:34", "throughput": 2318.97, "total_tokens": 29044256} {"current_steps": 50355, "total_steps": 67140, "eval_loss": 0.6839770674705505, "epoch": 7.5, "percentage": 75.0, "elapsed_time": "3:29:58", "remaining_time": "1:09:59", "throughput": 2305.3, "total_tokens": 29044256} {"current_steps": 50360, "total_steps": 67140, "loss": 0.626, "lr": 8.92632738336249e-06, "epoch": 7.500744712540959, "percentage": 75.01, "elapsed_time": "3:30:03", "remaining_time": "1:09:59", "throughput": 2304.77, "total_tokens": 29047264} {"current_steps": 50365, "total_steps": 67140, "loss": 0.5083, "lr": 8.921350392864247e-06, "epoch": 7.501489425081918, "percentage": 75.01, "elapsed_time": "3:30:04", "remaining_time": "1:09:58", "throughput": 2304.79, "total_tokens": 29050112} {"current_steps": 50370, "total_steps": 67140, "loss": 0.5012, "lr": 8.916374488895766e-06, "epoch": 7.502234137622878, "percentage": 75.02, "elapsed_time": "3:30:05", "remaining_time": "1:09:56", "throughput": 2304.8, "total_tokens": 29052896} {"current_steps": 50375, "total_steps": 67140, "loss": 0.5865, "lr": 8.911399671793302e-06, "epoch": 7.502978850163837, "percentage": 75.03, "elapsed_time": "3:30:06", "remaining_time": "1:09:55", "throughput": 2304.82, "total_tokens": 29055840} {"current_steps": 50380, "total_steps": 67140, "loss": 0.7108, "lr": 8.90642594189304e-06, "epoch": 7.503723562704796, "percentage": 75.04, "elapsed_time": "3:30:07", "remaining_time": "1:09:54", "throughput": 2304.84, "total_tokens": 29058528} {"current_steps": 50385, "total_steps": 67140, "loss": 0.5034, "lr": 8.90145329953109e-06, "epoch": 7.504468275245755, "percentage": 75.04, "elapsed_time": "3:30:08", "remaining_time": "1:09:52", "throughput": 2304.87, "total_tokens": 29061568} {"current_steps": 50390, "total_steps": 67140, "loss": 0.6703, "lr": 8.896481745043463e-06, "epoch": 7.505212987786714, "percentage": 75.05, "elapsed_time": "3:30:09", "remaining_time": "1:09:51", "throughput": 2304.89, "total_tokens": 29064448} {"current_steps": 50395, "total_steps": 67140, "loss": 0.6818, "lr": 8.891511278766132e-06, "epoch": 7.505957700327674, "percentage": 75.06, "elapsed_time": "3:30:11", "remaining_time": "1:09:50", "throughput": 2304.9, "total_tokens": 29067136} {"current_steps": 50400, "total_steps": 67140, "loss": 0.6643, "lr": 8.886541901034981e-06, "epoch": 7.506702412868632, "percentage": 75.07, "elapsed_time": "3:30:12", "remaining_time": "1:09:49", "throughput": 2304.92, "total_tokens": 29069952} {"current_steps": 50405, "total_steps": 67140, "loss": 0.6088, "lr": 8.88157361218581e-06, "epoch": 7.507447125409592, "percentage": 75.07, "elapsed_time": "3:30:13", "remaining_time": "1:09:47", "throughput": 2304.94, "total_tokens": 29072800} {"current_steps": 50410, "total_steps": 67140, "loss": 0.6117, "lr": 8.876606412554358e-06, "epoch": 7.508191837950551, "percentage": 75.08, "elapsed_time": "3:30:14", "remaining_time": "1:09:46", "throughput": 2304.95, "total_tokens": 29075552} {"current_steps": 50415, "total_steps": 67140, "loss": 0.7305, "lr": 8.871640302476295e-06, "epoch": 7.50893655049151, "percentage": 75.09, "elapsed_time": "3:30:15", "remaining_time": "1:09:45", "throughput": 2304.98, "total_tokens": 29078528} {"current_steps": 50420, "total_steps": 67140, "loss": 0.602, "lr": 8.866675282287204e-06, "epoch": 7.509681263032469, "percentage": 75.1, "elapsed_time": "3:30:16", "remaining_time": "1:09:43", "throughput": 2305.01, "total_tokens": 29081536} {"current_steps": 50425, "total_steps": 67140, "loss": 0.4719, "lr": 8.861711352322616e-06, "epoch": 7.510425975573429, "percentage": 75.1, "elapsed_time": "3:30:17", "remaining_time": "1:09:42", "throughput": 2305.04, "total_tokens": 29084704} {"current_steps": 50430, "total_steps": 67140, "loss": 0.5331, "lr": 8.85674851291796e-06, "epoch": 7.511170688114388, "percentage": 75.11, "elapsed_time": "3:30:18", "remaining_time": "1:09:41", "throughput": 2305.05, "total_tokens": 29087296} {"current_steps": 50435, "total_steps": 67140, "loss": 0.6053, "lr": 8.851786764408596e-06, "epoch": 7.511915400655347, "percentage": 75.12, "elapsed_time": "3:30:20", "remaining_time": "1:09:40", "throughput": 2305.09, "total_tokens": 29090592} {"current_steps": 50440, "total_steps": 67140, "loss": 0.4163, "lr": 8.84682610712983e-06, "epoch": 7.512660113196306, "percentage": 75.13, "elapsed_time": "3:30:21", "remaining_time": "1:09:38", "throughput": 2305.11, "total_tokens": 29093344} {"current_steps": 50445, "total_steps": 67140, "loss": 0.6581, "lr": 8.841866541416883e-06, "epoch": 7.513404825737266, "percentage": 75.13, "elapsed_time": "3:30:22", "remaining_time": "1:09:37", "throughput": 2305.11, "total_tokens": 29095936} {"current_steps": 50450, "total_steps": 67140, "loss": 0.4799, "lr": 8.836908067604898e-06, "epoch": 7.514149538278224, "percentage": 75.14, "elapsed_time": "3:30:23", "remaining_time": "1:09:36", "throughput": 2305.12, "total_tokens": 29098624} {"current_steps": 50455, "total_steps": 67140, "loss": 0.5536, "lr": 8.831950686028953e-06, "epoch": 7.514894250819184, "percentage": 75.15, "elapsed_time": "3:30:24", "remaining_time": "1:09:34", "throughput": 2305.15, "total_tokens": 29101632} {"current_steps": 50460, "total_steps": 67140, "loss": 0.5539, "lr": 8.826994397024055e-06, "epoch": 7.515638963360143, "percentage": 75.16, "elapsed_time": "3:30:25", "remaining_time": "1:09:33", "throughput": 2305.18, "total_tokens": 29104704} {"current_steps": 50465, "total_steps": 67140, "loss": 0.5156, "lr": 8.82203920092512e-06, "epoch": 7.5163836759011025, "percentage": 75.16, "elapsed_time": "3:30:26", "remaining_time": "1:09:32", "throughput": 2305.21, "total_tokens": 29107680} {"current_steps": 50470, "total_steps": 67140, "loss": 0.6653, "lr": 8.817085098066994e-06, "epoch": 7.517128388442061, "percentage": 75.17, "elapsed_time": "3:30:28", "remaining_time": "1:09:30", "throughput": 2305.24, "total_tokens": 29110688} {"current_steps": 50475, "total_steps": 67140, "loss": 0.7467, "lr": 8.812132088784458e-06, "epoch": 7.517873100983021, "percentage": 75.18, "elapsed_time": "3:30:29", "remaining_time": "1:09:29", "throughput": 2305.25, "total_tokens": 29113408} {"current_steps": 50480, "total_steps": 67140, "loss": 0.503, "lr": 8.807180173412225e-06, "epoch": 7.51861781352398, "percentage": 75.19, "elapsed_time": "3:30:30", "remaining_time": "1:09:28", "throughput": 2305.26, "total_tokens": 29116192} {"current_steps": 50485, "total_steps": 67140, "loss": 0.6173, "lr": 8.802229352284919e-06, "epoch": 7.519362526064939, "percentage": 75.19, "elapsed_time": "3:30:31", "remaining_time": "1:09:27", "throughput": 2305.28, "total_tokens": 29119008} {"current_steps": 50490, "total_steps": 67140, "loss": 0.6776, "lr": 8.797279625737098e-06, "epoch": 7.520107238605898, "percentage": 75.2, "elapsed_time": "3:30:32", "remaining_time": "1:09:25", "throughput": 2305.3, "total_tokens": 29121952} {"current_steps": 50495, "total_steps": 67140, "loss": 0.6565, "lr": 8.792330994103253e-06, "epoch": 7.520851951146858, "percentage": 75.21, "elapsed_time": "3:30:33", "remaining_time": "1:09:24", "throughput": 2305.32, "total_tokens": 29124704} {"current_steps": 50500, "total_steps": 67140, "loss": 0.6731, "lr": 8.787383457717777e-06, "epoch": 7.521596663687816, "percentage": 75.22, "elapsed_time": "3:30:34", "remaining_time": "1:09:23", "throughput": 2305.36, "total_tokens": 29128064} {"current_steps": 50505, "total_steps": 67140, "loss": 0.5486, "lr": 8.782437016915016e-06, "epoch": 7.522341376228776, "percentage": 75.22, "elapsed_time": "3:30:36", "remaining_time": "1:09:21", "throughput": 2305.38, "total_tokens": 29130944} {"current_steps": 50510, "total_steps": 67140, "loss": 0.6261, "lr": 8.77749167202922e-06, "epoch": 7.523086088769735, "percentage": 75.23, "elapsed_time": "3:30:37", "remaining_time": "1:09:20", "throughput": 2305.41, "total_tokens": 29133984} {"current_steps": 50515, "total_steps": 67140, "loss": 0.608, "lr": 8.77254742339458e-06, "epoch": 7.5238308013106945, "percentage": 75.24, "elapsed_time": "3:30:38", "remaining_time": "1:09:19", "throughput": 2305.42, "total_tokens": 29136672} {"current_steps": 50520, "total_steps": 67140, "loss": 0.5773, "lr": 8.767604271345209e-06, "epoch": 7.524575513851653, "percentage": 75.25, "elapsed_time": "3:30:39", "remaining_time": "1:09:18", "throughput": 2305.44, "total_tokens": 29139616} {"current_steps": 50525, "total_steps": 67140, "loss": 0.5572, "lr": 8.762662216215146e-06, "epoch": 7.525320226392612, "percentage": 75.25, "elapsed_time": "3:30:40", "remaining_time": "1:09:16", "throughput": 2305.45, "total_tokens": 29142304} {"current_steps": 50530, "total_steps": 67140, "loss": 0.5696, "lr": 8.75772125833836e-06, "epoch": 7.526064938933572, "percentage": 75.26, "elapsed_time": "3:30:41", "remaining_time": "1:09:15", "throughput": 2305.48, "total_tokens": 29145184} {"current_steps": 50535, "total_steps": 67140, "loss": 0.6522, "lr": 8.752781398048732e-06, "epoch": 7.526809651474531, "percentage": 75.27, "elapsed_time": "3:30:42", "remaining_time": "1:09:14", "throughput": 2305.5, "total_tokens": 29148160} {"current_steps": 50540, "total_steps": 67140, "loss": 0.8492, "lr": 8.747842635680076e-06, "epoch": 7.52755436401549, "percentage": 75.28, "elapsed_time": "3:30:43", "remaining_time": "1:09:12", "throughput": 2305.51, "total_tokens": 29150848} {"current_steps": 50545, "total_steps": 67140, "loss": 0.5075, "lr": 8.742904971566148e-06, "epoch": 7.528299076556449, "percentage": 75.28, "elapsed_time": "3:30:45", "remaining_time": "1:09:11", "throughput": 2305.53, "total_tokens": 29153696} {"current_steps": 50550, "total_steps": 67140, "loss": 0.6435, "lr": 8.737968406040597e-06, "epoch": 7.5290437890974085, "percentage": 75.29, "elapsed_time": "3:30:46", "remaining_time": "1:09:10", "throughput": 2305.55, "total_tokens": 29156544} {"current_steps": 50555, "total_steps": 67140, "loss": 0.6401, "lr": 8.733032939437025e-06, "epoch": 7.529788501638367, "percentage": 75.3, "elapsed_time": "3:30:47", "remaining_time": "1:09:09", "throughput": 2305.58, "total_tokens": 29159552} {"current_steps": 50560, "total_steps": 67140, "loss": 0.6603, "lr": 8.72809857208895e-06, "epoch": 7.530533214179327, "percentage": 75.31, "elapsed_time": "3:30:48", "remaining_time": "1:09:07", "throughput": 2305.61, "total_tokens": 29162592} {"current_steps": 50565, "total_steps": 67140, "loss": 0.437, "lr": 8.723165304329825e-06, "epoch": 7.531277926720286, "percentage": 75.31, "elapsed_time": "3:30:49", "remaining_time": "1:09:06", "throughput": 2305.63, "total_tokens": 29165600} {"current_steps": 50570, "total_steps": 67140, "loss": 0.7194, "lr": 8.718233136493004e-06, "epoch": 7.532022639261245, "percentage": 75.32, "elapsed_time": "3:30:50", "remaining_time": "1:09:05", "throughput": 2305.66, "total_tokens": 29168544} {"current_steps": 50575, "total_steps": 67140, "loss": 0.5555, "lr": 8.71330206891179e-06, "epoch": 7.532767351802204, "percentage": 75.33, "elapsed_time": "3:30:51", "remaining_time": "1:09:03", "throughput": 2305.67, "total_tokens": 29171328} {"current_steps": 50580, "total_steps": 67140, "loss": 0.6709, "lr": 8.708372101919407e-06, "epoch": 7.533512064343164, "percentage": 75.34, "elapsed_time": "3:30:53", "remaining_time": "1:09:02", "throughput": 2305.7, "total_tokens": 29174336} {"current_steps": 50585, "total_steps": 67140, "loss": 0.5853, "lr": 8.703443235849007e-06, "epoch": 7.534256776884122, "percentage": 75.34, "elapsed_time": "3:30:54", "remaining_time": "1:09:01", "throughput": 2305.71, "total_tokens": 29176992} {"current_steps": 50590, "total_steps": 67140, "loss": 0.5582, "lr": 8.698515471033649e-06, "epoch": 7.535001489425082, "percentage": 75.35, "elapsed_time": "3:30:55", "remaining_time": "1:09:00", "throughput": 2305.71, "total_tokens": 29179520} {"current_steps": 50595, "total_steps": 67140, "loss": 0.4722, "lr": 8.693588807806346e-06, "epoch": 7.535746201966041, "percentage": 75.36, "elapsed_time": "3:30:56", "remaining_time": "1:08:58", "throughput": 2305.72, "total_tokens": 29182112} {"current_steps": 50600, "total_steps": 67140, "loss": 0.4466, "lr": 8.688663246500005e-06, "epoch": 7.5364909145070005, "percentage": 75.36, "elapsed_time": "3:30:57", "remaining_time": "1:08:57", "throughput": 2305.75, "total_tokens": 29185216} {"current_steps": 50605, "total_steps": 67140, "loss": 0.5857, "lr": 8.683738787447488e-06, "epoch": 7.537235627047959, "percentage": 75.37, "elapsed_time": "3:30:58", "remaining_time": "1:08:56", "throughput": 2305.77, "total_tokens": 29188096} {"current_steps": 50610, "total_steps": 67140, "loss": 0.5075, "lr": 8.678815430981563e-06, "epoch": 7.537980339588919, "percentage": 75.38, "elapsed_time": "3:30:59", "remaining_time": "1:08:54", "throughput": 2305.79, "total_tokens": 29190976} {"current_steps": 50615, "total_steps": 67140, "loss": 0.7061, "lr": 8.673893177434936e-06, "epoch": 7.538725052129878, "percentage": 75.39, "elapsed_time": "3:31:00", "remaining_time": "1:08:53", "throughput": 2305.8, "total_tokens": 29193632} {"current_steps": 50620, "total_steps": 67140, "loss": 0.7922, "lr": 8.668972027140231e-06, "epoch": 7.539469764670837, "percentage": 75.39, "elapsed_time": "3:31:02", "remaining_time": "1:08:52", "throughput": 2305.82, "total_tokens": 29196576} {"current_steps": 50625, "total_steps": 67140, "loss": 0.5454, "lr": 8.664051980430008e-06, "epoch": 7.540214477211796, "percentage": 75.4, "elapsed_time": "3:31:03", "remaining_time": "1:08:51", "throughput": 2305.84, "total_tokens": 29199456} {"current_steps": 50630, "total_steps": 67140, "loss": 0.6566, "lr": 8.659133037636732e-06, "epoch": 7.540959189752756, "percentage": 75.41, "elapsed_time": "3:31:04", "remaining_time": "1:08:49", "throughput": 2305.86, "total_tokens": 29202272} {"current_steps": 50635, "total_steps": 67140, "loss": 0.532, "lr": 8.654215199092804e-06, "epoch": 7.5417039022937145, "percentage": 75.42, "elapsed_time": "3:31:05", "remaining_time": "1:08:48", "throughput": 2305.9, "total_tokens": 29205440} {"current_steps": 50640, "total_steps": 67140, "loss": 0.4046, "lr": 8.649298465130553e-06, "epoch": 7.542448614834674, "percentage": 75.42, "elapsed_time": "3:31:06", "remaining_time": "1:08:47", "throughput": 2305.92, "total_tokens": 29208224} {"current_steps": 50645, "total_steps": 67140, "loss": 0.734, "lr": 8.644382836082235e-06, "epoch": 7.543193327375633, "percentage": 75.43, "elapsed_time": "3:31:07", "remaining_time": "1:08:45", "throughput": 2305.94, "total_tokens": 29211168} {"current_steps": 50650, "total_steps": 67140, "loss": 0.5156, "lr": 8.63946831228003e-06, "epoch": 7.5439380399165925, "percentage": 75.44, "elapsed_time": "3:31:08", "remaining_time": "1:08:44", "throughput": 2305.97, "total_tokens": 29214176} {"current_steps": 50655, "total_steps": 67140, "loss": 0.5128, "lr": 8.634554894056038e-06, "epoch": 7.544682752457551, "percentage": 75.45, "elapsed_time": "3:31:10", "remaining_time": "1:08:43", "throughput": 2305.98, "total_tokens": 29216832} {"current_steps": 50660, "total_steps": 67140, "loss": 0.7181, "lr": 8.629642581742295e-06, "epoch": 7.545427464998511, "percentage": 75.45, "elapsed_time": "3:31:11", "remaining_time": "1:08:42", "throughput": 2305.99, "total_tokens": 29219680} {"current_steps": 50665, "total_steps": 67140, "loss": 0.6729, "lr": 8.624731375670752e-06, "epoch": 7.54617217753947, "percentage": 75.46, "elapsed_time": "3:31:12", "remaining_time": "1:08:40", "throughput": 2306.01, "total_tokens": 29222400} {"current_steps": 50670, "total_steps": 67140, "loss": 0.5645, "lr": 8.619821276173279e-06, "epoch": 7.546916890080429, "percentage": 75.47, "elapsed_time": "3:31:13", "remaining_time": "1:08:39", "throughput": 2306.04, "total_tokens": 29225408} {"current_steps": 50675, "total_steps": 67140, "loss": 0.553, "lr": 8.614912283581683e-06, "epoch": 7.547661602621388, "percentage": 75.48, "elapsed_time": "3:31:14", "remaining_time": "1:08:38", "throughput": 2306.04, "total_tokens": 29228000} {"current_steps": 50680, "total_steps": 67140, "loss": 0.6729, "lr": 8.6100043982277e-06, "epoch": 7.548406315162348, "percentage": 75.48, "elapsed_time": "3:31:15", "remaining_time": "1:08:36", "throughput": 2306.05, "total_tokens": 29230592} {"current_steps": 50685, "total_steps": 67140, "loss": 0.644, "lr": 8.605097620442984e-06, "epoch": 7.5491510277033065, "percentage": 75.49, "elapsed_time": "3:31:16", "remaining_time": "1:08:35", "throughput": 2306.08, "total_tokens": 29233696} {"current_steps": 50690, "total_steps": 67140, "loss": 0.5118, "lr": 8.600191950559111e-06, "epoch": 7.549895740244265, "percentage": 75.5, "elapsed_time": "3:31:17", "remaining_time": "1:08:34", "throughput": 2306.1, "total_tokens": 29236576} {"current_steps": 50695, "total_steps": 67140, "loss": 0.6066, "lr": 8.5952873889076e-06, "epoch": 7.550640452785225, "percentage": 75.51, "elapsed_time": "3:31:19", "remaining_time": "1:08:32", "throughput": 2306.12, "total_tokens": 29239392} {"current_steps": 50700, "total_steps": 67140, "loss": 0.5394, "lr": 8.590383935819862e-06, "epoch": 7.5513851653261845, "percentage": 75.51, "elapsed_time": "3:31:20", "remaining_time": "1:08:31", "throughput": 2306.13, "total_tokens": 29242016} {"current_steps": 50705, "total_steps": 67140, "loss": 0.5772, "lr": 8.58548159162727e-06, "epoch": 7.552129877867143, "percentage": 75.52, "elapsed_time": "3:31:21", "remaining_time": "1:08:30", "throughput": 2306.13, "total_tokens": 29244640} {"current_steps": 50710, "total_steps": 67140, "loss": 0.6212, "lr": 8.580580356661085e-06, "epoch": 7.552874590408102, "percentage": 75.53, "elapsed_time": "3:31:22", "remaining_time": "1:08:29", "throughput": 2306.15, "total_tokens": 29247360} {"current_steps": 50715, "total_steps": 67140, "loss": 0.6376, "lr": 8.575680231252526e-06, "epoch": 7.553619302949062, "percentage": 75.54, "elapsed_time": "3:31:23", "remaining_time": "1:08:27", "throughput": 2306.16, "total_tokens": 29250080} {"current_steps": 50720, "total_steps": 67140, "loss": 0.6594, "lr": 8.570781215732718e-06, "epoch": 7.554364015490021, "percentage": 75.54, "elapsed_time": "3:31:24", "remaining_time": "1:08:26", "throughput": 2306.17, "total_tokens": 29252704} {"current_steps": 50725, "total_steps": 67140, "loss": 0.8102, "lr": 8.565883310432717e-06, "epoch": 7.55510872803098, "percentage": 75.55, "elapsed_time": "3:31:25", "remaining_time": "1:08:25", "throughput": 2306.2, "total_tokens": 29255840} {"current_steps": 50730, "total_steps": 67140, "loss": 0.5257, "lr": 8.56098651568352e-06, "epoch": 7.555853440571939, "percentage": 75.56, "elapsed_time": "3:31:26", "remaining_time": "1:08:23", "throughput": 2306.22, "total_tokens": 29258592} {"current_steps": 50735, "total_steps": 67140, "loss": 0.7097, "lr": 8.556090831816006e-06, "epoch": 7.5565981531128985, "percentage": 75.57, "elapsed_time": "3:31:27", "remaining_time": "1:08:22", "throughput": 2306.23, "total_tokens": 29261376} {"current_steps": 50740, "total_steps": 67140, "loss": 0.6348, "lr": 8.551196259161017e-06, "epoch": 7.557342865653857, "percentage": 75.57, "elapsed_time": "3:31:29", "remaining_time": "1:08:21", "throughput": 2306.26, "total_tokens": 29264448} {"current_steps": 50745, "total_steps": 67140, "loss": 0.6623, "lr": 8.546302798049319e-06, "epoch": 7.558087578194817, "percentage": 75.58, "elapsed_time": "3:31:30", "remaining_time": "1:08:20", "throughput": 2306.28, "total_tokens": 29267232} {"current_steps": 50750, "total_steps": 67140, "loss": 0.6467, "lr": 8.541410448811574e-06, "epoch": 7.558832290735776, "percentage": 75.59, "elapsed_time": "3:31:31", "remaining_time": "1:08:18", "throughput": 2306.29, "total_tokens": 29269920} {"current_steps": 50755, "total_steps": 67140, "loss": 0.5419, "lr": 8.536519211778393e-06, "epoch": 7.559577003276735, "percentage": 75.6, "elapsed_time": "3:31:32", "remaining_time": "1:08:17", "throughput": 2306.3, "total_tokens": 29272640} {"current_steps": 50760, "total_steps": 67140, "loss": 0.6714, "lr": 8.531629087280319e-06, "epoch": 7.560321715817694, "percentage": 75.6, "elapsed_time": "3:31:33", "remaining_time": "1:08:16", "throughput": 2306.33, "total_tokens": 29275808} {"current_steps": 50765, "total_steps": 67140, "loss": 0.5643, "lr": 8.526740075647784e-06, "epoch": 7.561066428358654, "percentage": 75.61, "elapsed_time": "3:31:34", "remaining_time": "1:08:14", "throughput": 2306.35, "total_tokens": 29278624} {"current_steps": 50770, "total_steps": 67140, "loss": 0.6784, "lr": 8.52185217721118e-06, "epoch": 7.5618111408996125, "percentage": 75.62, "elapsed_time": "3:31:35", "remaining_time": "1:08:13", "throughput": 2306.37, "total_tokens": 29281504} {"current_steps": 50775, "total_steps": 67140, "loss": 0.5567, "lr": 8.516965392300813e-06, "epoch": 7.562555853440572, "percentage": 75.63, "elapsed_time": "3:31:36", "remaining_time": "1:08:12", "throughput": 2306.38, "total_tokens": 29284032} {"current_steps": 50780, "total_steps": 67140, "loss": 0.6471, "lr": 8.512079721246907e-06, "epoch": 7.563300565981531, "percentage": 75.63, "elapsed_time": "3:31:38", "remaining_time": "1:08:11", "throughput": 2306.41, "total_tokens": 29287136} {"current_steps": 50785, "total_steps": 67140, "loss": 0.5732, "lr": 8.50719516437963e-06, "epoch": 7.5640452785224905, "percentage": 75.64, "elapsed_time": "3:31:39", "remaining_time": "1:08:09", "throughput": 2306.42, "total_tokens": 29289920} {"current_steps": 50790, "total_steps": 67140, "loss": 0.6674, "lr": 8.502311722029038e-06, "epoch": 7.564789991063449, "percentage": 75.65, "elapsed_time": "3:31:40", "remaining_time": "1:08:08", "throughput": 2306.44, "total_tokens": 29292832} {"current_steps": 50795, "total_steps": 67140, "loss": 0.5039, "lr": 8.497429394525155e-06, "epoch": 7.565534703604409, "percentage": 75.66, "elapsed_time": "3:31:41", "remaining_time": "1:08:07", "throughput": 2306.47, "total_tokens": 29295840} {"current_steps": 50800, "total_steps": 67140, "loss": 0.5958, "lr": 8.49254818219789e-06, "epoch": 7.566279416145368, "percentage": 75.66, "elapsed_time": "3:31:42", "remaining_time": "1:08:05", "throughput": 2306.48, "total_tokens": 29298624} {"current_steps": 50805, "total_steps": 67140, "loss": 0.4965, "lr": 8.487668085377104e-06, "epoch": 7.567024128686327, "percentage": 75.67, "elapsed_time": "3:31:43", "remaining_time": "1:08:04", "throughput": 2306.5, "total_tokens": 29301472} {"current_steps": 50810, "total_steps": 67140, "loss": 0.7653, "lr": 8.482789104392575e-06, "epoch": 7.567768841227286, "percentage": 75.68, "elapsed_time": "3:31:44", "remaining_time": "1:08:03", "throughput": 2306.52, "total_tokens": 29304160} {"current_steps": 50815, "total_steps": 67140, "loss": 0.528, "lr": 8.477911239574005e-06, "epoch": 7.568513553768246, "percentage": 75.69, "elapsed_time": "3:31:46", "remaining_time": "1:08:02", "throughput": 2306.56, "total_tokens": 29307520} {"current_steps": 50820, "total_steps": 67140, "loss": 0.4591, "lr": 8.473034491251016e-06, "epoch": 7.5692582663092045, "percentage": 75.69, "elapsed_time": "3:31:47", "remaining_time": "1:08:00", "throughput": 2306.58, "total_tokens": 29310400} {"current_steps": 50825, "total_steps": 67140, "loss": 0.6208, "lr": 8.468158859753175e-06, "epoch": 7.570002978850164, "percentage": 75.7, "elapsed_time": "3:31:48", "remaining_time": "1:07:59", "throughput": 2306.59, "total_tokens": 29313056} {"current_steps": 50830, "total_steps": 67140, "loss": 0.6774, "lr": 8.463284345409941e-06, "epoch": 7.570747691391123, "percentage": 75.71, "elapsed_time": "3:31:49", "remaining_time": "1:07:58", "throughput": 2306.62, "total_tokens": 29316096} {"current_steps": 50835, "total_steps": 67140, "loss": 0.4919, "lr": 8.458410948550713e-06, "epoch": 7.571492403932083, "percentage": 75.71, "elapsed_time": "3:31:50", "remaining_time": "1:07:56", "throughput": 2306.65, "total_tokens": 29319072} {"current_steps": 50840, "total_steps": 67140, "loss": 0.7745, "lr": 8.453538669504818e-06, "epoch": 7.572237116473041, "percentage": 75.72, "elapsed_time": "3:31:51", "remaining_time": "1:07:55", "throughput": 2306.67, "total_tokens": 29322080} {"current_steps": 50845, "total_steps": 67140, "loss": 0.6429, "lr": 8.448667508601505e-06, "epoch": 7.572981829014001, "percentage": 75.73, "elapsed_time": "3:31:52", "remaining_time": "1:07:54", "throughput": 2306.69, "total_tokens": 29324992} {"current_steps": 50850, "total_steps": 67140, "loss": 0.5541, "lr": 8.44379746616995e-06, "epoch": 7.57372654155496, "percentage": 75.74, "elapsed_time": "3:31:54", "remaining_time": "1:07:53", "throughput": 2306.72, "total_tokens": 29327872} {"current_steps": 50855, "total_steps": 67140, "loss": 0.4466, "lr": 8.438928542539251e-06, "epoch": 7.5744712540959185, "percentage": 75.74, "elapsed_time": "3:31:55", "remaining_time": "1:07:51", "throughput": 2306.74, "total_tokens": 29330816} {"current_steps": 50860, "total_steps": 67140, "loss": 0.6552, "lr": 8.434060738038438e-06, "epoch": 7.575215966636878, "percentage": 75.75, "elapsed_time": "3:31:56", "remaining_time": "1:07:50", "throughput": 2306.77, "total_tokens": 29333696} {"current_steps": 50865, "total_steps": 67140, "loss": 0.6549, "lr": 8.429194052996445e-06, "epoch": 7.575960679177838, "percentage": 75.76, "elapsed_time": "3:31:57", "remaining_time": "1:07:49", "throughput": 2306.78, "total_tokens": 29336480} {"current_steps": 50870, "total_steps": 67140, "loss": 0.5019, "lr": 8.424328487742139e-06, "epoch": 7.5767053917187965, "percentage": 75.77, "elapsed_time": "3:31:58", "remaining_time": "1:07:47", "throughput": 2306.79, "total_tokens": 29339104} {"current_steps": 50875, "total_steps": 67140, "loss": 0.5469, "lr": 8.419464042604322e-06, "epoch": 7.577450104259755, "percentage": 75.77, "elapsed_time": "3:31:59", "remaining_time": "1:07:46", "throughput": 2306.81, "total_tokens": 29341984} {"current_steps": 50880, "total_steps": 67140, "loss": 0.6569, "lr": 8.414600717911713e-06, "epoch": 7.578194816800715, "percentage": 75.78, "elapsed_time": "3:32:00", "remaining_time": "1:07:45", "throughput": 2306.84, "total_tokens": 29345024} {"current_steps": 50885, "total_steps": 67140, "loss": 0.6257, "lr": 8.409738513992958e-06, "epoch": 7.578939529341675, "percentage": 75.79, "elapsed_time": "3:32:01", "remaining_time": "1:07:43", "throughput": 2306.86, "total_tokens": 29347808} {"current_steps": 50890, "total_steps": 67140, "loss": 0.6296, "lr": 8.404877431176621e-06, "epoch": 7.579684241882633, "percentage": 75.8, "elapsed_time": "3:32:03", "remaining_time": "1:07:42", "throughput": 2306.89, "total_tokens": 29351008} {"current_steps": 50895, "total_steps": 67140, "loss": 0.5128, "lr": 8.400017469791206e-06, "epoch": 7.580428954423592, "percentage": 75.8, "elapsed_time": "3:32:04", "remaining_time": "1:07:41", "throughput": 2306.91, "total_tokens": 29353760} {"current_steps": 50900, "total_steps": 67140, "loss": 0.6583, "lr": 8.395158630165112e-06, "epoch": 7.581173666964552, "percentage": 75.81, "elapsed_time": "3:32:05", "remaining_time": "1:07:40", "throughput": 2306.93, "total_tokens": 29356736} {"current_steps": 50905, "total_steps": 67140, "loss": 0.3832, "lr": 8.390300912626686e-06, "epoch": 7.5819183795055105, "percentage": 75.82, "elapsed_time": "3:32:06", "remaining_time": "1:07:38", "throughput": 2306.93, "total_tokens": 29359200} {"current_steps": 50910, "total_steps": 67140, "loss": 0.5137, "lr": 8.385444317504201e-06, "epoch": 7.58266309204647, "percentage": 75.83, "elapsed_time": "3:32:07", "remaining_time": "1:07:37", "throughput": 2306.96, "total_tokens": 29362112} {"current_steps": 50915, "total_steps": 67140, "loss": 0.5707, "lr": 8.380588845125833e-06, "epoch": 7.583407804587429, "percentage": 75.83, "elapsed_time": "3:32:08", "remaining_time": "1:07:36", "throughput": 2306.98, "total_tokens": 29365184} {"current_steps": 50920, "total_steps": 67140, "loss": 0.6969, "lr": 8.3757344958197e-06, "epoch": 7.584152517128389, "percentage": 75.84, "elapsed_time": "3:32:09", "remaining_time": "1:07:34", "throughput": 2307.01, "total_tokens": 29368192} {"current_steps": 50925, "total_steps": 67140, "loss": 0.6087, "lr": 8.370881269913851e-06, "epoch": 7.584897229669347, "percentage": 75.85, "elapsed_time": "3:32:11", "remaining_time": "1:07:33", "throughput": 2307.03, "total_tokens": 29370976} {"current_steps": 50930, "total_steps": 67140, "loss": 0.5438, "lr": 8.366029167736227e-06, "epoch": 7.585641942210307, "percentage": 75.86, "elapsed_time": "3:32:12", "remaining_time": "1:07:32", "throughput": 2307.05, "total_tokens": 29374048} {"current_steps": 50935, "total_steps": 67140, "loss": 0.5293, "lr": 8.361178189614724e-06, "epoch": 7.586386654751266, "percentage": 75.86, "elapsed_time": "3:32:13", "remaining_time": "1:07:31", "throughput": 2307.07, "total_tokens": 29376832} {"current_steps": 50940, "total_steps": 67140, "loss": 0.6433, "lr": 8.356328335877147e-06, "epoch": 7.587131367292225, "percentage": 75.87, "elapsed_time": "3:32:14", "remaining_time": "1:07:29", "throughput": 2307.1, "total_tokens": 29379968} {"current_steps": 50945, "total_steps": 67140, "loss": 0.5319, "lr": 8.351479606851236e-06, "epoch": 7.587876079833184, "percentage": 75.88, "elapsed_time": "3:32:15", "remaining_time": "1:07:28", "throughput": 2307.12, "total_tokens": 29382752} {"current_steps": 50950, "total_steps": 67140, "loss": 0.7266, "lr": 8.346632002864655e-06, "epoch": 7.588620792374144, "percentage": 75.89, "elapsed_time": "3:32:16", "remaining_time": "1:07:27", "throughput": 2307.14, "total_tokens": 29385728} {"current_steps": 50955, "total_steps": 67140, "loss": 0.6435, "lr": 8.341785524244964e-06, "epoch": 7.5893655049151025, "percentage": 75.89, "elapsed_time": "3:32:17", "remaining_time": "1:07:26", "throughput": 2307.17, "total_tokens": 29388640} {"current_steps": 50960, "total_steps": 67140, "loss": 0.5632, "lr": 8.33694017131969e-06, "epoch": 7.590110217456062, "percentage": 75.9, "elapsed_time": "3:32:19", "remaining_time": "1:07:24", "throughput": 2307.19, "total_tokens": 29391616} {"current_steps": 50965, "total_steps": 67140, "loss": 0.5217, "lr": 8.332095944416243e-06, "epoch": 7.590854929997021, "percentage": 75.91, "elapsed_time": "3:32:20", "remaining_time": "1:07:23", "throughput": 2307.21, "total_tokens": 29394400} {"current_steps": 50970, "total_steps": 67140, "loss": 0.5974, "lr": 8.327252843861986e-06, "epoch": 7.591599642537981, "percentage": 75.92, "elapsed_time": "3:32:21", "remaining_time": "1:07:22", "throughput": 2307.23, "total_tokens": 29397216} {"current_steps": 50975, "total_steps": 67140, "loss": 0.6768, "lr": 8.322410869984195e-06, "epoch": 7.592344355078939, "percentage": 75.92, "elapsed_time": "3:32:22", "remaining_time": "1:07:20", "throughput": 2307.25, "total_tokens": 29400064} {"current_steps": 50980, "total_steps": 67140, "loss": 0.7429, "lr": 8.317570023110072e-06, "epoch": 7.593089067619899, "percentage": 75.93, "elapsed_time": "3:32:23", "remaining_time": "1:07:19", "throughput": 2307.27, "total_tokens": 29402944} {"current_steps": 50985, "total_steps": 67140, "loss": 0.6567, "lr": 8.312730303566738e-06, "epoch": 7.593833780160858, "percentage": 75.94, "elapsed_time": "3:32:24", "remaining_time": "1:07:18", "throughput": 2307.28, "total_tokens": 29405632} {"current_steps": 50990, "total_steps": 67140, "loss": 0.5219, "lr": 8.307891711681257e-06, "epoch": 7.594578492701817, "percentage": 75.95, "elapsed_time": "3:32:25", "remaining_time": "1:07:16", "throughput": 2307.31, "total_tokens": 29408800} {"current_steps": 50995, "total_steps": 67140, "loss": 0.7382, "lr": 8.303054247780587e-06, "epoch": 7.595323205242776, "percentage": 75.95, "elapsed_time": "3:32:27", "remaining_time": "1:07:15", "throughput": 2307.34, "total_tokens": 29411936} {"current_steps": 51000, "total_steps": 67140, "loss": 0.4763, "lr": 8.298217912191617e-06, "epoch": 7.596067917783736, "percentage": 75.96, "elapsed_time": "3:32:28", "remaining_time": "1:07:14", "throughput": 2307.36, "total_tokens": 29414752} {"current_steps": 51005, "total_steps": 67140, "loss": 0.6575, "lr": 8.293382705241177e-06, "epoch": 7.596812630324695, "percentage": 75.97, "elapsed_time": "3:32:29", "remaining_time": "1:07:13", "throughput": 2307.38, "total_tokens": 29417696} {"current_steps": 51010, "total_steps": 67140, "loss": 0.6791, "lr": 8.28854862725601e-06, "epoch": 7.597557342865654, "percentage": 75.98, "elapsed_time": "3:32:30", "remaining_time": "1:07:11", "throughput": 2307.4, "total_tokens": 29420544} {"current_steps": 51015, "total_steps": 67140, "loss": 0.43, "lr": 8.283715678562781e-06, "epoch": 7.598302055406613, "percentage": 75.98, "elapsed_time": "3:32:31", "remaining_time": "1:07:10", "throughput": 2307.41, "total_tokens": 29423232} {"current_steps": 51020, "total_steps": 67140, "loss": 0.5771, "lr": 8.278883859488085e-06, "epoch": 7.599046767947573, "percentage": 75.99, "elapsed_time": "3:32:32", "remaining_time": "1:07:09", "throughput": 2307.45, "total_tokens": 29426432} {"current_steps": 51025, "total_steps": 67140, "loss": 0.7003, "lr": 8.274053170358442e-06, "epoch": 7.599791480488531, "percentage": 76.0, "elapsed_time": "3:32:33", "remaining_time": "1:07:08", "throughput": 2307.48, "total_tokens": 29429376} {"current_steps": 51030, "total_steps": 67140, "loss": 0.5617, "lr": 8.269223611500285e-06, "epoch": 7.600536193029491, "percentage": 76.01, "elapsed_time": "3:32:35", "remaining_time": "1:07:06", "throughput": 2307.49, "total_tokens": 29432192} {"current_steps": 51035, "total_steps": 67140, "loss": 0.6477, "lr": 8.264395183239962e-06, "epoch": 7.60128090557045, "percentage": 76.01, "elapsed_time": "3:32:36", "remaining_time": "1:07:05", "throughput": 2307.52, "total_tokens": 29435168} {"current_steps": 51040, "total_steps": 67140, "loss": 0.5693, "lr": 8.259567885903775e-06, "epoch": 7.6020256181114085, "percentage": 76.02, "elapsed_time": "3:32:37", "remaining_time": "1:07:04", "throughput": 2307.53, "total_tokens": 29437952} {"current_steps": 51045, "total_steps": 67140, "loss": 0.3877, "lr": 8.254741719817924e-06, "epoch": 7.602770330652368, "percentage": 76.03, "elapsed_time": "3:32:38", "remaining_time": "1:07:02", "throughput": 2307.57, "total_tokens": 29441056} {"current_steps": 51050, "total_steps": 67140, "loss": 0.5699, "lr": 8.249916685308548e-06, "epoch": 7.603515043193328, "percentage": 76.04, "elapsed_time": "3:32:39", "remaining_time": "1:07:01", "throughput": 2307.59, "total_tokens": 29443936} {"current_steps": 51055, "total_steps": 67140, "loss": 0.5265, "lr": 8.245092782701703e-06, "epoch": 7.604259755734287, "percentage": 76.04, "elapsed_time": "3:32:40", "remaining_time": "1:07:00", "throughput": 2307.6, "total_tokens": 29446784} {"current_steps": 51060, "total_steps": 67140, "loss": 0.6374, "lr": 8.240270012323375e-06, "epoch": 7.605004468275245, "percentage": 76.05, "elapsed_time": "3:32:41", "remaining_time": "1:06:59", "throughput": 2307.63, "total_tokens": 29449792} {"current_steps": 51065, "total_steps": 67140, "loss": 0.6235, "lr": 8.23544837449945e-06, "epoch": 7.605749180816205, "percentage": 76.06, "elapsed_time": "3:32:43", "remaining_time": "1:06:57", "throughput": 2307.67, "total_tokens": 29453024} {"current_steps": 51070, "total_steps": 67140, "loss": 0.6017, "lr": 8.230627869555775e-06, "epoch": 7.606493893357164, "percentage": 76.06, "elapsed_time": "3:32:44", "remaining_time": "1:06:56", "throughput": 2307.67, "total_tokens": 29455680} {"current_steps": 51075, "total_steps": 67140, "loss": 0.6721, "lr": 8.225808497818077e-06, "epoch": 7.607238605898123, "percentage": 76.07, "elapsed_time": "3:32:45", "remaining_time": "1:06:55", "throughput": 2307.7, "total_tokens": 29458560} {"current_steps": 51080, "total_steps": 67140, "loss": 0.4234, "lr": 8.220990259612043e-06, "epoch": 7.607983318439082, "percentage": 76.08, "elapsed_time": "3:32:46", "remaining_time": "1:06:53", "throughput": 2307.74, "total_tokens": 29461856} {"current_steps": 51085, "total_steps": 67140, "loss": 0.5621, "lr": 8.216173155263271e-06, "epoch": 7.608728030980042, "percentage": 76.09, "elapsed_time": "3:32:47", "remaining_time": "1:06:52", "throughput": 2307.76, "total_tokens": 29464768} {"current_steps": 51090, "total_steps": 67140, "loss": 0.445, "lr": 8.211357185097285e-06, "epoch": 7.609472743521001, "percentage": 76.09, "elapsed_time": "3:32:48", "remaining_time": "1:06:51", "throughput": 2307.78, "total_tokens": 29467680} {"current_steps": 51095, "total_steps": 67140, "loss": 0.602, "lr": 8.206542349439517e-06, "epoch": 7.61021745606196, "percentage": 76.1, "elapsed_time": "3:32:49", "remaining_time": "1:06:50", "throughput": 2307.79, "total_tokens": 29470368} {"current_steps": 51100, "total_steps": 67140, "loss": 0.6387, "lr": 8.20172864861534e-06, "epoch": 7.610962168602919, "percentage": 76.11, "elapsed_time": "3:32:51", "remaining_time": "1:06:48", "throughput": 2307.8, "total_tokens": 29473120} {"current_steps": 51105, "total_steps": 67140, "loss": 0.4163, "lr": 8.19691608295004e-06, "epoch": 7.611706881143879, "percentage": 76.12, "elapsed_time": "3:32:52", "remaining_time": "1:06:47", "throughput": 2307.83, "total_tokens": 29476064} {"current_steps": 51110, "total_steps": 67140, "loss": 0.4654, "lr": 8.192104652768848e-06, "epoch": 7.612451593684837, "percentage": 76.12, "elapsed_time": "3:32:53", "remaining_time": "1:06:46", "throughput": 2307.86, "total_tokens": 29479232} {"current_steps": 51115, "total_steps": 67140, "loss": 0.617, "lr": 8.187294358396874e-06, "epoch": 7.613196306225797, "percentage": 76.13, "elapsed_time": "3:32:54", "remaining_time": "1:06:44", "throughput": 2307.88, "total_tokens": 29482048} {"current_steps": 51120, "total_steps": 67140, "loss": 0.6568, "lr": 8.182485200159195e-06, "epoch": 7.613941018766756, "percentage": 76.14, "elapsed_time": "3:32:55", "remaining_time": "1:06:43", "throughput": 2307.88, "total_tokens": 29484672} {"current_steps": 51125, "total_steps": 67140, "loss": 0.7165, "lr": 8.177677178380799e-06, "epoch": 7.614685731307715, "percentage": 76.15, "elapsed_time": "3:32:56", "remaining_time": "1:06:42", "throughput": 2307.89, "total_tokens": 29487360} {"current_steps": 51130, "total_steps": 67140, "loss": 0.6848, "lr": 8.172870293386579e-06, "epoch": 7.615430443848674, "percentage": 76.15, "elapsed_time": "3:32:57", "remaining_time": "1:06:41", "throughput": 2307.88, "total_tokens": 29489696} {"current_steps": 51135, "total_steps": 67140, "loss": 0.5309, "lr": 8.168064545501367e-06, "epoch": 7.616175156389634, "percentage": 76.16, "elapsed_time": "3:32:58", "remaining_time": "1:06:39", "throughput": 2307.9, "total_tokens": 29492512} {"current_steps": 51140, "total_steps": 67140, "loss": 0.714, "lr": 8.16325993504992e-06, "epoch": 7.616919868930593, "percentage": 76.17, "elapsed_time": "3:33:00", "remaining_time": "1:06:38", "throughput": 2307.92, "total_tokens": 29495296} {"current_steps": 51145, "total_steps": 67140, "loss": 0.5603, "lr": 8.158456462356915e-06, "epoch": 7.617664581471552, "percentage": 76.18, "elapsed_time": "3:33:01", "remaining_time": "1:06:37", "throughput": 2307.94, "total_tokens": 29498176} {"current_steps": 51150, "total_steps": 67140, "loss": 0.4944, "lr": 8.153654127746957e-06, "epoch": 7.618409294012511, "percentage": 76.18, "elapsed_time": "3:33:02", "remaining_time": "1:06:35", "throughput": 2307.95, "total_tokens": 29500832} {"current_steps": 51155, "total_steps": 67140, "loss": 0.5932, "lr": 8.148852931544551e-06, "epoch": 7.619154006553471, "percentage": 76.19, "elapsed_time": "3:33:03", "remaining_time": "1:06:34", "throughput": 2307.96, "total_tokens": 29503616} {"current_steps": 51160, "total_steps": 67140, "loss": 0.6443, "lr": 8.144052874074162e-06, "epoch": 7.619898719094429, "percentage": 76.2, "elapsed_time": "3:33:04", "remaining_time": "1:06:33", "throughput": 2307.98, "total_tokens": 29506496} {"current_steps": 51165, "total_steps": 67140, "loss": 0.3881, "lr": 8.139253955660139e-06, "epoch": 7.620643431635389, "percentage": 76.21, "elapsed_time": "3:33:05", "remaining_time": "1:06:31", "throughput": 2307.98, "total_tokens": 29508928} {"current_steps": 51170, "total_steps": 67140, "loss": 0.6219, "lr": 8.134456176626784e-06, "epoch": 7.621388144176348, "percentage": 76.21, "elapsed_time": "3:33:06", "remaining_time": "1:06:30", "throughput": 2308.0, "total_tokens": 29511840} {"current_steps": 51175, "total_steps": 67140, "loss": 0.6967, "lr": 8.129659537298308e-06, "epoch": 7.6221328567173074, "percentage": 76.22, "elapsed_time": "3:33:07", "remaining_time": "1:06:29", "throughput": 2308.03, "total_tokens": 29514752} {"current_steps": 51180, "total_steps": 67140, "loss": 0.6152, "lr": 8.124864037998852e-06, "epoch": 7.622877569258266, "percentage": 76.23, "elapsed_time": "3:33:08", "remaining_time": "1:06:28", "throughput": 2308.03, "total_tokens": 29517376} {"current_steps": 51185, "total_steps": 67140, "loss": 0.676, "lr": 8.120069679052477e-06, "epoch": 7.623622281799226, "percentage": 76.24, "elapsed_time": "3:33:10", "remaining_time": "1:06:26", "throughput": 2308.06, "total_tokens": 29520320} {"current_steps": 51190, "total_steps": 67140, "loss": 0.557, "lr": 8.115276460783172e-06, "epoch": 7.624366994340185, "percentage": 76.24, "elapsed_time": "3:33:11", "remaining_time": "1:06:25", "throughput": 2308.08, "total_tokens": 29523200} {"current_steps": 51195, "total_steps": 67140, "loss": 0.6567, "lr": 8.110484383514835e-06, "epoch": 7.625111706881144, "percentage": 76.25, "elapsed_time": "3:33:12", "remaining_time": "1:06:24", "throughput": 2308.09, "total_tokens": 29525984} {"current_steps": 51200, "total_steps": 67140, "loss": 0.6863, "lr": 8.105693447571286e-06, "epoch": 7.625856419422103, "percentage": 76.26, "elapsed_time": "3:33:13", "remaining_time": "1:06:22", "throughput": 2308.12, "total_tokens": 29528992} {"current_steps": 51205, "total_steps": 67140, "loss": 0.6808, "lr": 8.100903653276287e-06, "epoch": 7.626601131963062, "percentage": 76.27, "elapsed_time": "3:33:14", "remaining_time": "1:06:21", "throughput": 2308.13, "total_tokens": 29531712} {"current_steps": 51210, "total_steps": 67140, "loss": 0.4607, "lr": 8.096115000953513e-06, "epoch": 7.627345844504021, "percentage": 76.27, "elapsed_time": "3:33:15", "remaining_time": "1:06:20", "throughput": 2308.15, "total_tokens": 29534432} {"current_steps": 51215, "total_steps": 67140, "loss": 0.6013, "lr": 8.091327490926561e-06, "epoch": 7.628090557044981, "percentage": 76.28, "elapsed_time": "3:33:16", "remaining_time": "1:06:19", "throughput": 2308.16, "total_tokens": 29537248} {"current_steps": 51220, "total_steps": 67140, "loss": 0.5897, "lr": 8.08654112351895e-06, "epoch": 7.62883526958594, "percentage": 76.29, "elapsed_time": "3:33:17", "remaining_time": "1:06:17", "throughput": 2308.18, "total_tokens": 29540096} {"current_steps": 51225, "total_steps": 67140, "loss": 0.7233, "lr": 8.081755899054136e-06, "epoch": 7.629579982126899, "percentage": 76.3, "elapsed_time": "3:33:19", "remaining_time": "1:06:16", "throughput": 2308.21, "total_tokens": 29543040} {"current_steps": 51230, "total_steps": 67140, "loss": 0.64, "lr": 8.076971817855472e-06, "epoch": 7.630324694667858, "percentage": 76.3, "elapsed_time": "3:33:20", "remaining_time": "1:06:15", "throughput": 2308.23, "total_tokens": 29545952} {"current_steps": 51235, "total_steps": 67140, "loss": 0.7134, "lr": 8.07218888024624e-06, "epoch": 7.631069407208818, "percentage": 76.31, "elapsed_time": "3:33:21", "remaining_time": "1:06:13", "throughput": 2308.26, "total_tokens": 29549024} {"current_steps": 51240, "total_steps": 67140, "loss": 0.7334, "lr": 8.067407086549661e-06, "epoch": 7.631814119749777, "percentage": 76.32, "elapsed_time": "3:33:22", "remaining_time": "1:06:12", "throughput": 2308.29, "total_tokens": 29552064} {"current_steps": 51245, "total_steps": 67140, "loss": 0.6948, "lr": 8.06262643708887e-06, "epoch": 7.632558832290735, "percentage": 76.33, "elapsed_time": "3:33:23", "remaining_time": "1:06:11", "throughput": 2308.31, "total_tokens": 29554944} {"current_steps": 51250, "total_steps": 67140, "loss": 0.4935, "lr": 8.05784693218692e-06, "epoch": 7.633303544831695, "percentage": 76.33, "elapsed_time": "3:33:24", "remaining_time": "1:06:10", "throughput": 2308.34, "total_tokens": 29557920} {"current_steps": 51255, "total_steps": 67140, "loss": 0.6478, "lr": 8.053068572166797e-06, "epoch": 7.634048257372654, "percentage": 76.34, "elapsed_time": "3:33:25", "remaining_time": "1:06:08", "throughput": 2308.35, "total_tokens": 29560736} {"current_steps": 51260, "total_steps": 67140, "loss": 0.5187, "lr": 8.048291357351395e-06, "epoch": 7.6347929699136134, "percentage": 76.35, "elapsed_time": "3:33:27", "remaining_time": "1:06:07", "throughput": 2308.38, "total_tokens": 29563680} {"current_steps": 51265, "total_steps": 67140, "loss": 0.5587, "lr": 8.043515288063542e-06, "epoch": 7.635537682454572, "percentage": 76.36, "elapsed_time": "3:33:28", "remaining_time": "1:06:06", "throughput": 2308.4, "total_tokens": 29566528} {"current_steps": 51270, "total_steps": 67140, "loss": 0.5038, "lr": 8.038740364625994e-06, "epoch": 7.636282394995532, "percentage": 76.36, "elapsed_time": "3:33:29", "remaining_time": "1:06:04", "throughput": 2308.41, "total_tokens": 29569344} {"current_steps": 51275, "total_steps": 67140, "loss": 0.6357, "lr": 8.033966587361402e-06, "epoch": 7.637027107536491, "percentage": 76.37, "elapsed_time": "3:33:30", "remaining_time": "1:06:03", "throughput": 2308.44, "total_tokens": 29572448} {"current_steps": 51280, "total_steps": 67140, "loss": 0.5643, "lr": 8.029193956592371e-06, "epoch": 7.63777182007745, "percentage": 76.38, "elapsed_time": "3:33:31", "remaining_time": "1:06:02", "throughput": 2308.45, "total_tokens": 29575040} {"current_steps": 51285, "total_steps": 67140, "loss": 0.5423, "lr": 8.024422472641416e-06, "epoch": 7.638516532618409, "percentage": 76.39, "elapsed_time": "3:33:32", "remaining_time": "1:06:01", "throughput": 2308.49, "total_tokens": 29578272} {"current_steps": 51290, "total_steps": 67140, "loss": 0.6894, "lr": 8.01965213583098e-06, "epoch": 7.639261245159369, "percentage": 76.39, "elapsed_time": "3:33:33", "remaining_time": "1:05:59", "throughput": 2308.5, "total_tokens": 29581056} {"current_steps": 51295, "total_steps": 67140, "loss": 0.5695, "lr": 8.014882946483403e-06, "epoch": 7.640005957700327, "percentage": 76.4, "elapsed_time": "3:33:35", "remaining_time": "1:05:58", "throughput": 2308.52, "total_tokens": 29583808} {"current_steps": 51300, "total_steps": 67140, "loss": 0.7897, "lr": 8.010114904920984e-06, "epoch": 7.640750670241287, "percentage": 76.41, "elapsed_time": "3:33:36", "remaining_time": "1:05:57", "throughput": 2308.54, "total_tokens": 29586848} {"current_steps": 51305, "total_steps": 67140, "loss": 0.5945, "lr": 8.005348011465925e-06, "epoch": 7.641495382782246, "percentage": 76.41, "elapsed_time": "3:33:37", "remaining_time": "1:05:56", "throughput": 2308.56, "total_tokens": 29589600} {"current_steps": 51310, "total_steps": 67140, "loss": 0.6502, "lr": 8.000582266440356e-06, "epoch": 7.6422400953232055, "percentage": 76.42, "elapsed_time": "3:33:38", "remaining_time": "1:05:54", "throughput": 2308.58, "total_tokens": 29592480} {"current_steps": 51315, "total_steps": 67140, "loss": 0.4875, "lr": 7.995817670166319e-06, "epoch": 7.642984807864164, "percentage": 76.43, "elapsed_time": "3:33:39", "remaining_time": "1:05:53", "throughput": 2308.61, "total_tokens": 29595488} {"current_steps": 51320, "total_steps": 67140, "loss": 0.7739, "lr": 7.991054222965788e-06, "epoch": 7.643729520405124, "percentage": 76.44, "elapsed_time": "3:33:40", "remaining_time": "1:05:52", "throughput": 2308.63, "total_tokens": 29598432} {"current_steps": 51325, "total_steps": 67140, "loss": 0.4274, "lr": 7.986291925160668e-06, "epoch": 7.644474232946083, "percentage": 76.44, "elapsed_time": "3:33:41", "remaining_time": "1:05:50", "throughput": 2308.65, "total_tokens": 29601312} {"current_steps": 51330, "total_steps": 67140, "loss": 0.5629, "lr": 7.98153077707276e-06, "epoch": 7.645218945487042, "percentage": 76.45, "elapsed_time": "3:33:43", "remaining_time": "1:05:49", "throughput": 2308.66, "total_tokens": 29604032} {"current_steps": 51335, "total_steps": 67140, "loss": 0.6202, "lr": 7.976770779023807e-06, "epoch": 7.645963658028001, "percentage": 76.46, "elapsed_time": "3:33:44", "remaining_time": "1:05:48", "throughput": 2308.67, "total_tokens": 29606752} {"current_steps": 51340, "total_steps": 67140, "loss": 0.6514, "lr": 7.972011931335474e-06, "epoch": 7.646708370568961, "percentage": 76.47, "elapsed_time": "3:33:45", "remaining_time": "1:05:47", "throughput": 2308.68, "total_tokens": 29609504} {"current_steps": 51345, "total_steps": 67140, "loss": 0.6339, "lr": 7.967254234329347e-06, "epoch": 7.6474530831099194, "percentage": 76.47, "elapsed_time": "3:33:46", "remaining_time": "1:05:45", "throughput": 2308.71, "total_tokens": 29612384} {"current_steps": 51350, "total_steps": 67140, "loss": 0.6188, "lr": 7.962497688326934e-06, "epoch": 7.648197795650879, "percentage": 76.48, "elapsed_time": "3:33:47", "remaining_time": "1:05:44", "throughput": 2308.74, "total_tokens": 29615488} {"current_steps": 51355, "total_steps": 67140, "loss": 0.7039, "lr": 7.95774229364965e-06, "epoch": 7.648942508191838, "percentage": 76.49, "elapsed_time": "3:33:48", "remaining_time": "1:05:43", "throughput": 2308.78, "total_tokens": 29618816} {"current_steps": 51360, "total_steps": 67140, "loss": 0.6901, "lr": 7.952988050618862e-06, "epoch": 7.6496872207327975, "percentage": 76.5, "elapsed_time": "3:33:49", "remaining_time": "1:05:41", "throughput": 2308.79, "total_tokens": 29621504} {"current_steps": 51365, "total_steps": 67140, "loss": 0.6622, "lr": 7.948234959555825e-06, "epoch": 7.650431933273756, "percentage": 76.5, "elapsed_time": "3:33:51", "remaining_time": "1:05:40", "throughput": 2308.81, "total_tokens": 29624448} {"current_steps": 51370, "total_steps": 67140, "loss": 0.4738, "lr": 7.943483020781741e-06, "epoch": 7.651176645814716, "percentage": 76.51, "elapsed_time": "3:33:52", "remaining_time": "1:05:39", "throughput": 2308.84, "total_tokens": 29627488} {"current_steps": 51375, "total_steps": 67140, "loss": 0.5171, "lr": 7.93873223461773e-06, "epoch": 7.651921358355675, "percentage": 76.52, "elapsed_time": "3:33:53", "remaining_time": "1:05:38", "throughput": 2308.85, "total_tokens": 29630080} {"current_steps": 51380, "total_steps": 67140, "loss": 0.5723, "lr": 7.933982601384825e-06, "epoch": 7.652666070896634, "percentage": 76.53, "elapsed_time": "3:33:54", "remaining_time": "1:05:36", "throughput": 2308.87, "total_tokens": 29633056} {"current_steps": 51385, "total_steps": 67140, "loss": 0.6152, "lr": 7.929234121403994e-06, "epoch": 7.653410783437593, "percentage": 76.53, "elapsed_time": "3:33:55", "remaining_time": "1:05:35", "throughput": 2308.9, "total_tokens": 29636128} {"current_steps": 51390, "total_steps": 67140, "loss": 0.7141, "lr": 7.924486794996122e-06, "epoch": 7.654155495978552, "percentage": 76.54, "elapsed_time": "3:33:56", "remaining_time": "1:05:34", "throughput": 2308.92, "total_tokens": 29639008} {"current_steps": 51395, "total_steps": 67140, "loss": 0.6608, "lr": 7.919740622482012e-06, "epoch": 7.6549002085195115, "percentage": 76.55, "elapsed_time": "3:33:57", "remaining_time": "1:05:32", "throughput": 2308.94, "total_tokens": 29641888} {"current_steps": 51400, "total_steps": 67140, "loss": 0.7851, "lr": 7.914995604182373e-06, "epoch": 7.655644921060471, "percentage": 76.56, "elapsed_time": "3:33:59", "remaining_time": "1:05:31", "throughput": 2308.96, "total_tokens": 29644736} {"current_steps": 51405, "total_steps": 67140, "loss": 0.6004, "lr": 7.910251740417873e-06, "epoch": 7.65638963360143, "percentage": 76.56, "elapsed_time": "3:34:00", "remaining_time": "1:05:30", "throughput": 2308.97, "total_tokens": 29647456} {"current_steps": 51410, "total_steps": 67140, "loss": 0.8269, "lr": 7.905509031509079e-06, "epoch": 7.657134346142389, "percentage": 76.57, "elapsed_time": "3:34:01", "remaining_time": "1:05:29", "throughput": 2309.0, "total_tokens": 29650656} {"current_steps": 51415, "total_steps": 67140, "loss": 0.6382, "lr": 7.900767477776483e-06, "epoch": 7.657879058683348, "percentage": 76.58, "elapsed_time": "3:34:02", "remaining_time": "1:05:27", "throughput": 2309.02, "total_tokens": 29653568} {"current_steps": 51420, "total_steps": 67140, "loss": 0.4518, "lr": 7.896027079540508e-06, "epoch": 7.658623771224307, "percentage": 76.59, "elapsed_time": "3:34:03", "remaining_time": "1:05:26", "throughput": 2309.04, "total_tokens": 29656384} {"current_steps": 51425, "total_steps": 67140, "loss": 0.6074, "lr": 7.891287837121472e-06, "epoch": 7.659368483765267, "percentage": 76.59, "elapsed_time": "3:34:04", "remaining_time": "1:05:25", "throughput": 2309.06, "total_tokens": 29659232} {"current_steps": 51430, "total_steps": 67140, "loss": 0.7077, "lr": 7.886549750839658e-06, "epoch": 7.6601131963062254, "percentage": 76.6, "elapsed_time": "3:34:05", "remaining_time": "1:05:23", "throughput": 2309.09, "total_tokens": 29662240} {"current_steps": 51435, "total_steps": 67140, "loss": 0.5471, "lr": 7.881812821015221e-06, "epoch": 7.660857908847185, "percentage": 76.61, "elapsed_time": "3:34:07", "remaining_time": "1:05:22", "throughput": 2309.11, "total_tokens": 29665312} {"current_steps": 51440, "total_steps": 67140, "loss": 0.4735, "lr": 7.877077047968282e-06, "epoch": 7.661602621388144, "percentage": 76.62, "elapsed_time": "3:34:08", "remaining_time": "1:05:21", "throughput": 2309.14, "total_tokens": 29668192} {"current_steps": 51445, "total_steps": 67140, "loss": 0.5719, "lr": 7.872342432018856e-06, "epoch": 7.6623473339291035, "percentage": 76.62, "elapsed_time": "3:34:09", "remaining_time": "1:05:20", "throughput": 2309.15, "total_tokens": 29671040} {"current_steps": 51450, "total_steps": 67140, "loss": 0.5943, "lr": 7.867608973486892e-06, "epoch": 7.663092046470062, "percentage": 76.63, "elapsed_time": "3:34:10", "remaining_time": "1:05:18", "throughput": 2309.17, "total_tokens": 29673792} {"current_steps": 51455, "total_steps": 67140, "loss": 0.4892, "lr": 7.862876672692265e-06, "epoch": 7.663836759011022, "percentage": 76.64, "elapsed_time": "3:34:11", "remaining_time": "1:05:17", "throughput": 2309.19, "total_tokens": 29676736} {"current_steps": 51460, "total_steps": 67140, "loss": 0.692, "lr": 7.858145529954752e-06, "epoch": 7.664581471551981, "percentage": 76.65, "elapsed_time": "3:34:12", "remaining_time": "1:05:16", "throughput": 2309.22, "total_tokens": 29679712} {"current_steps": 51465, "total_steps": 67140, "loss": 0.4684, "lr": 7.853415545594073e-06, "epoch": 7.66532618409294, "percentage": 76.65, "elapsed_time": "3:34:13", "remaining_time": "1:05:14", "throughput": 2309.23, "total_tokens": 29682432} {"current_steps": 51470, "total_steps": 67140, "loss": 0.7176, "lr": 7.848686719929863e-06, "epoch": 7.666070896633899, "percentage": 76.66, "elapsed_time": "3:34:14", "remaining_time": "1:05:13", "throughput": 2309.25, "total_tokens": 29685184} {"current_steps": 51475, "total_steps": 67140, "loss": 0.6525, "lr": 7.843959053281663e-06, "epoch": 7.666815609174859, "percentage": 76.67, "elapsed_time": "3:34:16", "remaining_time": "1:05:12", "throughput": 2309.27, "total_tokens": 29687968} {"current_steps": 51480, "total_steps": 67140, "loss": 0.671, "lr": 7.839232545968964e-06, "epoch": 7.6675603217158175, "percentage": 76.68, "elapsed_time": "3:34:17", "remaining_time": "1:05:11", "throughput": 2309.29, "total_tokens": 29690912} {"current_steps": 51485, "total_steps": 67140, "loss": 0.6394, "lr": 7.834507198311154e-06, "epoch": 7.668305034256777, "percentage": 76.68, "elapsed_time": "3:34:18", "remaining_time": "1:05:09", "throughput": 2309.31, "total_tokens": 29693792} {"current_steps": 51490, "total_steps": 67140, "loss": 0.5158, "lr": 7.829783010627568e-06, "epoch": 7.669049746797736, "percentage": 76.69, "elapsed_time": "3:34:19", "remaining_time": "1:05:08", "throughput": 2309.33, "total_tokens": 29696512} {"current_steps": 51495, "total_steps": 67140, "loss": 0.5042, "lr": 7.82505998323743e-06, "epoch": 7.6697944593386955, "percentage": 76.7, "elapsed_time": "3:34:20", "remaining_time": "1:05:07", "throughput": 2309.35, "total_tokens": 29699456} {"current_steps": 51500, "total_steps": 67140, "loss": 0.4801, "lr": 7.820338116459908e-06, "epoch": 7.670539171879654, "percentage": 76.71, "elapsed_time": "3:34:21", "remaining_time": "1:05:05", "throughput": 2309.37, "total_tokens": 29702304} {"current_steps": 51505, "total_steps": 67140, "loss": 0.5884, "lr": 7.815617410614087e-06, "epoch": 7.671283884420614, "percentage": 76.71, "elapsed_time": "3:34:22", "remaining_time": "1:05:04", "throughput": 2309.39, "total_tokens": 29705312} {"current_steps": 51510, "total_steps": 67140, "loss": 0.5489, "lr": 7.81089786601898e-06, "epoch": 7.672028596961573, "percentage": 76.72, "elapsed_time": "3:34:23", "remaining_time": "1:05:03", "throughput": 2309.42, "total_tokens": 29708320} {"current_steps": 51515, "total_steps": 67140, "loss": 0.4027, "lr": 7.806179482993514e-06, "epoch": 7.672773309502532, "percentage": 76.73, "elapsed_time": "3:34:25", "remaining_time": "1:05:02", "throughput": 2309.46, "total_tokens": 29711616} {"current_steps": 51520, "total_steps": 67140, "loss": 0.6201, "lr": 7.801462261856526e-06, "epoch": 7.673518022043491, "percentage": 76.74, "elapsed_time": "3:34:26", "remaining_time": "1:05:00", "throughput": 2309.5, "total_tokens": 29714848} {"current_steps": 51525, "total_steps": 67140, "loss": 0.6355, "lr": 7.796746202926802e-06, "epoch": 7.674262734584451, "percentage": 76.74, "elapsed_time": "3:34:27", "remaining_time": "1:04:59", "throughput": 2309.51, "total_tokens": 29717664} {"current_steps": 51530, "total_steps": 67140, "loss": 0.6007, "lr": 7.792031306523018e-06, "epoch": 7.6750074471254095, "percentage": 76.75, "elapsed_time": "3:34:28", "remaining_time": "1:04:58", "throughput": 2309.54, "total_tokens": 29720672} {"current_steps": 51535, "total_steps": 67140, "loss": 0.5378, "lr": 7.787317572963798e-06, "epoch": 7.675752159666369, "percentage": 76.76, "elapsed_time": "3:34:29", "remaining_time": "1:04:57", "throughput": 2309.57, "total_tokens": 29723808} {"current_steps": 51540, "total_steps": 67140, "loss": 0.4689, "lr": 7.782605002567673e-06, "epoch": 7.676496872207328, "percentage": 76.76, "elapsed_time": "3:34:30", "remaining_time": "1:04:55", "throughput": 2309.58, "total_tokens": 29726400} {"current_steps": 51545, "total_steps": 67140, "loss": 0.639, "lr": 7.777893595653102e-06, "epoch": 7.6772415847482876, "percentage": 76.77, "elapsed_time": "3:34:32", "remaining_time": "1:04:54", "throughput": 2309.61, "total_tokens": 29729504} {"current_steps": 51550, "total_steps": 67140, "loss": 0.5971, "lr": 7.77318335253846e-06, "epoch": 7.677986297289246, "percentage": 76.78, "elapsed_time": "3:34:33", "remaining_time": "1:04:53", "throughput": 2309.64, "total_tokens": 29732672} {"current_steps": 51555, "total_steps": 67140, "loss": 0.5912, "lr": 7.768474273542056e-06, "epoch": 7.678731009830205, "percentage": 76.79, "elapsed_time": "3:34:34", "remaining_time": "1:04:51", "throughput": 2309.66, "total_tokens": 29735552} {"current_steps": 51560, "total_steps": 67140, "loss": 0.6669, "lr": 7.763766358982104e-06, "epoch": 7.679475722371165, "percentage": 76.79, "elapsed_time": "3:34:35", "remaining_time": "1:04:50", "throughput": 2309.69, "total_tokens": 29738624} {"current_steps": 51565, "total_steps": 67140, "loss": 0.5687, "lr": 7.759059609176735e-06, "epoch": 7.680220434912124, "percentage": 76.8, "elapsed_time": "3:34:36", "remaining_time": "1:04:49", "throughput": 2309.7, "total_tokens": 29741376} {"current_steps": 51570, "total_steps": 67140, "loss": 0.446, "lr": 7.754354024444021e-06, "epoch": 7.680965147453083, "percentage": 76.81, "elapsed_time": "3:34:37", "remaining_time": "1:04:48", "throughput": 2309.72, "total_tokens": 29744192} {"current_steps": 51575, "total_steps": 67140, "loss": 0.8271, "lr": 7.749649605101947e-06, "epoch": 7.681709859994042, "percentage": 76.82, "elapsed_time": "3:34:38", "remaining_time": "1:04:46", "throughput": 2309.73, "total_tokens": 29746944} {"current_steps": 51580, "total_steps": 67140, "loss": 0.5798, "lr": 7.744946351468419e-06, "epoch": 7.6824545725350015, "percentage": 76.82, "elapsed_time": "3:34:40", "remaining_time": "1:04:45", "throughput": 2309.75, "total_tokens": 29749696} {"current_steps": 51585, "total_steps": 67140, "loss": 0.5892, "lr": 7.740244263861268e-06, "epoch": 7.683199285075961, "percentage": 76.83, "elapsed_time": "3:34:41", "remaining_time": "1:04:44", "throughput": 2309.76, "total_tokens": 29752480} {"current_steps": 51590, "total_steps": 67140, "loss": 0.492, "lr": 7.73554334259823e-06, "epoch": 7.68394399761692, "percentage": 76.84, "elapsed_time": "3:34:42", "remaining_time": "1:04:42", "throughput": 2309.78, "total_tokens": 29755232} {"current_steps": 51595, "total_steps": 67140, "loss": 0.6474, "lr": 7.730843587996989e-06, "epoch": 7.684688710157879, "percentage": 76.85, "elapsed_time": "3:34:43", "remaining_time": "1:04:41", "throughput": 2309.81, "total_tokens": 29758304} {"current_steps": 51600, "total_steps": 67140, "loss": 0.5273, "lr": 7.72614500037512e-06, "epoch": 7.685433422698838, "percentage": 76.85, "elapsed_time": "3:34:44", "remaining_time": "1:04:40", "throughput": 2309.84, "total_tokens": 29761344} {"current_steps": 51605, "total_steps": 67140, "loss": 0.4714, "lr": 7.72144758005014e-06, "epoch": 7.686178135239797, "percentage": 76.86, "elapsed_time": "3:34:45", "remaining_time": "1:04:39", "throughput": 2309.85, "total_tokens": 29764192} {"current_steps": 51610, "total_steps": 67140, "loss": 0.5452, "lr": 7.716751327339484e-06, "epoch": 7.686922847780757, "percentage": 76.87, "elapsed_time": "3:34:46", "remaining_time": "1:04:37", "throughput": 2309.87, "total_tokens": 29767008} {"current_steps": 51615, "total_steps": 67140, "loss": 0.4717, "lr": 7.712056242560503e-06, "epoch": 7.6876675603217155, "percentage": 76.88, "elapsed_time": "3:34:48", "remaining_time": "1:04:36", "throughput": 2309.89, "total_tokens": 29769920} {"current_steps": 51620, "total_steps": 67140, "loss": 0.6232, "lr": 7.707362326030482e-06, "epoch": 7.688412272862675, "percentage": 76.88, "elapsed_time": "3:34:49", "remaining_time": "1:04:35", "throughput": 2309.91, "total_tokens": 29772960} {"current_steps": 51625, "total_steps": 67140, "loss": 0.7848, "lr": 7.702669578066602e-06, "epoch": 7.689156985403634, "percentage": 76.89, "elapsed_time": "3:34:50", "remaining_time": "1:04:33", "throughput": 2309.94, "total_tokens": 29775872} {"current_steps": 51630, "total_steps": 67140, "loss": 0.5431, "lr": 7.697977998985984e-06, "epoch": 7.6899016979445936, "percentage": 76.9, "elapsed_time": "3:34:51", "remaining_time": "1:04:32", "throughput": 2309.96, "total_tokens": 29778912} {"current_steps": 51635, "total_steps": 67140, "loss": 0.6221, "lr": 7.693287589105678e-06, "epoch": 7.690646410485552, "percentage": 76.91, "elapsed_time": "3:34:52", "remaining_time": "1:04:31", "throughput": 2309.98, "total_tokens": 29781792} {"current_steps": 51640, "total_steps": 67140, "loss": 0.621, "lr": 7.68859834874262e-06, "epoch": 7.691391123026512, "percentage": 76.91, "elapsed_time": "3:34:53", "remaining_time": "1:04:30", "throughput": 2310.0, "total_tokens": 29784672} {"current_steps": 51645, "total_steps": 67140, "loss": 0.578, "lr": 7.683910278213708e-06, "epoch": 7.692135835567471, "percentage": 76.92, "elapsed_time": "3:34:54", "remaining_time": "1:04:28", "throughput": 2310.03, "total_tokens": 29787552} {"current_steps": 51650, "total_steps": 67140, "loss": 0.55, "lr": 7.679223377835735e-06, "epoch": 7.69288054810843, "percentage": 76.93, "elapsed_time": "3:34:56", "remaining_time": "1:04:27", "throughput": 2310.05, "total_tokens": 29790496} {"current_steps": 51655, "total_steps": 67140, "loss": 0.6582, "lr": 7.674537647925434e-06, "epoch": 7.693625260649389, "percentage": 76.94, "elapsed_time": "3:34:57", "remaining_time": "1:04:26", "throughput": 2310.08, "total_tokens": 29793504} {"current_steps": 51660, "total_steps": 67140, "loss": 0.4, "lr": 7.669853088799432e-06, "epoch": 7.694369973190349, "percentage": 76.94, "elapsed_time": "3:34:58", "remaining_time": "1:04:25", "throughput": 2310.1, "total_tokens": 29796416} {"current_steps": 51665, "total_steps": 67140, "loss": 0.4741, "lr": 7.665169700774294e-06, "epoch": 7.6951146857313075, "percentage": 76.95, "elapsed_time": "3:34:59", "remaining_time": "1:04:23", "throughput": 2310.15, "total_tokens": 29799872} {"current_steps": 51670, "total_steps": 67140, "loss": 0.6418, "lr": 7.660487484166513e-06, "epoch": 7.695859398272267, "percentage": 76.96, "elapsed_time": "3:35:00", "remaining_time": "1:04:22", "throughput": 2310.17, "total_tokens": 29802720} {"current_steps": 51675, "total_steps": 67140, "loss": 0.7552, "lr": 7.655806439292498e-06, "epoch": 7.696604110813226, "percentage": 76.97, "elapsed_time": "3:35:01", "remaining_time": "1:04:21", "throughput": 2310.18, "total_tokens": 29805472} {"current_steps": 51680, "total_steps": 67140, "loss": 0.5343, "lr": 7.651126566468559e-06, "epoch": 7.697348823354186, "percentage": 76.97, "elapsed_time": "3:35:02", "remaining_time": "1:04:19", "throughput": 2310.21, "total_tokens": 29808448} {"current_steps": 51685, "total_steps": 67140, "loss": 0.7079, "lr": 7.64644786601095e-06, "epoch": 7.698093535895144, "percentage": 76.98, "elapsed_time": "3:35:04", "remaining_time": "1:04:18", "throughput": 2310.22, "total_tokens": 29811200} {"current_steps": 51690, "total_steps": 67140, "loss": 0.5946, "lr": 7.641770338235851e-06, "epoch": 7.698838248436104, "percentage": 76.99, "elapsed_time": "3:35:05", "remaining_time": "1:04:17", "throughput": 2310.25, "total_tokens": 29814304} {"current_steps": 51695, "total_steps": 67140, "loss": 0.4913, "lr": 7.637093983459329e-06, "epoch": 7.699582960977063, "percentage": 77.0, "elapsed_time": "3:35:06", "remaining_time": "1:04:16", "throughput": 2310.27, "total_tokens": 29817088} {"current_steps": 51700, "total_steps": 67140, "loss": 0.6085, "lr": 7.632418801997404e-06, "epoch": 7.700327673518022, "percentage": 77.0, "elapsed_time": "3:35:07", "remaining_time": "1:04:14", "throughput": 2310.28, "total_tokens": 29819872} {"current_steps": 51705, "total_steps": 67140, "loss": 0.5764, "lr": 7.627744794166003e-06, "epoch": 7.701072386058981, "percentage": 77.01, "elapsed_time": "3:35:08", "remaining_time": "1:04:13", "throughput": 2310.29, "total_tokens": 29822592} {"current_steps": 51710, "total_steps": 67140, "loss": 0.5792, "lr": 7.623071960280981e-06, "epoch": 7.701817098599941, "percentage": 77.02, "elapsed_time": "3:35:09", "remaining_time": "1:04:12", "throughput": 2310.31, "total_tokens": 29825440} {"current_steps": 51715, "total_steps": 67140, "loss": 0.4966, "lr": 7.618400300658113e-06, "epoch": 7.7025618111408996, "percentage": 77.03, "elapsed_time": "3:35:10", "remaining_time": "1:04:10", "throughput": 2310.33, "total_tokens": 29828320} {"current_steps": 51720, "total_steps": 67140, "loss": 0.5407, "lr": 7.613729815613077e-06, "epoch": 7.703306523681858, "percentage": 77.03, "elapsed_time": "3:35:11", "remaining_time": "1:04:09", "throughput": 2310.35, "total_tokens": 29831232} {"current_steps": 51725, "total_steps": 67140, "loss": 0.5407, "lr": 7.609060505461499e-06, "epoch": 7.704051236222818, "percentage": 77.04, "elapsed_time": "3:35:13", "remaining_time": "1:04:08", "throughput": 2310.38, "total_tokens": 29834336} {"current_steps": 51730, "total_steps": 67140, "loss": 0.5682, "lr": 7.6043923705189005e-06, "epoch": 7.704795948763778, "percentage": 77.05, "elapsed_time": "3:35:14", "remaining_time": "1:04:07", "throughput": 2310.42, "total_tokens": 29837440} {"current_steps": 51735, "total_steps": 67140, "loss": 0.8987, "lr": 7.599725411100739e-06, "epoch": 7.705540661304736, "percentage": 77.06, "elapsed_time": "3:35:15", "remaining_time": "1:04:05", "throughput": 2310.44, "total_tokens": 29840416} {"current_steps": 51740, "total_steps": 67140, "loss": 0.5673, "lr": 7.595059627522389e-06, "epoch": 7.706285373845695, "percentage": 77.06, "elapsed_time": "3:35:16", "remaining_time": "1:04:04", "throughput": 2310.47, "total_tokens": 29843552} {"current_steps": 51745, "total_steps": 67140, "loss": 0.5483, "lr": 7.590395020099145e-06, "epoch": 7.707030086386655, "percentage": 77.07, "elapsed_time": "3:35:17", "remaining_time": "1:04:03", "throughput": 2310.48, "total_tokens": 29846240} {"current_steps": 51750, "total_steps": 67140, "loss": 0.606, "lr": 7.585731589146234e-06, "epoch": 7.707774798927614, "percentage": 77.08, "elapsed_time": "3:35:18", "remaining_time": "1:04:01", "throughput": 2310.5, "total_tokens": 29848992} {"current_steps": 51755, "total_steps": 67140, "loss": 0.6909, "lr": 7.581069334978771e-06, "epoch": 7.708519511468573, "percentage": 77.09, "elapsed_time": "3:35:19", "remaining_time": "1:04:00", "throughput": 2310.52, "total_tokens": 29851872} {"current_steps": 51760, "total_steps": 67140, "loss": 0.6868, "lr": 7.57640825791183e-06, "epoch": 7.709264224009532, "percentage": 77.09, "elapsed_time": "3:35:21", "remaining_time": "1:03:59", "throughput": 2310.54, "total_tokens": 29854688} {"current_steps": 51765, "total_steps": 67140, "loss": 0.5645, "lr": 7.571748358260372e-06, "epoch": 7.710008936550492, "percentage": 77.1, "elapsed_time": "3:35:22", "remaining_time": "1:03:58", "throughput": 2310.54, "total_tokens": 29857280} {"current_steps": 51770, "total_steps": 67140, "loss": 0.6639, "lr": 7.567089636339303e-06, "epoch": 7.71075364909145, "percentage": 77.11, "elapsed_time": "3:35:23", "remaining_time": "1:03:56", "throughput": 2310.56, "total_tokens": 29860064} {"current_steps": 51775, "total_steps": 67140, "loss": 0.6737, "lr": 7.562432092463439e-06, "epoch": 7.71149836163241, "percentage": 77.11, "elapsed_time": "3:35:24", "remaining_time": "1:03:55", "throughput": 2310.58, "total_tokens": 29863136} {"current_steps": 51780, "total_steps": 67140, "loss": 0.7819, "lr": 7.557775726947519e-06, "epoch": 7.712243074173369, "percentage": 77.12, "elapsed_time": "3:35:25", "remaining_time": "1:03:54", "throughput": 2310.6, "total_tokens": 29865920} {"current_steps": 51785, "total_steps": 67140, "loss": 0.6662, "lr": 7.553120540106206e-06, "epoch": 7.712987786714328, "percentage": 77.13, "elapsed_time": "3:35:26", "remaining_time": "1:03:52", "throughput": 2310.62, "total_tokens": 29868928} {"current_steps": 51790, "total_steps": 67140, "loss": 0.4911, "lr": 7.5484665322540675e-06, "epoch": 7.713732499255287, "percentage": 77.14, "elapsed_time": "3:35:27", "remaining_time": "1:03:51", "throughput": 2310.64, "total_tokens": 29871712} {"current_steps": 51795, "total_steps": 67140, "loss": 0.6209, "lr": 7.543813703705616e-06, "epoch": 7.714477211796247, "percentage": 77.14, "elapsed_time": "3:35:29", "remaining_time": "1:03:50", "throughput": 2310.67, "total_tokens": 29874688} {"current_steps": 51800, "total_steps": 67140, "loss": 0.6489, "lr": 7.539162054775253e-06, "epoch": 7.7152219243372056, "percentage": 77.15, "elapsed_time": "3:35:30", "remaining_time": "1:03:49", "throughput": 2310.68, "total_tokens": 29877536} {"current_steps": 51805, "total_steps": 67140, "loss": 0.698, "lr": 7.534511585777326e-06, "epoch": 7.715966636878165, "percentage": 77.16, "elapsed_time": "3:35:31", "remaining_time": "1:03:47", "throughput": 2310.71, "total_tokens": 29880480} {"current_steps": 51810, "total_steps": 67140, "loss": 0.5319, "lr": 7.529862297026099e-06, "epoch": 7.716711349419124, "percentage": 77.17, "elapsed_time": "3:35:32", "remaining_time": "1:03:46", "throughput": 2310.73, "total_tokens": 29883424} {"current_steps": 51815, "total_steps": 67140, "loss": 0.6251, "lr": 7.525214188835749e-06, "epoch": 7.717456061960084, "percentage": 77.17, "elapsed_time": "3:35:33", "remaining_time": "1:03:45", "throughput": 2310.75, "total_tokens": 29886176} {"current_steps": 51820, "total_steps": 67140, "loss": 0.643, "lr": 7.520567261520387e-06, "epoch": 7.718200774501042, "percentage": 77.18, "elapsed_time": "3:35:34", "remaining_time": "1:03:43", "throughput": 2310.77, "total_tokens": 29889088} {"current_steps": 51825, "total_steps": 67140, "loss": 0.3722, "lr": 7.515921515394014e-06, "epoch": 7.718945487042002, "percentage": 77.19, "elapsed_time": "3:35:35", "remaining_time": "1:03:42", "throughput": 2310.78, "total_tokens": 29891744} {"current_steps": 51830, "total_steps": 67140, "loss": 0.7524, "lr": 7.51127695077058e-06, "epoch": 7.719690199582961, "percentage": 77.2, "elapsed_time": "3:35:36", "remaining_time": "1:03:41", "throughput": 2310.8, "total_tokens": 29894624} {"current_steps": 51835, "total_steps": 67140, "loss": 0.5181, "lr": 7.506633567963953e-06, "epoch": 7.72043491212392, "percentage": 77.2, "elapsed_time": "3:35:38", "remaining_time": "1:03:40", "throughput": 2310.82, "total_tokens": 29897568} {"current_steps": 51840, "total_steps": 67140, "loss": 0.6412, "lr": 7.501991367287897e-06, "epoch": 7.721179624664879, "percentage": 77.21, "elapsed_time": "3:35:39", "remaining_time": "1:03:38", "throughput": 2310.84, "total_tokens": 29900512} {"current_steps": 51845, "total_steps": 67140, "loss": 0.7303, "lr": 7.497350349056126e-06, "epoch": 7.721924337205839, "percentage": 77.22, "elapsed_time": "3:35:40", "remaining_time": "1:03:37", "throughput": 2310.85, "total_tokens": 29903136} {"current_steps": 51850, "total_steps": 67140, "loss": 0.6057, "lr": 7.492710513582257e-06, "epoch": 7.722669049746798, "percentage": 77.23, "elapsed_time": "3:35:41", "remaining_time": "1:03:36", "throughput": 2310.88, "total_tokens": 29906208} {"current_steps": 51855, "total_steps": 67140, "loss": 0.5439, "lr": 7.488071861179838e-06, "epoch": 7.723413762287757, "percentage": 77.23, "elapsed_time": "3:35:42", "remaining_time": "1:03:35", "throughput": 2310.88, "total_tokens": 29908768} {"current_steps": 51860, "total_steps": 67140, "loss": 0.7, "lr": 7.4834343921623165e-06, "epoch": 7.724158474828716, "percentage": 77.24, "elapsed_time": "3:35:43", "remaining_time": "1:03:33", "throughput": 2310.91, "total_tokens": 29911776} {"current_steps": 51865, "total_steps": 67140, "loss": 0.4587, "lr": 7.478798106843085e-06, "epoch": 7.724903187369676, "percentage": 77.25, "elapsed_time": "3:35:44", "remaining_time": "1:03:32", "throughput": 2310.93, "total_tokens": 29914752} {"current_steps": 51870, "total_steps": 67140, "loss": 0.5782, "lr": 7.474163005535439e-06, "epoch": 7.725647899910634, "percentage": 77.26, "elapsed_time": "3:35:45", "remaining_time": "1:03:31", "throughput": 2310.93, "total_tokens": 29917312} {"current_steps": 51875, "total_steps": 67140, "loss": 0.5554, "lr": 7.46952908855261e-06, "epoch": 7.726392612451594, "percentage": 77.26, "elapsed_time": "3:35:47", "remaining_time": "1:03:29", "throughput": 2310.96, "total_tokens": 29920224} {"current_steps": 51880, "total_steps": 67140, "loss": 0.5385, "lr": 7.464896356207723e-06, "epoch": 7.727137324992553, "percentage": 77.27, "elapsed_time": "3:35:48", "remaining_time": "1:03:28", "throughput": 2310.97, "total_tokens": 29923040} {"current_steps": 51885, "total_steps": 67140, "loss": 0.6693, "lr": 7.460264808813849e-06, "epoch": 7.727882037533512, "percentage": 77.28, "elapsed_time": "3:35:49", "remaining_time": "1:03:27", "throughput": 2311.01, "total_tokens": 29926176} {"current_steps": 51890, "total_steps": 67140, "loss": 0.6168, "lr": 7.455634446683976e-06, "epoch": 7.728626750074471, "percentage": 77.29, "elapsed_time": "3:35:50", "remaining_time": "1:03:26", "throughput": 2311.06, "total_tokens": 29929600} {"current_steps": 51895, "total_steps": 67140, "loss": 0.6247, "lr": 7.451005270130987e-06, "epoch": 7.729371462615431, "percentage": 77.29, "elapsed_time": "3:35:51", "remaining_time": "1:03:24", "throughput": 2311.07, "total_tokens": 29932384} {"current_steps": 51900, "total_steps": 67140, "loss": 0.4953, "lr": 7.4463772794677145e-06, "epoch": 7.73011617515639, "percentage": 77.3, "elapsed_time": "3:35:52", "remaining_time": "1:03:23", "throughput": 2311.11, "total_tokens": 29935584} {"current_steps": 51905, "total_steps": 67140, "loss": 0.6032, "lr": 7.441750475006898e-06, "epoch": 7.730860887697348, "percentage": 77.31, "elapsed_time": "3:35:54", "remaining_time": "1:03:22", "throughput": 2311.12, "total_tokens": 29938368} {"current_steps": 51910, "total_steps": 67140, "loss": 0.5003, "lr": 7.4371248570611975e-06, "epoch": 7.731605600238308, "percentage": 77.32, "elapsed_time": "3:35:55", "remaining_time": "1:03:20", "throughput": 2311.13, "total_tokens": 29941056} {"current_steps": 51915, "total_steps": 67140, "loss": 0.55, "lr": 7.4325004259432006e-06, "epoch": 7.732350312779268, "percentage": 77.32, "elapsed_time": "3:35:56", "remaining_time": "1:03:19", "throughput": 2311.15, "total_tokens": 29943808} {"current_steps": 51920, "total_steps": 67140, "loss": 0.5531, "lr": 7.427877181965393e-06, "epoch": 7.733095025320226, "percentage": 77.33, "elapsed_time": "3:35:57", "remaining_time": "1:03:18", "throughput": 2311.17, "total_tokens": 29946816} {"current_steps": 51925, "total_steps": 67140, "loss": 0.5582, "lr": 7.423255125440212e-06, "epoch": 7.733839737861185, "percentage": 77.34, "elapsed_time": "3:35:58", "remaining_time": "1:03:17", "throughput": 2311.2, "total_tokens": 29949760} {"current_steps": 51930, "total_steps": 67140, "loss": 0.548, "lr": 7.418634256679976e-06, "epoch": 7.734584450402145, "percentage": 77.35, "elapsed_time": "3:35:59", "remaining_time": "1:03:15", "throughput": 2311.21, "total_tokens": 29952576} {"current_steps": 51935, "total_steps": 67140, "loss": 0.437, "lr": 7.414014575996961e-06, "epoch": 7.735329162943104, "percentage": 77.35, "elapsed_time": "3:36:00", "remaining_time": "1:03:14", "throughput": 2311.23, "total_tokens": 29955360} {"current_steps": 51940, "total_steps": 67140, "loss": 0.5, "lr": 7.409396083703341e-06, "epoch": 7.736073875484063, "percentage": 77.36, "elapsed_time": "3:36:01", "remaining_time": "1:03:13", "throughput": 2311.23, "total_tokens": 29957920} {"current_steps": 51945, "total_steps": 67140, "loss": 0.5568, "lr": 7.404778780111213e-06, "epoch": 7.736818588025022, "percentage": 77.37, "elapsed_time": "3:36:03", "remaining_time": "1:03:11", "throughput": 2311.25, "total_tokens": 29960736} {"current_steps": 51950, "total_steps": 67140, "loss": 0.7148, "lr": 7.400162665532606e-06, "epoch": 7.737563300565982, "percentage": 77.38, "elapsed_time": "3:36:04", "remaining_time": "1:03:10", "throughput": 2311.27, "total_tokens": 29963616} {"current_steps": 51955, "total_steps": 67140, "loss": 0.4775, "lr": 7.3955477402794435e-06, "epoch": 7.73830801310694, "percentage": 77.38, "elapsed_time": "3:36:05", "remaining_time": "1:03:09", "throughput": 2311.28, "total_tokens": 29966400} {"current_steps": 51960, "total_steps": 67140, "loss": 0.7235, "lr": 7.390934004663597e-06, "epoch": 7.7390527256479, "percentage": 77.39, "elapsed_time": "3:36:06", "remaining_time": "1:03:08", "throughput": 2311.3, "total_tokens": 29969248} {"current_steps": 51965, "total_steps": 67140, "loss": 0.6905, "lr": 7.386321458996831e-06, "epoch": 7.739797438188859, "percentage": 77.4, "elapsed_time": "3:36:07", "remaining_time": "1:03:06", "throughput": 2311.32, "total_tokens": 29972096} {"current_steps": 51970, "total_steps": 67140, "loss": 0.7616, "lr": 7.381710103590847e-06, "epoch": 7.740542150729818, "percentage": 77.41, "elapsed_time": "3:36:08", "remaining_time": "1:03:05", "throughput": 2311.34, "total_tokens": 29975072} {"current_steps": 51975, "total_steps": 67140, "loss": 0.6183, "lr": 7.377099938757265e-06, "epoch": 7.741286863270777, "percentage": 77.41, "elapsed_time": "3:36:09", "remaining_time": "1:03:04", "throughput": 2311.37, "total_tokens": 29978080} {"current_steps": 51980, "total_steps": 67140, "loss": 0.5612, "lr": 7.372490964807619e-06, "epoch": 7.742031575811737, "percentage": 77.42, "elapsed_time": "3:36:10", "remaining_time": "1:03:02", "throughput": 2311.38, "total_tokens": 29980928} {"current_steps": 51985, "total_steps": 67140, "loss": 0.5761, "lr": 7.367883182053373e-06, "epoch": 7.742776288352696, "percentage": 77.43, "elapsed_time": "3:36:12", "remaining_time": "1:03:01", "throughput": 2311.41, "total_tokens": 29983904} {"current_steps": 51990, "total_steps": 67140, "loss": 0.5092, "lr": 7.363276590805887e-06, "epoch": 7.743521000893655, "percentage": 77.44, "elapsed_time": "3:36:13", "remaining_time": "1:03:00", "throughput": 2311.43, "total_tokens": 29986720} {"current_steps": 51995, "total_steps": 67140, "loss": 0.4971, "lr": 7.358671191376474e-06, "epoch": 7.744265713434614, "percentage": 77.44, "elapsed_time": "3:36:14", "remaining_time": "1:02:59", "throughput": 2311.45, "total_tokens": 29989600} {"current_steps": 52000, "total_steps": 67140, "loss": 0.5167, "lr": 7.3540669840763246e-06, "epoch": 7.745010425975574, "percentage": 77.45, "elapsed_time": "3:36:15", "remaining_time": "1:02:57", "throughput": 2311.47, "total_tokens": 29992608} {"current_steps": 52005, "total_steps": 67140, "loss": 0.5618, "lr": 7.349463969216589e-06, "epoch": 7.745755138516532, "percentage": 77.46, "elapsed_time": "3:36:16", "remaining_time": "1:02:56", "throughput": 2311.51, "total_tokens": 29995968} {"current_steps": 52010, "total_steps": 67140, "loss": 0.5736, "lr": 7.344862147108314e-06, "epoch": 7.746499851057492, "percentage": 77.46, "elapsed_time": "3:36:17", "remaining_time": "1:02:55", "throughput": 2311.53, "total_tokens": 29998816} {"current_steps": 52015, "total_steps": 67140, "loss": 0.7148, "lr": 7.340261518062475e-06, "epoch": 7.747244563598451, "percentage": 77.47, "elapsed_time": "3:36:19", "remaining_time": "1:02:54", "throughput": 2311.55, "total_tokens": 30001792} {"current_steps": 52020, "total_steps": 67140, "loss": 0.6124, "lr": 7.335662082389972e-06, "epoch": 7.7479892761394105, "percentage": 77.48, "elapsed_time": "3:36:20", "remaining_time": "1:02:52", "throughput": 2311.56, "total_tokens": 30004512} {"current_steps": 52025, "total_steps": 67140, "loss": 0.5866, "lr": 7.3310638404016005e-06, "epoch": 7.748733988680369, "percentage": 77.49, "elapsed_time": "3:36:21", "remaining_time": "1:02:51", "throughput": 2311.59, "total_tokens": 30007424} {"current_steps": 52030, "total_steps": 67140, "loss": 0.5717, "lr": 7.326466792408096e-06, "epoch": 7.749478701221329, "percentage": 77.49, "elapsed_time": "3:36:22", "remaining_time": "1:02:50", "throughput": 2311.61, "total_tokens": 30010368} {"current_steps": 52035, "total_steps": 67140, "loss": 0.624, "lr": 7.321870938720118e-06, "epoch": 7.750223413762288, "percentage": 77.5, "elapsed_time": "3:36:23", "remaining_time": "1:02:48", "throughput": 2311.65, "total_tokens": 30013568} {"current_steps": 52040, "total_steps": 67140, "loss": 0.655, "lr": 7.317276279648222e-06, "epoch": 7.750968126303247, "percentage": 77.51, "elapsed_time": "3:36:24", "remaining_time": "1:02:47", "throughput": 2311.68, "total_tokens": 30016768} {"current_steps": 52045, "total_steps": 67140, "loss": 0.7308, "lr": 7.3126828155029024e-06, "epoch": 7.751712838844206, "percentage": 77.52, "elapsed_time": "3:36:25", "remaining_time": "1:02:46", "throughput": 2311.69, "total_tokens": 30019488} {"current_steps": 52050, "total_steps": 67140, "loss": 0.6334, "lr": 7.308090546594565e-06, "epoch": 7.752457551385166, "percentage": 77.52, "elapsed_time": "3:36:27", "remaining_time": "1:02:45", "throughput": 2311.71, "total_tokens": 30022272} {"current_steps": 52055, "total_steps": 67140, "loss": 0.4785, "lr": 7.303499473233546e-06, "epoch": 7.753202263926124, "percentage": 77.53, "elapsed_time": "3:36:28", "remaining_time": "1:02:43", "throughput": 2311.73, "total_tokens": 30025216} {"current_steps": 52060, "total_steps": 67140, "loss": 0.6901, "lr": 7.2989095957300804e-06, "epoch": 7.753946976467084, "percentage": 77.54, "elapsed_time": "3:36:29", "remaining_time": "1:02:42", "throughput": 2311.79, "total_tokens": 30029024} {"current_steps": 52065, "total_steps": 67140, "loss": 0.5024, "lr": 7.294320914394331e-06, "epoch": 7.754691689008043, "percentage": 77.55, "elapsed_time": "3:36:30", "remaining_time": "1:02:41", "throughput": 2311.83, "total_tokens": 30032192} {"current_steps": 52070, "total_steps": 67140, "loss": 0.6852, "lr": 7.289733429536391e-06, "epoch": 7.755436401549002, "percentage": 77.55, "elapsed_time": "3:36:31", "remaining_time": "1:02:40", "throughput": 2311.85, "total_tokens": 30035040} {"current_steps": 52075, "total_steps": 67140, "loss": 0.6506, "lr": 7.285147141466269e-06, "epoch": 7.756181114089961, "percentage": 77.56, "elapsed_time": "3:36:32", "remaining_time": "1:02:38", "throughput": 2311.86, "total_tokens": 30037728} {"current_steps": 52080, "total_steps": 67140, "loss": 0.5998, "lr": 7.280562050493872e-06, "epoch": 7.756925826630921, "percentage": 77.57, "elapsed_time": "3:36:34", "remaining_time": "1:02:37", "throughput": 2311.88, "total_tokens": 30040672} {"current_steps": 52085, "total_steps": 67140, "loss": 0.5358, "lr": 7.2759781569290506e-06, "epoch": 7.75767053917188, "percentage": 77.58, "elapsed_time": "3:36:35", "remaining_time": "1:02:36", "throughput": 2311.91, "total_tokens": 30043712} {"current_steps": 52090, "total_steps": 67140, "loss": 0.5339, "lr": 7.27139546108157e-06, "epoch": 7.758415251712838, "percentage": 77.58, "elapsed_time": "3:36:36", "remaining_time": "1:02:34", "throughput": 2311.92, "total_tokens": 30046432} {"current_steps": 52095, "total_steps": 67140, "loss": 0.6001, "lr": 7.266813963261099e-06, "epoch": 7.759159964253798, "percentage": 77.59, "elapsed_time": "3:36:37", "remaining_time": "1:02:33", "throughput": 2311.95, "total_tokens": 30049504} {"current_steps": 52100, "total_steps": 67140, "loss": 0.6043, "lr": 7.262233663777243e-06, "epoch": 7.759904676794758, "percentage": 77.6, "elapsed_time": "3:36:38", "remaining_time": "1:02:32", "throughput": 2311.99, "total_tokens": 30052832} {"current_steps": 52105, "total_steps": 67140, "loss": 0.4762, "lr": 7.257654562939517e-06, "epoch": 7.7606493893357165, "percentage": 77.61, "elapsed_time": "3:36:39", "remaining_time": "1:02:31", "throughput": 2312.0, "total_tokens": 30055456} {"current_steps": 52110, "total_steps": 67140, "loss": 0.6622, "lr": 7.253076661057362e-06, "epoch": 7.761394101876675, "percentage": 77.61, "elapsed_time": "3:36:40", "remaining_time": "1:02:29", "throughput": 2312.01, "total_tokens": 30058208} {"current_steps": 52115, "total_steps": 67140, "loss": 0.645, "lr": 7.248499958440141e-06, "epoch": 7.762138814417635, "percentage": 77.62, "elapsed_time": "3:36:42", "remaining_time": "1:02:28", "throughput": 2312.02, "total_tokens": 30060928} {"current_steps": 52120, "total_steps": 67140, "loss": 0.5052, "lr": 7.243924455397111e-06, "epoch": 7.762883526958594, "percentage": 77.63, "elapsed_time": "3:36:43", "remaining_time": "1:02:27", "throughput": 2312.03, "total_tokens": 30063648} {"current_steps": 52125, "total_steps": 67140, "loss": 0.4644, "lr": 7.2393501522374844e-06, "epoch": 7.763628239499553, "percentage": 77.64, "elapsed_time": "3:36:44", "remaining_time": "1:02:25", "throughput": 2312.06, "total_tokens": 30066656} {"current_steps": 52130, "total_steps": 67140, "loss": 0.5387, "lr": 7.234777049270358e-06, "epoch": 7.764372952040512, "percentage": 77.64, "elapsed_time": "3:36:45", "remaining_time": "1:02:24", "throughput": 2312.08, "total_tokens": 30069504} {"current_steps": 52135, "total_steps": 67140, "loss": 0.5247, "lr": 7.230205146804769e-06, "epoch": 7.765117664581472, "percentage": 77.65, "elapsed_time": "3:36:46", "remaining_time": "1:02:23", "throughput": 2312.1, "total_tokens": 30072512} {"current_steps": 52140, "total_steps": 67140, "loss": 0.4818, "lr": 7.2256344451496676e-06, "epoch": 7.76586237712243, "percentage": 77.66, "elapsed_time": "3:36:47", "remaining_time": "1:02:22", "throughput": 2312.12, "total_tokens": 30075360} {"current_steps": 52145, "total_steps": 67140, "loss": 0.6659, "lr": 7.221064944613929e-06, "epoch": 7.76660708966339, "percentage": 77.67, "elapsed_time": "3:36:48", "remaining_time": "1:02:20", "throughput": 2312.14, "total_tokens": 30078304} {"current_steps": 52150, "total_steps": 67140, "loss": 0.6499, "lr": 7.2164966455063435e-06, "epoch": 7.767351802204349, "percentage": 77.67, "elapsed_time": "3:36:49", "remaining_time": "1:02:19", "throughput": 2312.16, "total_tokens": 30081184} {"current_steps": 52155, "total_steps": 67140, "loss": 0.6962, "lr": 7.2119295481356044e-06, "epoch": 7.7680965147453085, "percentage": 77.68, "elapsed_time": "3:36:51", "remaining_time": "1:02:18", "throughput": 2312.17, "total_tokens": 30084000} {"current_steps": 52160, "total_steps": 67140, "loss": 0.539, "lr": 7.2073636528103535e-06, "epoch": 7.768841227286267, "percentage": 77.69, "elapsed_time": "3:36:52", "remaining_time": "1:02:17", "throughput": 2312.2, "total_tokens": 30086944} {"current_steps": 52165, "total_steps": 67140, "loss": 0.6619, "lr": 7.202798959839119e-06, "epoch": 7.769585939827227, "percentage": 77.7, "elapsed_time": "3:36:53", "remaining_time": "1:02:15", "throughput": 2312.23, "total_tokens": 30090048} {"current_steps": 52170, "total_steps": 67140, "loss": 0.5998, "lr": 7.198235469530374e-06, "epoch": 7.770330652368186, "percentage": 77.7, "elapsed_time": "3:36:54", "remaining_time": "1:02:14", "throughput": 2312.26, "total_tokens": 30093088} {"current_steps": 52175, "total_steps": 67140, "loss": 0.4146, "lr": 7.193673182192498e-06, "epoch": 7.771075364909145, "percentage": 77.71, "elapsed_time": "3:36:55", "remaining_time": "1:02:13", "throughput": 2312.28, "total_tokens": 30096128} {"current_steps": 52180, "total_steps": 67140, "loss": 0.714, "lr": 7.189112098133793e-06, "epoch": 7.771820077450104, "percentage": 77.72, "elapsed_time": "3:36:56", "remaining_time": "1:02:11", "throughput": 2312.3, "total_tokens": 30099040} {"current_steps": 52185, "total_steps": 67140, "loss": 0.5852, "lr": 7.184552217662488e-06, "epoch": 7.772564789991064, "percentage": 77.73, "elapsed_time": "3:36:58", "remaining_time": "1:02:10", "throughput": 2312.32, "total_tokens": 30101888} {"current_steps": 52190, "total_steps": 67140, "loss": 0.6943, "lr": 7.179993541086702e-06, "epoch": 7.7733095025320225, "percentage": 77.73, "elapsed_time": "3:36:59", "remaining_time": "1:02:09", "throughput": 2312.33, "total_tokens": 30104640} {"current_steps": 52195, "total_steps": 67140, "loss": 0.6268, "lr": 7.175436068714503e-06, "epoch": 7.774054215072982, "percentage": 77.74, "elapsed_time": "3:37:00", "remaining_time": "1:02:08", "throughput": 2312.38, "total_tokens": 30108096} {"current_steps": 52200, "total_steps": 67140, "loss": 0.5172, "lr": 7.170879800853872e-06, "epoch": 7.774798927613941, "percentage": 77.75, "elapsed_time": "3:37:01", "remaining_time": "1:02:06", "throughput": 2312.4, "total_tokens": 30110912} {"current_steps": 52205, "total_steps": 67140, "loss": 0.5939, "lr": 7.166324737812688e-06, "epoch": 7.7755436401549005, "percentage": 77.76, "elapsed_time": "3:37:02", "remaining_time": "1:02:05", "throughput": 2312.41, "total_tokens": 30113536} {"current_steps": 52210, "total_steps": 67140, "loss": 0.4806, "lr": 7.161770879898771e-06, "epoch": 7.776288352695859, "percentage": 77.76, "elapsed_time": "3:37:03", "remaining_time": "1:02:04", "throughput": 2312.44, "total_tokens": 30116672} {"current_steps": 52215, "total_steps": 67140, "loss": 0.5271, "lr": 7.1572182274198564e-06, "epoch": 7.777033065236819, "percentage": 77.77, "elapsed_time": "3:37:04", "remaining_time": "1:02:03", "throughput": 2312.47, "total_tokens": 30119648} {"current_steps": 52220, "total_steps": 67140, "loss": 0.5531, "lr": 7.152666780683595e-06, "epoch": 7.777777777777778, "percentage": 77.78, "elapsed_time": "3:37:06", "remaining_time": "1:02:01", "throughput": 2312.49, "total_tokens": 30122560} {"current_steps": 52225, "total_steps": 67140, "loss": 0.7376, "lr": 7.148116539997546e-06, "epoch": 7.778522490318737, "percentage": 77.79, "elapsed_time": "3:37:07", "remaining_time": "1:02:00", "throughput": 2312.52, "total_tokens": 30125568} {"current_steps": 52230, "total_steps": 67140, "loss": 0.5737, "lr": 7.143567505669199e-06, "epoch": 7.779267202859696, "percentage": 77.79, "elapsed_time": "3:37:08", "remaining_time": "1:01:59", "throughput": 2312.56, "total_tokens": 30128864} {"current_steps": 52235, "total_steps": 67140, "loss": 0.5807, "lr": 7.139019678005959e-06, "epoch": 7.780011915400656, "percentage": 77.8, "elapsed_time": "3:37:09", "remaining_time": "1:01:57", "throughput": 2312.58, "total_tokens": 30131744} {"current_steps": 52240, "total_steps": 67140, "loss": 0.4932, "lr": 7.134473057315163e-06, "epoch": 7.7807566279416145, "percentage": 77.81, "elapsed_time": "3:37:10", "remaining_time": "1:01:56", "throughput": 2312.59, "total_tokens": 30134432} {"current_steps": 52245, "total_steps": 67140, "loss": 0.496, "lr": 7.129927643904033e-06, "epoch": 7.781501340482574, "percentage": 77.82, "elapsed_time": "3:37:11", "remaining_time": "1:01:55", "throughput": 2312.6, "total_tokens": 30137248} {"current_steps": 52250, "total_steps": 67140, "loss": 0.4035, "lr": 7.125383438079736e-06, "epoch": 7.782246053023533, "percentage": 77.82, "elapsed_time": "3:37:12", "remaining_time": "1:01:54", "throughput": 2312.62, "total_tokens": 30140096} {"current_steps": 52255, "total_steps": 67140, "loss": 0.5292, "lr": 7.120840440149365e-06, "epoch": 7.782990765564492, "percentage": 77.83, "elapsed_time": "3:37:13", "remaining_time": "1:01:52", "throughput": 2312.63, "total_tokens": 30142784} {"current_steps": 52260, "total_steps": 67140, "loss": 0.5477, "lr": 7.1162986504198945e-06, "epoch": 7.783735478105451, "percentage": 77.84, "elapsed_time": "3:37:15", "remaining_time": "1:01:51", "throughput": 2312.65, "total_tokens": 30145568} {"current_steps": 52265, "total_steps": 67140, "loss": 0.5892, "lr": 7.1117580691982545e-06, "epoch": 7.784480190646411, "percentage": 77.84, "elapsed_time": "3:37:16", "remaining_time": "1:01:50", "throughput": 2312.69, "total_tokens": 30148896} {"current_steps": 52270, "total_steps": 67140, "loss": 0.4489, "lr": 7.107218696791273e-06, "epoch": 7.78522490318737, "percentage": 77.85, "elapsed_time": "3:37:17", "remaining_time": "1:01:48", "throughput": 2312.7, "total_tokens": 30151552} {"current_steps": 52275, "total_steps": 67140, "loss": 0.4322, "lr": 7.102680533505707e-06, "epoch": 7.7859696157283285, "percentage": 77.86, "elapsed_time": "3:37:18", "remaining_time": "1:01:47", "throughput": 2312.74, "total_tokens": 30154688} {"current_steps": 52280, "total_steps": 67140, "loss": 0.7139, "lr": 7.0981435796482306e-06, "epoch": 7.786714328269288, "percentage": 77.87, "elapsed_time": "3:37:19", "remaining_time": "1:01:46", "throughput": 2312.76, "total_tokens": 30157728} {"current_steps": 52285, "total_steps": 67140, "loss": 0.558, "lr": 7.093607835525423e-06, "epoch": 7.787459040810247, "percentage": 77.87, "elapsed_time": "3:37:20", "remaining_time": "1:01:45", "throughput": 2312.79, "total_tokens": 30160672} {"current_steps": 52290, "total_steps": 67140, "loss": 0.5267, "lr": 7.089073301443802e-06, "epoch": 7.7882037533512065, "percentage": 77.88, "elapsed_time": "3:37:21", "remaining_time": "1:01:43", "throughput": 2312.81, "total_tokens": 30163584} {"current_steps": 52295, "total_steps": 67140, "loss": 0.5794, "lr": 7.084539977709778e-06, "epoch": 7.788948465892165, "percentage": 77.89, "elapsed_time": "3:37:23", "remaining_time": "1:01:42", "throughput": 2312.82, "total_tokens": 30166368} {"current_steps": 52300, "total_steps": 67140, "loss": 0.534, "lr": 7.080007864629706e-06, "epoch": 7.789693178433125, "percentage": 77.9, "elapsed_time": "3:37:24", "remaining_time": "1:01:41", "throughput": 2312.83, "total_tokens": 30169088} {"current_steps": 52305, "total_steps": 67140, "loss": 0.8111, "lr": 7.075476962509845e-06, "epoch": 7.790437890974084, "percentage": 77.9, "elapsed_time": "3:37:25", "remaining_time": "1:01:39", "throughput": 2312.84, "total_tokens": 30171712} {"current_steps": 52310, "total_steps": 67140, "loss": 0.3897, "lr": 7.070947271656372e-06, "epoch": 7.791182603515043, "percentage": 77.91, "elapsed_time": "3:37:26", "remaining_time": "1:01:38", "throughput": 2312.87, "total_tokens": 30174720} {"current_steps": 52315, "total_steps": 67140, "loss": 0.5079, "lr": 7.0664187923753984e-06, "epoch": 7.791927316056002, "percentage": 77.92, "elapsed_time": "3:37:27", "remaining_time": "1:01:37", "throughput": 2312.89, "total_tokens": 30177632} {"current_steps": 52320, "total_steps": 67140, "loss": 0.4864, "lr": 7.061891524972927e-06, "epoch": 7.792672028596962, "percentage": 77.93, "elapsed_time": "3:37:28", "remaining_time": "1:01:36", "throughput": 2312.93, "total_tokens": 30180928} {"current_steps": 52325, "total_steps": 67140, "loss": 0.5472, "lr": 7.057365469754892e-06, "epoch": 7.7934167411379205, "percentage": 77.93, "elapsed_time": "3:37:29", "remaining_time": "1:01:34", "throughput": 2312.93, "total_tokens": 30183552} {"current_steps": 52330, "total_steps": 67140, "loss": 0.4985, "lr": 7.052840627027146e-06, "epoch": 7.79416145367888, "percentage": 77.94, "elapsed_time": "3:37:31", "remaining_time": "1:01:33", "throughput": 2312.95, "total_tokens": 30186432} {"current_steps": 52335, "total_steps": 67140, "loss": 0.5582, "lr": 7.048316997095464e-06, "epoch": 7.794906166219839, "percentage": 77.95, "elapsed_time": "3:37:32", "remaining_time": "1:01:32", "throughput": 2312.98, "total_tokens": 30189472} {"current_steps": 52340, "total_steps": 67140, "loss": 0.6873, "lr": 7.0437945802655334e-06, "epoch": 7.7956508787607985, "percentage": 77.96, "elapsed_time": "3:37:33", "remaining_time": "1:01:31", "throughput": 2312.99, "total_tokens": 30192160} {"current_steps": 52345, "total_steps": 67140, "loss": 0.5071, "lr": 7.039273376842958e-06, "epoch": 7.796395591301757, "percentage": 77.96, "elapsed_time": "3:37:34", "remaining_time": "1:01:29", "throughput": 2313.01, "total_tokens": 30195136} {"current_steps": 52350, "total_steps": 67140, "loss": 0.5, "lr": 7.034753387133275e-06, "epoch": 7.797140303842717, "percentage": 77.97, "elapsed_time": "3:37:35", "remaining_time": "1:01:28", "throughput": 2313.04, "total_tokens": 30198208} {"current_steps": 52355, "total_steps": 67140, "loss": 0.7234, "lr": 7.03023461144191e-06, "epoch": 7.797885016383676, "percentage": 77.98, "elapsed_time": "3:37:36", "remaining_time": "1:01:27", "throughput": 2313.06, "total_tokens": 30201088} {"current_steps": 52360, "total_steps": 67140, "loss": 0.5724, "lr": 7.025717050074235e-06, "epoch": 7.798629728924635, "percentage": 77.99, "elapsed_time": "3:37:37", "remaining_time": "1:01:25", "throughput": 2313.09, "total_tokens": 30204192} {"current_steps": 52365, "total_steps": 67140, "loss": 0.5037, "lr": 7.021200703335518e-06, "epoch": 7.799374441465594, "percentage": 77.99, "elapsed_time": "3:37:39", "remaining_time": "1:01:24", "throughput": 2313.1, "total_tokens": 30206976} {"current_steps": 52370, "total_steps": 67140, "loss": 0.7045, "lr": 7.01668557153096e-06, "epoch": 7.800119154006554, "percentage": 78.0, "elapsed_time": "3:37:40", "remaining_time": "1:01:23", "throughput": 2313.12, "total_tokens": 30209696} {"current_steps": 52375, "total_steps": 67140, "loss": 0.6518, "lr": 7.012171654965677e-06, "epoch": 7.8008638665475125, "percentage": 78.01, "elapsed_time": "3:37:41", "remaining_time": "1:01:22", "throughput": 2313.12, "total_tokens": 30212256} {"current_steps": 52380, "total_steps": 67140, "loss": 0.6731, "lr": 7.007658953944699e-06, "epoch": 7.801608579088472, "percentage": 78.02, "elapsed_time": "3:37:42", "remaining_time": "1:01:20", "throughput": 2313.15, "total_tokens": 30215264} {"current_steps": 52385, "total_steps": 67140, "loss": 0.592, "lr": 7.003147468772986e-06, "epoch": 7.802353291629431, "percentage": 78.02, "elapsed_time": "3:37:43", "remaining_time": "1:01:19", "throughput": 2313.16, "total_tokens": 30218016} {"current_steps": 52390, "total_steps": 67140, "loss": 0.4595, "lr": 6.998637199755389e-06, "epoch": 7.803098004170391, "percentage": 78.03, "elapsed_time": "3:37:44", "remaining_time": "1:01:18", "throughput": 2313.18, "total_tokens": 30220832} {"current_steps": 52395, "total_steps": 67140, "loss": 0.6759, "lr": 6.994128147196702e-06, "epoch": 7.803842716711349, "percentage": 78.04, "elapsed_time": "3:37:45", "remaining_time": "1:01:16", "throughput": 2313.19, "total_tokens": 30223616} {"current_steps": 52400, "total_steps": 67140, "loss": 0.4332, "lr": 6.989620311401637e-06, "epoch": 7.804587429252309, "percentage": 78.05, "elapsed_time": "3:37:46", "remaining_time": "1:01:15", "throughput": 2313.21, "total_tokens": 30226464} {"current_steps": 52405, "total_steps": 67140, "loss": 0.8107, "lr": 6.985113692674797e-06, "epoch": 7.805332141793268, "percentage": 78.05, "elapsed_time": "3:37:47", "remaining_time": "1:01:14", "throughput": 2313.23, "total_tokens": 30229248} {"current_steps": 52410, "total_steps": 67140, "loss": 0.4844, "lr": 6.980608291320731e-06, "epoch": 7.806076854334227, "percentage": 78.06, "elapsed_time": "3:37:49", "remaining_time": "1:01:13", "throughput": 2313.25, "total_tokens": 30232192} {"current_steps": 52415, "total_steps": 67140, "loss": 0.584, "lr": 6.976104107643896e-06, "epoch": 7.806821566875186, "percentage": 78.07, "elapsed_time": "3:37:50", "remaining_time": "1:01:11", "throughput": 2313.27, "total_tokens": 30235008} {"current_steps": 52420, "total_steps": 67140, "loss": 0.6567, "lr": 6.9716011419486745e-06, "epoch": 7.807566279416145, "percentage": 78.08, "elapsed_time": "3:37:51", "remaining_time": "1:01:10", "throughput": 2313.28, "total_tokens": 30237792} {"current_steps": 52425, "total_steps": 67140, "loss": 0.5983, "lr": 6.96709939453934e-06, "epoch": 7.8083109919571045, "percentage": 78.08, "elapsed_time": "3:37:52", "remaining_time": "1:01:09", "throughput": 2313.31, "total_tokens": 30240928} {"current_steps": 52430, "total_steps": 67140, "loss": 0.6051, "lr": 6.962598865720113e-06, "epoch": 7.809055704498064, "percentage": 78.09, "elapsed_time": "3:37:53", "remaining_time": "1:01:08", "throughput": 2313.33, "total_tokens": 30243776} {"current_steps": 52435, "total_steps": 67140, "loss": 0.4438, "lr": 6.95809955579512e-06, "epoch": 7.809800417039023, "percentage": 78.1, "elapsed_time": "3:37:54", "remaining_time": "1:01:06", "throughput": 2313.34, "total_tokens": 30246528} {"current_steps": 52440, "total_steps": 67140, "loss": 0.59, "lr": 6.95360146506841e-06, "epoch": 7.810545129579982, "percentage": 78.11, "elapsed_time": "3:37:55", "remaining_time": "1:01:05", "throughput": 2313.37, "total_tokens": 30249536} {"current_steps": 52445, "total_steps": 67140, "loss": 0.5834, "lr": 6.949104593843939e-06, "epoch": 7.811289842120941, "percentage": 78.11, "elapsed_time": "3:37:57", "remaining_time": "1:01:04", "throughput": 2313.4, "total_tokens": 30252576} {"current_steps": 52450, "total_steps": 67140, "loss": 0.5056, "lr": 6.9446089424255875e-06, "epoch": 7.812034554661901, "percentage": 78.12, "elapsed_time": "3:37:58", "remaining_time": "1:01:02", "throughput": 2313.42, "total_tokens": 30255488} {"current_steps": 52455, "total_steps": 67140, "loss": 0.542, "lr": 6.940114511117163e-06, "epoch": 7.81277926720286, "percentage": 78.13, "elapsed_time": "3:37:59", "remaining_time": "1:01:01", "throughput": 2313.45, "total_tokens": 30258784} {"current_steps": 52460, "total_steps": 67140, "loss": 0.6465, "lr": 6.935621300222367e-06, "epoch": 7.8135239797438185, "percentage": 78.14, "elapsed_time": "3:38:00", "remaining_time": "1:01:00", "throughput": 2313.46, "total_tokens": 30261376} {"current_steps": 52465, "total_steps": 67140, "loss": 0.3889, "lr": 6.93112931004484e-06, "epoch": 7.814268692284778, "percentage": 78.14, "elapsed_time": "3:38:01", "remaining_time": "1:00:59", "throughput": 2313.48, "total_tokens": 30264224} {"current_steps": 52470, "total_steps": 67140, "loss": 0.6729, "lr": 6.9266385408881305e-06, "epoch": 7.815013404825737, "percentage": 78.15, "elapsed_time": "3:38:02", "remaining_time": "1:00:57", "throughput": 2313.5, "total_tokens": 30267136} {"current_steps": 52475, "total_steps": 67140, "loss": 0.5213, "lr": 6.922148993055708e-06, "epoch": 7.815758117366697, "percentage": 78.16, "elapsed_time": "3:38:03", "remaining_time": "1:00:56", "throughput": 2313.51, "total_tokens": 30269920} {"current_steps": 52480, "total_steps": 67140, "loss": 0.5908, "lr": 6.917660666850964e-06, "epoch": 7.816502829907655, "percentage": 78.17, "elapsed_time": "3:38:05", "remaining_time": "1:00:55", "throughput": 2313.53, "total_tokens": 30272800} {"current_steps": 52485, "total_steps": 67140, "loss": 0.5777, "lr": 6.913173562577193e-06, "epoch": 7.817247542448615, "percentage": 78.17, "elapsed_time": "3:38:06", "remaining_time": "1:00:53", "throughput": 2313.55, "total_tokens": 30275680} {"current_steps": 52490, "total_steps": 67140, "loss": 0.6478, "lr": 6.908687680537615e-06, "epoch": 7.817992254989574, "percentage": 78.18, "elapsed_time": "3:38:07", "remaining_time": "1:00:52", "throughput": 2313.57, "total_tokens": 30278656} {"current_steps": 52495, "total_steps": 67140, "loss": 0.5855, "lr": 6.904203021035366e-06, "epoch": 7.818736967530533, "percentage": 78.19, "elapsed_time": "3:38:08", "remaining_time": "1:00:51", "throughput": 2313.6, "total_tokens": 30281632} {"current_steps": 52500, "total_steps": 67140, "loss": 0.5107, "lr": 6.899719584373504e-06, "epoch": 7.819481680071492, "percentage": 78.19, "elapsed_time": "3:38:09", "remaining_time": "1:00:50", "throughput": 2313.61, "total_tokens": 30284416} {"current_steps": 52505, "total_steps": 67140, "loss": 0.8007, "lr": 6.895237370855004e-06, "epoch": 7.820226392612452, "percentage": 78.2, "elapsed_time": "3:38:10", "remaining_time": "1:00:48", "throughput": 2313.64, "total_tokens": 30287392} {"current_steps": 52510, "total_steps": 67140, "loss": 0.5086, "lr": 6.890756380782751e-06, "epoch": 7.8209711051534105, "percentage": 78.21, "elapsed_time": "3:38:11", "remaining_time": "1:00:47", "throughput": 2313.66, "total_tokens": 30290368} {"current_steps": 52515, "total_steps": 67140, "loss": 0.6679, "lr": 6.886276614459567e-06, "epoch": 7.82171581769437, "percentage": 78.22, "elapsed_time": "3:38:13", "remaining_time": "1:00:46", "throughput": 2313.68, "total_tokens": 30293216} {"current_steps": 52520, "total_steps": 67140, "loss": 0.5382, "lr": 6.881798072188159e-06, "epoch": 7.822460530235329, "percentage": 78.22, "elapsed_time": "3:38:14", "remaining_time": "1:00:45", "throughput": 2313.7, "total_tokens": 30296224} {"current_steps": 52525, "total_steps": 67140, "loss": 0.6784, "lr": 6.8773207542711716e-06, "epoch": 7.823205242776289, "percentage": 78.23, "elapsed_time": "3:38:15", "remaining_time": "1:00:43", "throughput": 2313.73, "total_tokens": 30299232} {"current_steps": 52530, "total_steps": 67140, "loss": 0.3737, "lr": 6.872844661011163e-06, "epoch": 7.823949955317247, "percentage": 78.24, "elapsed_time": "3:38:16", "remaining_time": "1:00:42", "throughput": 2313.75, "total_tokens": 30302112} {"current_steps": 52535, "total_steps": 67140, "loss": 0.427, "lr": 6.868369792710613e-06, "epoch": 7.824694667858207, "percentage": 78.25, "elapsed_time": "3:38:17", "remaining_time": "1:00:41", "throughput": 2313.77, "total_tokens": 30305120} {"current_steps": 52540, "total_steps": 67140, "loss": 0.5456, "lr": 6.863896149671914e-06, "epoch": 7.825439380399166, "percentage": 78.25, "elapsed_time": "3:38:18", "remaining_time": "1:00:39", "throughput": 2313.79, "total_tokens": 30307968} {"current_steps": 52545, "total_steps": 67140, "loss": 0.5262, "lr": 6.859423732197379e-06, "epoch": 7.826184092940125, "percentage": 78.26, "elapsed_time": "3:38:19", "remaining_time": "1:00:38", "throughput": 2313.8, "total_tokens": 30310752} {"current_steps": 52550, "total_steps": 67140, "loss": 0.625, "lr": 6.854952540589241e-06, "epoch": 7.826928805481084, "percentage": 78.27, "elapsed_time": "3:38:21", "remaining_time": "1:00:37", "throughput": 2313.82, "total_tokens": 30313568} {"current_steps": 52555, "total_steps": 67140, "loss": 0.3806, "lr": 6.850482575149631e-06, "epoch": 7.827673518022044, "percentage": 78.28, "elapsed_time": "3:38:22", "remaining_time": "1:00:36", "throughput": 2313.85, "total_tokens": 30316576} {"current_steps": 52560, "total_steps": 67140, "loss": 0.8062, "lr": 6.846013836180623e-06, "epoch": 7.828418230563003, "percentage": 78.28, "elapsed_time": "3:38:23", "remaining_time": "1:00:34", "throughput": 2313.87, "total_tokens": 30319520} {"current_steps": 52565, "total_steps": 67140, "loss": 0.541, "lr": 6.8415463239841854e-06, "epoch": 7.829162943103962, "percentage": 78.29, "elapsed_time": "3:38:24", "remaining_time": "1:00:33", "throughput": 2313.88, "total_tokens": 30322336} {"current_steps": 52570, "total_steps": 67140, "loss": 0.5374, "lr": 6.83708003886222e-06, "epoch": 7.829907655644921, "percentage": 78.3, "elapsed_time": "3:38:25", "remaining_time": "1:00:32", "throughput": 2313.9, "total_tokens": 30325184} {"current_steps": 52575, "total_steps": 67140, "loss": 0.5216, "lr": 6.832614981116542e-06, "epoch": 7.830652368185881, "percentage": 78.31, "elapsed_time": "3:38:26", "remaining_time": "1:00:30", "throughput": 2313.91, "total_tokens": 30327744} {"current_steps": 52580, "total_steps": 67140, "loss": 0.8717, "lr": 6.8281511510488785e-06, "epoch": 7.831397080726839, "percentage": 78.31, "elapsed_time": "3:38:27", "remaining_time": "1:00:29", "throughput": 2313.94, "total_tokens": 30330880} {"current_steps": 52585, "total_steps": 67140, "loss": 0.592, "lr": 6.8236885489608885e-06, "epoch": 7.832141793267798, "percentage": 78.32, "elapsed_time": "3:38:29", "remaining_time": "1:00:28", "throughput": 2313.95, "total_tokens": 30333664} {"current_steps": 52590, "total_steps": 67140, "loss": 0.5468, "lr": 6.819227175154117e-06, "epoch": 7.832886505808758, "percentage": 78.33, "elapsed_time": "3:38:30", "remaining_time": "1:00:27", "throughput": 2313.98, "total_tokens": 30336640} {"current_steps": 52595, "total_steps": 67140, "loss": 0.6835, "lr": 6.814767029930055e-06, "epoch": 7.833631218349717, "percentage": 78.34, "elapsed_time": "3:38:31", "remaining_time": "1:00:25", "throughput": 2313.99, "total_tokens": 30339456} {"current_steps": 52600, "total_steps": 67140, "loss": 0.6007, "lr": 6.810308113590111e-06, "epoch": 7.834375930890676, "percentage": 78.34, "elapsed_time": "3:38:32", "remaining_time": "1:00:24", "throughput": 2314.01, "total_tokens": 30342432} {"current_steps": 52605, "total_steps": 67140, "loss": 0.5307, "lr": 6.805850426435581e-06, "epoch": 7.835120643431635, "percentage": 78.35, "elapsed_time": "3:38:33", "remaining_time": "1:00:23", "throughput": 2314.08, "total_tokens": 30346432} {"current_steps": 52610, "total_steps": 67140, "loss": 0.5699, "lr": 6.801393968767708e-06, "epoch": 7.835865355972595, "percentage": 78.36, "elapsed_time": "3:38:34", "remaining_time": "1:00:22", "throughput": 2314.1, "total_tokens": 30349344} {"current_steps": 52615, "total_steps": 67140, "loss": 0.5533, "lr": 6.796938740887643e-06, "epoch": 7.836610068513554, "percentage": 78.37, "elapsed_time": "3:38:36", "remaining_time": "1:00:20", "throughput": 2314.11, "total_tokens": 30352032} {"current_steps": 52620, "total_steps": 67140, "loss": 0.5936, "lr": 6.792484743096456e-06, "epoch": 7.837354781054513, "percentage": 78.37, "elapsed_time": "3:38:37", "remaining_time": "1:00:19", "throughput": 2314.12, "total_tokens": 30354784} {"current_steps": 52625, "total_steps": 67140, "loss": 0.7416, "lr": 6.788031975695114e-06, "epoch": 7.838099493595472, "percentage": 78.38, "elapsed_time": "3:38:38", "remaining_time": "1:00:18", "throughput": 2314.17, "total_tokens": 30358208} {"current_steps": 52630, "total_steps": 67140, "loss": 0.4433, "lr": 6.783580438984527e-06, "epoch": 7.838844206136431, "percentage": 78.39, "elapsed_time": "3:38:39", "remaining_time": "1:00:17", "throughput": 2314.18, "total_tokens": 30360928} {"current_steps": 52635, "total_steps": 67140, "loss": 0.5629, "lr": 6.779130133265513e-06, "epoch": 7.83958891867739, "percentage": 78.4, "elapsed_time": "3:38:40", "remaining_time": "1:00:15", "throughput": 2314.18, "total_tokens": 30363392} {"current_steps": 52640, "total_steps": 67140, "loss": 0.6826, "lr": 6.774681058838811e-06, "epoch": 7.84033363121835, "percentage": 78.4, "elapsed_time": "3:38:41", "remaining_time": "1:00:14", "throughput": 2314.19, "total_tokens": 30366144} {"current_steps": 52645, "total_steps": 67140, "loss": 0.581, "lr": 6.770233216005056e-06, "epoch": 7.841078343759309, "percentage": 78.41, "elapsed_time": "3:38:42", "remaining_time": "1:00:13", "throughput": 2314.22, "total_tokens": 30369280} {"current_steps": 52650, "total_steps": 67140, "loss": 0.5087, "lr": 6.76578660506483e-06, "epoch": 7.841823056300268, "percentage": 78.42, "elapsed_time": "3:38:44", "remaining_time": "1:00:11", "throughput": 2314.24, "total_tokens": 30372160} {"current_steps": 52655, "total_steps": 67140, "loss": 0.4499, "lr": 6.7613412263186074e-06, "epoch": 7.842567768841227, "percentage": 78.43, "elapsed_time": "3:38:45", "remaining_time": "1:00:10", "throughput": 2314.27, "total_tokens": 30375328} {"current_steps": 52660, "total_steps": 67140, "loss": 0.6022, "lr": 6.756897080066788e-06, "epoch": 7.843312481382187, "percentage": 78.43, "elapsed_time": "3:38:46", "remaining_time": "1:00:09", "throughput": 2314.28, "total_tokens": 30377920} {"current_steps": 52665, "total_steps": 67140, "loss": 0.6197, "lr": 6.752454166609693e-06, "epoch": 7.844057193923145, "percentage": 78.44, "elapsed_time": "3:38:47", "remaining_time": "1:00:08", "throughput": 2314.3, "total_tokens": 30380768} {"current_steps": 52670, "total_steps": 67140, "loss": 0.6059, "lr": 6.748012486247557e-06, "epoch": 7.844801906464105, "percentage": 78.45, "elapsed_time": "3:38:48", "remaining_time": "1:00:06", "throughput": 2314.31, "total_tokens": 30383424} {"current_steps": 52675, "total_steps": 67140, "loss": 0.5481, "lr": 6.74357203928053e-06, "epoch": 7.845546619005064, "percentage": 78.46, "elapsed_time": "3:38:49", "remaining_time": "1:00:05", "throughput": 2314.33, "total_tokens": 30386368} {"current_steps": 52680, "total_steps": 67140, "loss": 0.463, "lr": 6.7391328260086845e-06, "epoch": 7.846291331546023, "percentage": 78.46, "elapsed_time": "3:38:50", "remaining_time": "1:00:04", "throughput": 2314.38, "total_tokens": 30389920} {"current_steps": 52685, "total_steps": 67140, "loss": 0.5325, "lr": 6.7346948467320036e-06, "epoch": 7.847036044086982, "percentage": 78.47, "elapsed_time": "3:38:52", "remaining_time": "1:00:02", "throughput": 2314.39, "total_tokens": 30392640} {"current_steps": 52690, "total_steps": 67140, "loss": 0.4904, "lr": 6.730258101750372e-06, "epoch": 7.847780756627942, "percentage": 78.48, "elapsed_time": "3:38:53", "remaining_time": "1:00:01", "throughput": 2314.4, "total_tokens": 30395264} {"current_steps": 52695, "total_steps": 67140, "loss": 0.6622, "lr": 6.725822591363621e-06, "epoch": 7.848525469168901, "percentage": 78.49, "elapsed_time": "3:38:54", "remaining_time": "1:00:00", "throughput": 2314.42, "total_tokens": 30398272} {"current_steps": 52700, "total_steps": 67140, "loss": 0.7332, "lr": 6.721388315871482e-06, "epoch": 7.84927018170986, "percentage": 78.49, "elapsed_time": "3:38:55", "remaining_time": "0:59:59", "throughput": 2314.44, "total_tokens": 30401184} {"current_steps": 52705, "total_steps": 67140, "loss": 0.4802, "lr": 6.7169552755736055e-06, "epoch": 7.850014894250819, "percentage": 78.5, "elapsed_time": "3:38:56", "remaining_time": "0:59:57", "throughput": 2314.45, "total_tokens": 30403744} {"current_steps": 52710, "total_steps": 67140, "loss": 0.6799, "lr": 6.712523470769555e-06, "epoch": 7.850759606791779, "percentage": 78.51, "elapsed_time": "3:38:57", "remaining_time": "0:59:56", "throughput": 2314.48, "total_tokens": 30407008} {"current_steps": 52715, "total_steps": 67140, "loss": 0.7665, "lr": 6.708092901758828e-06, "epoch": 7.851504319332737, "percentage": 78.52, "elapsed_time": "3:38:58", "remaining_time": "0:59:55", "throughput": 2314.5, "total_tokens": 30409920} {"current_steps": 52720, "total_steps": 67140, "loss": 0.6179, "lr": 6.703663568840804e-06, "epoch": 7.852249031873697, "percentage": 78.52, "elapsed_time": "3:38:59", "remaining_time": "0:59:54", "throughput": 2314.51, "total_tokens": 30412544} {"current_steps": 52725, "total_steps": 67140, "loss": 0.4689, "lr": 6.699235472314816e-06, "epoch": 7.852993744414656, "percentage": 78.53, "elapsed_time": "3:39:01", "remaining_time": "0:59:52", "throughput": 2314.55, "total_tokens": 30415872} {"current_steps": 52730, "total_steps": 67140, "loss": 0.4268, "lr": 6.694808612480083e-06, "epoch": 7.8537384569556155, "percentage": 78.54, "elapsed_time": "3:39:02", "remaining_time": "0:59:51", "throughput": 2314.6, "total_tokens": 30419328} {"current_steps": 52735, "total_steps": 67140, "loss": 0.4905, "lr": 6.6903829896357604e-06, "epoch": 7.854483169496574, "percentage": 78.54, "elapsed_time": "3:39:03", "remaining_time": "0:59:50", "throughput": 2314.61, "total_tokens": 30422080} {"current_steps": 52740, "total_steps": 67140, "loss": 0.611, "lr": 6.6859586040809105e-06, "epoch": 7.855227882037534, "percentage": 78.55, "elapsed_time": "3:39:04", "remaining_time": "0:59:48", "throughput": 2314.63, "total_tokens": 30424864} {"current_steps": 52745, "total_steps": 67140, "loss": 0.7647, "lr": 6.681535456114521e-06, "epoch": 7.855972594578493, "percentage": 78.56, "elapsed_time": "3:39:05", "remaining_time": "0:59:47", "throughput": 2314.64, "total_tokens": 30427680} {"current_steps": 52750, "total_steps": 67140, "loss": 0.82, "lr": 6.677113546035496e-06, "epoch": 7.856717307119452, "percentage": 78.57, "elapsed_time": "3:39:06", "remaining_time": "0:59:46", "throughput": 2314.66, "total_tokens": 30430592} {"current_steps": 52755, "total_steps": 67140, "loss": 0.4671, "lr": 6.672692874142636e-06, "epoch": 7.857462019660411, "percentage": 78.57, "elapsed_time": "3:39:08", "remaining_time": "0:59:45", "throughput": 2314.67, "total_tokens": 30433344} {"current_steps": 52760, "total_steps": 67140, "loss": 0.6428, "lr": 6.668273440734676e-06, "epoch": 7.858206732201371, "percentage": 78.58, "elapsed_time": "3:39:09", "remaining_time": "0:59:43", "throughput": 2314.69, "total_tokens": 30436128} {"current_steps": 52765, "total_steps": 67140, "loss": 0.5889, "lr": 6.663855246110273e-06, "epoch": 7.858951444742329, "percentage": 78.59, "elapsed_time": "3:39:10", "remaining_time": "0:59:42", "throughput": 2314.71, "total_tokens": 30439200} {"current_steps": 52770, "total_steps": 67140, "loss": 0.6203, "lr": 6.659438290567976e-06, "epoch": 7.859696157283288, "percentage": 78.6, "elapsed_time": "3:39:11", "remaining_time": "0:59:41", "throughput": 2314.74, "total_tokens": 30442112} {"current_steps": 52775, "total_steps": 67140, "loss": 0.5924, "lr": 6.655022574406272e-06, "epoch": 7.860440869824248, "percentage": 78.6, "elapsed_time": "3:39:12", "remaining_time": "0:59:40", "throughput": 2314.74, "total_tokens": 30444640} {"current_steps": 52780, "total_steps": 67140, "loss": 0.5346, "lr": 6.650608097923558e-06, "epoch": 7.8611855823652075, "percentage": 78.61, "elapsed_time": "3:39:13", "remaining_time": "0:59:38", "throughput": 2314.76, "total_tokens": 30447680} {"current_steps": 52785, "total_steps": 67140, "loss": 0.5467, "lr": 6.64619486141815e-06, "epoch": 7.861930294906166, "percentage": 78.62, "elapsed_time": "3:39:14", "remaining_time": "0:59:37", "throughput": 2314.78, "total_tokens": 30450432} {"current_steps": 52790, "total_steps": 67140, "loss": 0.6789, "lr": 6.641782865188267e-06, "epoch": 7.862675007447125, "percentage": 78.63, "elapsed_time": "3:39:15", "remaining_time": "0:59:36", "throughput": 2314.79, "total_tokens": 30453248} {"current_steps": 52795, "total_steps": 67140, "loss": 0.6008, "lr": 6.637372109532061e-06, "epoch": 7.863419719988085, "percentage": 78.63, "elapsed_time": "3:39:17", "remaining_time": "0:59:34", "throughput": 2314.81, "total_tokens": 30456064} {"current_steps": 52800, "total_steps": 67140, "loss": 0.5728, "lr": 6.632962594747588e-06, "epoch": 7.864164432529043, "percentage": 78.64, "elapsed_time": "3:39:18", "remaining_time": "0:59:33", "throughput": 2314.84, "total_tokens": 30459136} {"current_steps": 52805, "total_steps": 67140, "loss": 0.6353, "lr": 6.628554321132835e-06, "epoch": 7.864909145070003, "percentage": 78.65, "elapsed_time": "3:39:19", "remaining_time": "0:59:32", "throughput": 2314.85, "total_tokens": 30461888} {"current_steps": 52810, "total_steps": 67140, "loss": 0.8625, "lr": 6.624147288985682e-06, "epoch": 7.865653857610962, "percentage": 78.66, "elapsed_time": "3:39:20", "remaining_time": "0:59:31", "throughput": 2314.87, "total_tokens": 30464704} {"current_steps": 52815, "total_steps": 67140, "loss": 0.5099, "lr": 6.619741498603951e-06, "epoch": 7.8663985701519215, "percentage": 78.66, "elapsed_time": "3:39:21", "remaining_time": "0:59:29", "throughput": 2314.88, "total_tokens": 30467392} {"current_steps": 52820, "total_steps": 67140, "loss": 0.5639, "lr": 6.615336950285356e-06, "epoch": 7.86714328269288, "percentage": 78.67, "elapsed_time": "3:39:22", "remaining_time": "0:59:28", "throughput": 2314.9, "total_tokens": 30470400} {"current_steps": 52825, "total_steps": 67140, "loss": 0.5865, "lr": 6.610933644327541e-06, "epoch": 7.86788799523384, "percentage": 78.68, "elapsed_time": "3:39:23", "remaining_time": "0:59:27", "throughput": 2314.92, "total_tokens": 30473248} {"current_steps": 52830, "total_steps": 67140, "loss": 0.6274, "lr": 6.606531581028067e-06, "epoch": 7.868632707774799, "percentage": 78.69, "elapsed_time": "3:39:25", "remaining_time": "0:59:25", "throughput": 2314.94, "total_tokens": 30476160} {"current_steps": 52835, "total_steps": 67140, "loss": 0.4477, "lr": 6.602130760684405e-06, "epoch": 7.869377420315758, "percentage": 78.69, "elapsed_time": "3:39:26", "remaining_time": "0:59:24", "throughput": 2314.99, "total_tokens": 30479648} {"current_steps": 52840, "total_steps": 67140, "loss": 0.5872, "lr": 6.597731183593947e-06, "epoch": 7.870122132856717, "percentage": 78.7, "elapsed_time": "3:39:27", "remaining_time": "0:59:23", "throughput": 2315.0, "total_tokens": 30482400} {"current_steps": 52845, "total_steps": 67140, "loss": 0.6161, "lr": 6.593332850054004e-06, "epoch": 7.870866845397677, "percentage": 78.71, "elapsed_time": "3:39:28", "remaining_time": "0:59:22", "throughput": 2315.02, "total_tokens": 30485312} {"current_steps": 52850, "total_steps": 67140, "loss": 0.5533, "lr": 6.588935760361789e-06, "epoch": 7.871611557938635, "percentage": 78.72, "elapsed_time": "3:39:29", "remaining_time": "0:59:20", "throughput": 2315.05, "total_tokens": 30488448} {"current_steps": 52855, "total_steps": 67140, "loss": 0.5936, "lr": 6.584539914814439e-06, "epoch": 7.872356270479595, "percentage": 78.72, "elapsed_time": "3:39:30", "remaining_time": "0:59:19", "throughput": 2315.08, "total_tokens": 30491456} {"current_steps": 52860, "total_steps": 67140, "loss": 0.7292, "lr": 6.580145313709005e-06, "epoch": 7.873100983020554, "percentage": 78.73, "elapsed_time": "3:39:31", "remaining_time": "0:59:18", "throughput": 2315.1, "total_tokens": 30494432} {"current_steps": 52865, "total_steps": 67140, "loss": 0.6476, "lr": 6.575751957342463e-06, "epoch": 7.8738456955615135, "percentage": 78.74, "elapsed_time": "3:39:33", "remaining_time": "0:59:17", "throughput": 2315.13, "total_tokens": 30497504} {"current_steps": 52870, "total_steps": 67140, "loss": 0.5444, "lr": 6.571359846011696e-06, "epoch": 7.874590408102472, "percentage": 78.75, "elapsed_time": "3:39:34", "remaining_time": "0:59:15", "throughput": 2315.15, "total_tokens": 30500320} {"current_steps": 52875, "total_steps": 67140, "loss": 0.6009, "lr": 6.566968980013505e-06, "epoch": 7.875335120643432, "percentage": 78.75, "elapsed_time": "3:39:35", "remaining_time": "0:59:14", "throughput": 2315.17, "total_tokens": 30503264} {"current_steps": 52880, "total_steps": 67140, "loss": 0.7071, "lr": 6.5625793596446165e-06, "epoch": 7.876079833184391, "percentage": 78.76, "elapsed_time": "3:39:36", "remaining_time": "0:59:13", "throughput": 2315.2, "total_tokens": 30506368} {"current_steps": 52885, "total_steps": 67140, "loss": 0.906, "lr": 6.558190985201651e-06, "epoch": 7.87682454572535, "percentage": 78.77, "elapsed_time": "3:39:37", "remaining_time": "0:59:12", "throughput": 2315.22, "total_tokens": 30509248} {"current_steps": 52890, "total_steps": 67140, "loss": 0.3964, "lr": 6.553803856981152e-06, "epoch": 7.877569258266309, "percentage": 78.78, "elapsed_time": "3:39:38", "remaining_time": "0:59:10", "throughput": 2315.22, "total_tokens": 30511904} {"current_steps": 52895, "total_steps": 67140, "loss": 0.6256, "lr": 6.549417975279595e-06, "epoch": 7.878313970807269, "percentage": 78.78, "elapsed_time": "3:39:39", "remaining_time": "0:59:09", "throughput": 2315.24, "total_tokens": 30514816} {"current_steps": 52900, "total_steps": 67140, "loss": 0.6359, "lr": 6.545033340393356e-06, "epoch": 7.8790586833482275, "percentage": 78.79, "elapsed_time": "3:39:41", "remaining_time": "0:59:08", "throughput": 2315.26, "total_tokens": 30517728} {"current_steps": 52905, "total_steps": 67140, "loss": 0.6542, "lr": 6.540649952618727e-06, "epoch": 7.879803395889187, "percentage": 78.8, "elapsed_time": "3:39:42", "remaining_time": "0:59:06", "throughput": 2315.28, "total_tokens": 30520512} {"current_steps": 52910, "total_steps": 67140, "loss": 0.496, "lr": 6.536267812251928e-06, "epoch": 7.880548108430146, "percentage": 78.81, "elapsed_time": "3:39:43", "remaining_time": "0:59:05", "throughput": 2315.3, "total_tokens": 30523360} {"current_steps": 52915, "total_steps": 67140, "loss": 0.6842, "lr": 6.531886919589089e-06, "epoch": 7.8812928209711055, "percentage": 78.81, "elapsed_time": "3:39:44", "remaining_time": "0:59:04", "throughput": 2315.32, "total_tokens": 30526368} {"current_steps": 52920, "total_steps": 67140, "loss": 0.5317, "lr": 6.5275072749262395e-06, "epoch": 7.882037533512064, "percentage": 78.82, "elapsed_time": "3:39:45", "remaining_time": "0:59:03", "throughput": 2315.36, "total_tokens": 30529600} {"current_steps": 52925, "total_steps": 67140, "loss": 0.5144, "lr": 6.523128878559351e-06, "epoch": 7.882782246053024, "percentage": 78.83, "elapsed_time": "3:39:46", "remaining_time": "0:59:01", "throughput": 2315.38, "total_tokens": 30532640} {"current_steps": 52930, "total_steps": 67140, "loss": 0.4925, "lr": 6.518751730784284e-06, "epoch": 7.883526958593983, "percentage": 78.84, "elapsed_time": "3:39:47", "remaining_time": "0:59:00", "throughput": 2315.4, "total_tokens": 30535488} {"current_steps": 52935, "total_steps": 67140, "loss": 0.6013, "lr": 6.514375831896835e-06, "epoch": 7.884271671134941, "percentage": 78.84, "elapsed_time": "3:39:49", "remaining_time": "0:58:59", "throughput": 2315.43, "total_tokens": 30538592} {"current_steps": 52940, "total_steps": 67140, "loss": 0.5937, "lr": 6.51000118219271e-06, "epoch": 7.885016383675901, "percentage": 78.85, "elapsed_time": "3:39:50", "remaining_time": "0:58:58", "throughput": 2315.46, "total_tokens": 30541696} {"current_steps": 52945, "total_steps": 67140, "loss": 0.8564, "lr": 6.505627781967533e-06, "epoch": 7.885761096216861, "percentage": 78.86, "elapsed_time": "3:39:51", "remaining_time": "0:58:56", "throughput": 2315.47, "total_tokens": 30544416} {"current_steps": 52950, "total_steps": 67140, "loss": 0.6254, "lr": 6.501255631516842e-06, "epoch": 7.8865058087578195, "percentage": 78.87, "elapsed_time": "3:39:52", "remaining_time": "0:58:55", "throughput": 2315.48, "total_tokens": 30547040} {"current_steps": 52955, "total_steps": 67140, "loss": 0.4522, "lr": 6.4968847311360794e-06, "epoch": 7.887250521298778, "percentage": 78.87, "elapsed_time": "3:39:53", "remaining_time": "0:58:54", "throughput": 2315.49, "total_tokens": 30549760} {"current_steps": 52960, "total_steps": 67140, "loss": 0.4143, "lr": 6.4925150811206176e-06, "epoch": 7.887995233839738, "percentage": 78.88, "elapsed_time": "3:39:54", "remaining_time": "0:58:52", "throughput": 2315.49, "total_tokens": 30552384} {"current_steps": 52965, "total_steps": 67140, "loss": 0.4251, "lr": 6.48814668176575e-06, "epoch": 7.8887399463806975, "percentage": 78.89, "elapsed_time": "3:39:55", "remaining_time": "0:58:51", "throughput": 2315.51, "total_tokens": 30555136} {"current_steps": 52970, "total_steps": 67140, "loss": 0.6625, "lr": 6.483779533366654e-06, "epoch": 7.889484658921656, "percentage": 78.89, "elapsed_time": "3:39:57", "remaining_time": "0:58:50", "throughput": 2315.55, "total_tokens": 30558496} {"current_steps": 52975, "total_steps": 67140, "loss": 0.7044, "lr": 6.479413636218459e-06, "epoch": 7.890229371462615, "percentage": 78.9, "elapsed_time": "3:39:58", "remaining_time": "0:58:49", "throughput": 2315.57, "total_tokens": 30561376} {"current_steps": 52980, "total_steps": 67140, "loss": 0.5637, "lr": 6.4750489906162e-06, "epoch": 7.890974084003575, "percentage": 78.91, "elapsed_time": "3:39:59", "remaining_time": "0:58:47", "throughput": 2315.58, "total_tokens": 30564128} {"current_steps": 52985, "total_steps": 67140, "loss": 0.4889, "lr": 6.470685596854803e-06, "epoch": 7.8917187965445335, "percentage": 78.92, "elapsed_time": "3:40:00", "remaining_time": "0:58:46", "throughput": 2315.6, "total_tokens": 30567008} {"current_steps": 52990, "total_steps": 67140, "loss": 0.7069, "lr": 6.46632345522914e-06, "epoch": 7.892463509085493, "percentage": 78.92, "elapsed_time": "3:40:01", "remaining_time": "0:58:45", "throughput": 2315.62, "total_tokens": 30569856} {"current_steps": 52995, "total_steps": 67140, "loss": 0.6665, "lr": 6.461962566033986e-06, "epoch": 7.893208221626452, "percentage": 78.93, "elapsed_time": "3:40:02", "remaining_time": "0:58:43", "throughput": 2315.62, "total_tokens": 30572512} {"current_steps": 53000, "total_steps": 67140, "loss": 0.7749, "lr": 6.45760292956403e-06, "epoch": 7.8939529341674115, "percentage": 78.94, "elapsed_time": "3:40:03", "remaining_time": "0:58:42", "throughput": 2315.64, "total_tokens": 30575328} {"current_steps": 53005, "total_steps": 67140, "loss": 0.6423, "lr": 6.45324454611389e-06, "epoch": 7.89469764670837, "percentage": 78.95, "elapsed_time": "3:40:04", "remaining_time": "0:58:41", "throughput": 2315.65, "total_tokens": 30578144} {"current_steps": 53010, "total_steps": 67140, "loss": 0.4905, "lr": 6.448887415978069e-06, "epoch": 7.89544235924933, "percentage": 78.95, "elapsed_time": "3:40:06", "remaining_time": "0:58:40", "throughput": 2315.68, "total_tokens": 30581184} {"current_steps": 53015, "total_steps": 67140, "loss": 0.5688, "lr": 6.4445315394510205e-06, "epoch": 7.896187071790289, "percentage": 78.96, "elapsed_time": "3:40:07", "remaining_time": "0:58:38", "throughput": 2315.71, "total_tokens": 30584160} {"current_steps": 53020, "total_steps": 67140, "loss": 0.4215, "lr": 6.440176916827081e-06, "epoch": 7.896931784331248, "percentage": 78.97, "elapsed_time": "3:40:08", "remaining_time": "0:58:37", "throughput": 2315.72, "total_tokens": 30586880} {"current_steps": 53025, "total_steps": 67140, "loss": 0.6718, "lr": 6.435823548400529e-06, "epoch": 7.897676496872207, "percentage": 78.98, "elapsed_time": "3:40:09", "remaining_time": "0:58:36", "throughput": 2315.72, "total_tokens": 30589472} {"current_steps": 53030, "total_steps": 67140, "loss": 0.5685, "lr": 6.431471434465544e-06, "epoch": 7.898421209413167, "percentage": 78.98, "elapsed_time": "3:40:10", "remaining_time": "0:58:35", "throughput": 2315.75, "total_tokens": 30592512} {"current_steps": 53035, "total_steps": 67140, "loss": 0.5189, "lr": 6.427120575316226e-06, "epoch": 7.8991659219541255, "percentage": 78.99, "elapsed_time": "3:40:11", "remaining_time": "0:58:33", "throughput": 2315.77, "total_tokens": 30595328} {"current_steps": 53040, "total_steps": 67140, "loss": 0.4735, "lr": 6.422770971246586e-06, "epoch": 7.899910634495085, "percentage": 79.0, "elapsed_time": "3:40:12", "remaining_time": "0:58:32", "throughput": 2315.79, "total_tokens": 30598336} {"current_steps": 53045, "total_steps": 67140, "loss": 0.6406, "lr": 6.4184226225505625e-06, "epoch": 7.900655347036044, "percentage": 79.01, "elapsed_time": "3:40:14", "remaining_time": "0:58:31", "throughput": 2315.81, "total_tokens": 30601184} {"current_steps": 53050, "total_steps": 67140, "loss": 0.6057, "lr": 6.414075529521993e-06, "epoch": 7.9014000595770035, "percentage": 79.01, "elapsed_time": "3:40:15", "remaining_time": "0:58:29", "throughput": 2315.83, "total_tokens": 30604128} {"current_steps": 53055, "total_steps": 67140, "loss": 0.4882, "lr": 6.409729692454625e-06, "epoch": 7.902144772117962, "percentage": 79.02, "elapsed_time": "3:40:16", "remaining_time": "0:58:28", "throughput": 2315.84, "total_tokens": 30606880} {"current_steps": 53060, "total_steps": 67140, "loss": 0.6271, "lr": 6.4053851116421395e-06, "epoch": 7.902889484658922, "percentage": 79.03, "elapsed_time": "3:40:17", "remaining_time": "0:58:27", "throughput": 2315.87, "total_tokens": 30609888} {"current_steps": 53065, "total_steps": 67140, "loss": 0.6327, "lr": 6.401041787378131e-06, "epoch": 7.903634197199881, "percentage": 79.04, "elapsed_time": "3:40:18", "remaining_time": "0:58:26", "throughput": 2315.89, "total_tokens": 30612768} {"current_steps": 53070, "total_steps": 67140, "loss": 0.5837, "lr": 6.396699719956101e-06, "epoch": 7.90437890974084, "percentage": 79.04, "elapsed_time": "3:40:19", "remaining_time": "0:58:24", "throughput": 2315.91, "total_tokens": 30615584} {"current_steps": 53075, "total_steps": 67140, "loss": 0.5292, "lr": 6.3923589096694685e-06, "epoch": 7.905123622281799, "percentage": 79.05, "elapsed_time": "3:40:20", "remaining_time": "0:58:23", "throughput": 2315.93, "total_tokens": 30618464} {"current_steps": 53080, "total_steps": 67140, "loss": 0.5172, "lr": 6.388019356811573e-06, "epoch": 7.905868334822759, "percentage": 79.06, "elapsed_time": "3:40:21", "remaining_time": "0:58:22", "throughput": 2315.96, "total_tokens": 30621536} {"current_steps": 53085, "total_steps": 67140, "loss": 0.5975, "lr": 6.3836810616756614e-06, "epoch": 7.9066130473637175, "percentage": 79.07, "elapsed_time": "3:40:23", "remaining_time": "0:58:21", "throughput": 2315.98, "total_tokens": 30624448} {"current_steps": 53090, "total_steps": 67140, "loss": 0.6962, "lr": 6.379344024554884e-06, "epoch": 7.907357759904677, "percentage": 79.07, "elapsed_time": "3:40:24", "remaining_time": "0:58:19", "throughput": 2316.0, "total_tokens": 30627424} {"current_steps": 53095, "total_steps": 67140, "loss": 0.5409, "lr": 6.375008245742334e-06, "epoch": 7.908102472445636, "percentage": 79.08, "elapsed_time": "3:40:25", "remaining_time": "0:58:18", "throughput": 2316.01, "total_tokens": 30630080} {"current_steps": 53100, "total_steps": 67140, "loss": 0.6701, "lr": 6.370673725531004e-06, "epoch": 7.908847184986596, "percentage": 79.09, "elapsed_time": "3:40:26", "remaining_time": "0:58:17", "throughput": 2316.03, "total_tokens": 30632928} {"current_steps": 53105, "total_steps": 67140, "loss": 0.5779, "lr": 6.366340464213799e-06, "epoch": 7.909591897527554, "percentage": 79.1, "elapsed_time": "3:40:27", "remaining_time": "0:58:15", "throughput": 2316.05, "total_tokens": 30635712} {"current_steps": 53110, "total_steps": 67140, "loss": 0.5654, "lr": 6.3620084620835494e-06, "epoch": 7.910336610068514, "percentage": 79.1, "elapsed_time": "3:40:28", "remaining_time": "0:58:14", "throughput": 2316.06, "total_tokens": 30638528} {"current_steps": 53115, "total_steps": 67140, "loss": 0.5344, "lr": 6.357677719432998e-06, "epoch": 7.911081322609473, "percentage": 79.11, "elapsed_time": "3:40:29", "remaining_time": "0:58:13", "throughput": 2316.08, "total_tokens": 30641408} {"current_steps": 53120, "total_steps": 67140, "loss": 0.503, "lr": 6.353348236554784e-06, "epoch": 7.9118260351504315, "percentage": 79.12, "elapsed_time": "3:40:31", "remaining_time": "0:58:12", "throughput": 2316.1, "total_tokens": 30644320} {"current_steps": 53125, "total_steps": 67140, "loss": 0.4549, "lr": 6.349020013741491e-06, "epoch": 7.912570747691391, "percentage": 79.13, "elapsed_time": "3:40:32", "remaining_time": "0:58:10", "throughput": 2316.12, "total_tokens": 30647200} {"current_steps": 53130, "total_steps": 67140, "loss": 0.6922, "lr": 6.3446930512855914e-06, "epoch": 7.913315460232351, "percentage": 79.13, "elapsed_time": "3:40:33", "remaining_time": "0:58:09", "throughput": 2316.13, "total_tokens": 30649984} {"current_steps": 53135, "total_steps": 67140, "loss": 0.6056, "lr": 6.340367349479487e-06, "epoch": 7.9140601727733095, "percentage": 79.14, "elapsed_time": "3:40:34", "remaining_time": "0:58:08", "throughput": 2316.16, "total_tokens": 30652896} {"current_steps": 53140, "total_steps": 67140, "loss": 0.8286, "lr": 6.336042908615492e-06, "epoch": 7.914804885314268, "percentage": 79.15, "elapsed_time": "3:40:35", "remaining_time": "0:58:06", "throughput": 2316.17, "total_tokens": 30655776} {"current_steps": 53145, "total_steps": 67140, "loss": 0.5461, "lr": 6.331719728985844e-06, "epoch": 7.915549597855228, "percentage": 79.16, "elapsed_time": "3:40:36", "remaining_time": "0:58:05", "throughput": 2316.19, "total_tokens": 30658560} {"current_steps": 53150, "total_steps": 67140, "loss": 0.6571, "lr": 6.3273978108826685e-06, "epoch": 7.916294310396187, "percentage": 79.16, "elapsed_time": "3:40:37", "remaining_time": "0:58:04", "throughput": 2316.2, "total_tokens": 30661344} {"current_steps": 53155, "total_steps": 67140, "loss": 0.7362, "lr": 6.323077154598031e-06, "epoch": 7.917039022937146, "percentage": 79.17, "elapsed_time": "3:40:38", "remaining_time": "0:58:03", "throughput": 2316.21, "total_tokens": 30663968} {"current_steps": 53160, "total_steps": 67140, "loss": 0.5475, "lr": 6.3187577604239074e-06, "epoch": 7.917783735478105, "percentage": 79.18, "elapsed_time": "3:40:40", "remaining_time": "0:58:01", "throughput": 2316.23, "total_tokens": 30666880} {"current_steps": 53165, "total_steps": 67140, "loss": 0.7011, "lr": 6.314439628652186e-06, "epoch": 7.918528448019065, "percentage": 79.19, "elapsed_time": "3:40:41", "remaining_time": "0:58:00", "throughput": 2316.24, "total_tokens": 30669632} {"current_steps": 53170, "total_steps": 67140, "loss": 0.5739, "lr": 6.31012275957466e-06, "epoch": 7.9192731605600235, "percentage": 79.19, "elapsed_time": "3:40:42", "remaining_time": "0:57:59", "throughput": 2316.27, "total_tokens": 30672768} {"current_steps": 53175, "total_steps": 67140, "loss": 0.6929, "lr": 6.305807153483048e-06, "epoch": 7.920017873100983, "percentage": 79.2, "elapsed_time": "3:40:43", "remaining_time": "0:57:58", "throughput": 2316.29, "total_tokens": 30675648} {"current_steps": 53180, "total_steps": 67140, "loss": 0.5937, "lr": 6.3014928106689905e-06, "epoch": 7.920762585641942, "percentage": 79.21, "elapsed_time": "3:40:44", "remaining_time": "0:57:56", "throughput": 2316.31, "total_tokens": 30678528} {"current_steps": 53185, "total_steps": 67140, "loss": 0.5068, "lr": 6.297179731424022e-06, "epoch": 7.921507298182902, "percentage": 79.22, "elapsed_time": "3:40:45", "remaining_time": "0:57:55", "throughput": 2316.32, "total_tokens": 30681184} {"current_steps": 53190, "total_steps": 67140, "loss": 0.7021, "lr": 6.292867916039605e-06, "epoch": 7.92225201072386, "percentage": 79.22, "elapsed_time": "3:40:46", "remaining_time": "0:57:54", "throughput": 2316.34, "total_tokens": 30684192} {"current_steps": 53195, "total_steps": 67140, "loss": 0.6104, "lr": 6.288557364807118e-06, "epoch": 7.92299672326482, "percentage": 79.23, "elapsed_time": "3:40:48", "remaining_time": "0:57:52", "throughput": 2316.38, "total_tokens": 30687424} {"current_steps": 53200, "total_steps": 67140, "loss": 0.5132, "lr": 6.284248078017846e-06, "epoch": 7.923741435805779, "percentage": 79.24, "elapsed_time": "3:40:49", "remaining_time": "0:57:51", "throughput": 2316.39, "total_tokens": 30690240} {"current_steps": 53205, "total_steps": 67140, "loss": 0.4907, "lr": 6.279940055963007e-06, "epoch": 7.924486148346738, "percentage": 79.24, "elapsed_time": "3:40:50", "remaining_time": "0:57:50", "throughput": 2316.41, "total_tokens": 30693088} {"current_steps": 53210, "total_steps": 67140, "loss": 0.6259, "lr": 6.2756332989337005e-06, "epoch": 7.925230860887697, "percentage": 79.25, "elapsed_time": "3:40:51", "remaining_time": "0:57:49", "throughput": 2316.42, "total_tokens": 30695840} {"current_steps": 53215, "total_steps": 67140, "loss": 0.4947, "lr": 6.271327807220975e-06, "epoch": 7.925975573428657, "percentage": 79.26, "elapsed_time": "3:40:52", "remaining_time": "0:57:47", "throughput": 2316.44, "total_tokens": 30698720} {"current_steps": 53220, "total_steps": 67140, "loss": 0.6123, "lr": 6.267023581115763e-06, "epoch": 7.9267202859696155, "percentage": 79.27, "elapsed_time": "3:40:53", "remaining_time": "0:57:46", "throughput": 2316.46, "total_tokens": 30701696} {"current_steps": 53225, "total_steps": 67140, "loss": 0.5432, "lr": 6.262720620908935e-06, "epoch": 7.927464998510575, "percentage": 79.27, "elapsed_time": "3:40:54", "remaining_time": "0:57:45", "throughput": 2316.48, "total_tokens": 30704480} {"current_steps": 53230, "total_steps": 67140, "loss": 0.5563, "lr": 6.258418926891269e-06, "epoch": 7.928209711051534, "percentage": 79.28, "elapsed_time": "3:40:55", "remaining_time": "0:57:44", "throughput": 2316.5, "total_tokens": 30707392} {"current_steps": 53235, "total_steps": 67140, "loss": 0.5472, "lr": 6.254118499353451e-06, "epoch": 7.928954423592494, "percentage": 79.29, "elapsed_time": "3:40:57", "remaining_time": "0:57:42", "throughput": 2316.52, "total_tokens": 30710304} {"current_steps": 53240, "total_steps": 67140, "loss": 0.5907, "lr": 6.249819338586091e-06, "epoch": 7.929699136133452, "percentage": 79.3, "elapsed_time": "3:40:58", "remaining_time": "0:57:41", "throughput": 2316.54, "total_tokens": 30713184} {"current_steps": 53245, "total_steps": 67140, "loss": 0.5045, "lr": 6.245521444879715e-06, "epoch": 7.930443848674412, "percentage": 79.3, "elapsed_time": "3:40:59", "remaining_time": "0:57:40", "throughput": 2316.56, "total_tokens": 30716128} {"current_steps": 53250, "total_steps": 67140, "loss": 0.6705, "lr": 6.241224818524749e-06, "epoch": 7.931188561215371, "percentage": 79.31, "elapsed_time": "3:41:00", "remaining_time": "0:57:38", "throughput": 2316.57, "total_tokens": 30718912} {"current_steps": 53255, "total_steps": 67140, "loss": 0.6079, "lr": 6.236929459811536e-06, "epoch": 7.93193327375633, "percentage": 79.32, "elapsed_time": "3:41:01", "remaining_time": "0:57:37", "throughput": 2316.6, "total_tokens": 30721856} {"current_steps": 53260, "total_steps": 67140, "loss": 0.3373, "lr": 6.232635369030346e-06, "epoch": 7.932677986297289, "percentage": 79.33, "elapsed_time": "3:41:02", "remaining_time": "0:57:36", "throughput": 2316.62, "total_tokens": 30724960} {"current_steps": 53265, "total_steps": 67140, "loss": 0.5301, "lr": 6.228342546471353e-06, "epoch": 7.933422698838249, "percentage": 79.33, "elapsed_time": "3:41:03", "remaining_time": "0:57:35", "throughput": 2316.64, "total_tokens": 30727808} {"current_steps": 53270, "total_steps": 67140, "loss": 0.474, "lr": 6.224050992424652e-06, "epoch": 7.934167411379208, "percentage": 79.34, "elapsed_time": "3:41:05", "remaining_time": "0:57:33", "throughput": 2316.67, "total_tokens": 30730880} {"current_steps": 53275, "total_steps": 67140, "loss": 0.5926, "lr": 6.219760707180244e-06, "epoch": 7.934912123920167, "percentage": 79.35, "elapsed_time": "3:41:06", "remaining_time": "0:57:32", "throughput": 2316.68, "total_tokens": 30733632} {"current_steps": 53280, "total_steps": 67140, "loss": 0.5559, "lr": 6.215471691028063e-06, "epoch": 7.935656836461126, "percentage": 79.36, "elapsed_time": "3:41:07", "remaining_time": "0:57:31", "throughput": 2316.7, "total_tokens": 30736448} {"current_steps": 53285, "total_steps": 67140, "loss": 0.7726, "lr": 6.2111839442579335e-06, "epoch": 7.936401549002085, "percentage": 79.36, "elapsed_time": "3:41:08", "remaining_time": "0:57:30", "throughput": 2316.72, "total_tokens": 30739392} {"current_steps": 53290, "total_steps": 67140, "loss": 0.4571, "lr": 6.206897467159595e-06, "epoch": 7.937146261543044, "percentage": 79.37, "elapsed_time": "3:41:09", "remaining_time": "0:57:28", "throughput": 2316.76, "total_tokens": 30742720} {"current_steps": 53295, "total_steps": 67140, "loss": 0.673, "lr": 6.20261226002272e-06, "epoch": 7.937890974084004, "percentage": 79.38, "elapsed_time": "3:41:10", "remaining_time": "0:57:27", "throughput": 2316.76, "total_tokens": 30745344} {"current_steps": 53300, "total_steps": 67140, "loss": 0.66, "lr": 6.198328323136881e-06, "epoch": 7.938635686624963, "percentage": 79.39, "elapsed_time": "3:41:11", "remaining_time": "0:57:26", "throughput": 2316.78, "total_tokens": 30748128} {"current_steps": 53305, "total_steps": 67140, "loss": 0.5826, "lr": 6.1940456567915725e-06, "epoch": 7.9393803991659215, "percentage": 79.39, "elapsed_time": "3:41:13", "remaining_time": "0:57:24", "throughput": 2316.81, "total_tokens": 30751264} {"current_steps": 53310, "total_steps": 67140, "loss": 0.5417, "lr": 6.189764261276207e-06, "epoch": 7.940125111706881, "percentage": 79.4, "elapsed_time": "3:41:14", "remaining_time": "0:57:23", "throughput": 2316.82, "total_tokens": 30754016} {"current_steps": 53315, "total_steps": 67140, "loss": 0.5515, "lr": 6.185484136880088e-06, "epoch": 7.940869824247841, "percentage": 79.41, "elapsed_time": "3:41:15", "remaining_time": "0:57:22", "throughput": 2316.84, "total_tokens": 30756800} {"current_steps": 53320, "total_steps": 67140, "loss": 0.8071, "lr": 6.181205283892458e-06, "epoch": 7.9416145367888, "percentage": 79.42, "elapsed_time": "3:41:16", "remaining_time": "0:57:21", "throughput": 2316.85, "total_tokens": 30759616} {"current_steps": 53325, "total_steps": 67140, "loss": 0.7969, "lr": 6.1769277026024615e-06, "epoch": 7.942359249329758, "percentage": 79.42, "elapsed_time": "3:41:17", "remaining_time": "0:57:19", "throughput": 2316.87, "total_tokens": 30762496} {"current_steps": 53330, "total_steps": 67140, "loss": 0.688, "lr": 6.1726513932991724e-06, "epoch": 7.943103961870718, "percentage": 79.43, "elapsed_time": "3:41:18", "remaining_time": "0:57:18", "throughput": 2316.89, "total_tokens": 30765344} {"current_steps": 53335, "total_steps": 67140, "loss": 0.4047, "lr": 6.168376356271546e-06, "epoch": 7.943848674411677, "percentage": 79.44, "elapsed_time": "3:41:19", "remaining_time": "0:57:17", "throughput": 2316.9, "total_tokens": 30768160} {"current_steps": 53340, "total_steps": 67140, "loss": 0.5841, "lr": 6.1641025918084825e-06, "epoch": 7.944593386952636, "percentage": 79.45, "elapsed_time": "3:41:21", "remaining_time": "0:57:16", "throughput": 2316.93, "total_tokens": 30771328} {"current_steps": 53345, "total_steps": 67140, "loss": 0.7003, "lr": 6.15983010019879e-06, "epoch": 7.945338099493595, "percentage": 79.45, "elapsed_time": "3:41:22", "remaining_time": "0:57:14", "throughput": 2316.95, "total_tokens": 30774080} {"current_steps": 53350, "total_steps": 67140, "loss": 0.7816, "lr": 6.155558881731174e-06, "epoch": 7.946082812034555, "percentage": 79.46, "elapsed_time": "3:41:23", "remaining_time": "0:57:13", "throughput": 2316.95, "total_tokens": 30776768} {"current_steps": 53355, "total_steps": 67140, "loss": 0.6341, "lr": 6.151288936694274e-06, "epoch": 7.946827524575514, "percentage": 79.47, "elapsed_time": "3:41:24", "remaining_time": "0:57:12", "throughput": 2316.97, "total_tokens": 30779520} {"current_steps": 53360, "total_steps": 67140, "loss": 0.6746, "lr": 6.147020265376635e-06, "epoch": 7.947572237116473, "percentage": 79.48, "elapsed_time": "3:41:25", "remaining_time": "0:57:10", "throughput": 2316.99, "total_tokens": 30782464} {"current_steps": 53365, "total_steps": 67140, "loss": 0.6144, "lr": 6.1427528680667144e-06, "epoch": 7.948316949657432, "percentage": 79.48, "elapsed_time": "3:41:26", "remaining_time": "0:57:09", "throughput": 2317.0, "total_tokens": 30785248} {"current_steps": 53370, "total_steps": 67140, "loss": 0.3493, "lr": 6.138486745052896e-06, "epoch": 7.949061662198392, "percentage": 79.49, "elapsed_time": "3:41:27", "remaining_time": "0:57:08", "throughput": 2317.03, "total_tokens": 30788256} {"current_steps": 53375, "total_steps": 67140, "loss": 0.5003, "lr": 6.134221896623449e-06, "epoch": 7.94980637473935, "percentage": 79.5, "elapsed_time": "3:41:28", "remaining_time": "0:57:07", "throughput": 2317.05, "total_tokens": 30791168} {"current_steps": 53380, "total_steps": 67140, "loss": 0.4869, "lr": 6.129958323066592e-06, "epoch": 7.95055108728031, "percentage": 79.51, "elapsed_time": "3:41:30", "remaining_time": "0:57:05", "throughput": 2317.08, "total_tokens": 30794304} {"current_steps": 53385, "total_steps": 67140, "loss": 0.6933, "lr": 6.1256960246704245e-06, "epoch": 7.951295799821269, "percentage": 79.51, "elapsed_time": "3:41:31", "remaining_time": "0:57:04", "throughput": 2317.1, "total_tokens": 30797216} {"current_steps": 53390, "total_steps": 67140, "loss": 0.6029, "lr": 6.1214350017229805e-06, "epoch": 7.952040512362228, "percentage": 79.52, "elapsed_time": "3:41:32", "remaining_time": "0:57:03", "throughput": 2317.12, "total_tokens": 30800064} {"current_steps": 53395, "total_steps": 67140, "loss": 0.5634, "lr": 6.117175254512206e-06, "epoch": 7.952785224903187, "percentage": 79.53, "elapsed_time": "3:41:33", "remaining_time": "0:57:02", "throughput": 2317.14, "total_tokens": 30803008} {"current_steps": 53400, "total_steps": 67140, "loss": 0.4744, "lr": 6.1129167833259535e-06, "epoch": 7.953529937444147, "percentage": 79.54, "elapsed_time": "3:41:34", "remaining_time": "0:57:00", "throughput": 2317.16, "total_tokens": 30805888} {"current_steps": 53405, "total_steps": 67140, "loss": 0.415, "lr": 6.108659588451998e-06, "epoch": 7.954274649985106, "percentage": 79.54, "elapsed_time": "3:41:35", "remaining_time": "0:56:59", "throughput": 2317.19, "total_tokens": 30809024} {"current_steps": 53410, "total_steps": 67140, "loss": 0.6402, "lr": 6.104403670178027e-06, "epoch": 7.955019362526065, "percentage": 79.55, "elapsed_time": "3:41:37", "remaining_time": "0:56:58", "throughput": 2317.21, "total_tokens": 30811936} {"current_steps": 53415, "total_steps": 67140, "loss": 0.5368, "lr": 6.1001490287916326e-06, "epoch": 7.955764075067024, "percentage": 79.56, "elapsed_time": "3:41:38", "remaining_time": "0:56:56", "throughput": 2317.23, "total_tokens": 30814784} {"current_steps": 53420, "total_steps": 67140, "loss": 0.618, "lr": 6.095895664580317e-06, "epoch": 7.956508787607984, "percentage": 79.57, "elapsed_time": "3:41:39", "remaining_time": "0:56:55", "throughput": 2317.24, "total_tokens": 30817504} {"current_steps": 53425, "total_steps": 67140, "loss": 0.591, "lr": 6.0916435778315156e-06, "epoch": 7.957253500148942, "percentage": 79.57, "elapsed_time": "3:41:40", "remaining_time": "0:56:54", "throughput": 2317.26, "total_tokens": 30820512} {"current_steps": 53430, "total_steps": 67140, "loss": 0.6595, "lr": 6.087392768832567e-06, "epoch": 7.957998212689902, "percentage": 79.58, "elapsed_time": "3:41:41", "remaining_time": "0:56:53", "throughput": 2317.28, "total_tokens": 30823264} {"current_steps": 53435, "total_steps": 67140, "loss": 0.7787, "lr": 6.08314323787072e-06, "epoch": 7.958742925230861, "percentage": 79.59, "elapsed_time": "3:41:42", "remaining_time": "0:56:51", "throughput": 2317.29, "total_tokens": 30826112} {"current_steps": 53440, "total_steps": 67140, "loss": 0.5252, "lr": 6.078894985233141e-06, "epoch": 7.9594876377718204, "percentage": 79.59, "elapsed_time": "3:41:43", "remaining_time": "0:56:50", "throughput": 2317.32, "total_tokens": 30829216} {"current_steps": 53445, "total_steps": 67140, "loss": 0.5929, "lr": 6.074648011206921e-06, "epoch": 7.960232350312779, "percentage": 79.6, "elapsed_time": "3:41:44", "remaining_time": "0:56:49", "throughput": 2317.33, "total_tokens": 30831840} {"current_steps": 53450, "total_steps": 67140, "loss": 0.5804, "lr": 6.070402316079043e-06, "epoch": 7.960977062853738, "percentage": 79.61, "elapsed_time": "3:41:46", "remaining_time": "0:56:48", "throughput": 2317.34, "total_tokens": 30834656} {"current_steps": 53455, "total_steps": 67140, "loss": 0.5452, "lr": 6.066157900136407e-06, "epoch": 7.961721775394698, "percentage": 79.62, "elapsed_time": "3:41:47", "remaining_time": "0:56:46", "throughput": 2317.35, "total_tokens": 30837280} {"current_steps": 53460, "total_steps": 67140, "loss": 0.6864, "lr": 6.0619147636658405e-06, "epoch": 7.962466487935657, "percentage": 79.62, "elapsed_time": "3:41:48", "remaining_time": "0:56:45", "throughput": 2317.37, "total_tokens": 30840288} {"current_steps": 53465, "total_steps": 67140, "loss": 0.4397, "lr": 6.057672906954076e-06, "epoch": 7.963211200476616, "percentage": 79.63, "elapsed_time": "3:41:49", "remaining_time": "0:56:44", "throughput": 2317.4, "total_tokens": 30843328} {"current_steps": 53470, "total_steps": 67140, "loss": 0.6216, "lr": 6.053432330287765e-06, "epoch": 7.963955913017575, "percentage": 79.64, "elapsed_time": "3:41:50", "remaining_time": "0:56:42", "throughput": 2317.44, "total_tokens": 30846592} {"current_steps": 53475, "total_steps": 67140, "loss": 0.5232, "lr": 6.049193033953474e-06, "epoch": 7.964700625558534, "percentage": 79.65, "elapsed_time": "3:41:51", "remaining_time": "0:56:41", "throughput": 2317.46, "total_tokens": 30849536} {"current_steps": 53480, "total_steps": 67140, "loss": 0.553, "lr": 6.044955018237661e-06, "epoch": 7.965445338099494, "percentage": 79.65, "elapsed_time": "3:41:53", "remaining_time": "0:56:40", "throughput": 2317.51, "total_tokens": 30852992} {"current_steps": 53485, "total_steps": 67140, "loss": 0.6842, "lr": 6.040718283426722e-06, "epoch": 7.966190050640453, "percentage": 79.66, "elapsed_time": "3:41:54", "remaining_time": "0:56:39", "throughput": 2317.52, "total_tokens": 30855872} {"current_steps": 53490, "total_steps": 67140, "loss": 0.524, "lr": 6.036482829806964e-06, "epoch": 7.966934763181412, "percentage": 79.67, "elapsed_time": "3:41:55", "remaining_time": "0:56:37", "throughput": 2317.53, "total_tokens": 30858624} {"current_steps": 53495, "total_steps": 67140, "loss": 0.6769, "lr": 6.032248657664591e-06, "epoch": 7.967679475722371, "percentage": 79.68, "elapsed_time": "3:41:56", "remaining_time": "0:56:36", "throughput": 2317.56, "total_tokens": 30861760} {"current_steps": 53500, "total_steps": 67140, "loss": 0.6112, "lr": 6.028015767285735e-06, "epoch": 7.96842418826333, "percentage": 79.68, "elapsed_time": "3:41:57", "remaining_time": "0:56:35", "throughput": 2317.59, "total_tokens": 30864896} {"current_steps": 53505, "total_steps": 67140, "loss": 0.6018, "lr": 6.023784158956442e-06, "epoch": 7.96916890080429, "percentage": 79.69, "elapsed_time": "3:41:58", "remaining_time": "0:56:34", "throughput": 2317.61, "total_tokens": 30867712} {"current_steps": 53510, "total_steps": 67140, "loss": 0.5795, "lr": 6.019553832962668e-06, "epoch": 7.969913613345248, "percentage": 79.7, "elapsed_time": "3:41:59", "remaining_time": "0:56:32", "throughput": 2317.62, "total_tokens": 30870336} {"current_steps": 53515, "total_steps": 67140, "loss": 0.5947, "lr": 6.015324789590271e-06, "epoch": 7.970658325886208, "percentage": 79.71, "elapsed_time": "3:42:01", "remaining_time": "0:56:31", "throughput": 2317.67, "total_tokens": 30873760} {"current_steps": 53520, "total_steps": 67140, "loss": 0.4473, "lr": 6.01109702912504e-06, "epoch": 7.971403038427167, "percentage": 79.71, "elapsed_time": "3:42:02", "remaining_time": "0:56:30", "throughput": 2317.68, "total_tokens": 30876480} {"current_steps": 53525, "total_steps": 67140, "loss": 0.632, "lr": 6.006870551852667e-06, "epoch": 7.9721477509681264, "percentage": 79.72, "elapsed_time": "3:42:03", "remaining_time": "0:56:28", "throughput": 2317.68, "total_tokens": 30879104} {"current_steps": 53530, "total_steps": 67140, "loss": 0.6247, "lr": 6.00264535805877e-06, "epoch": 7.972892463509085, "percentage": 79.73, "elapsed_time": "3:42:04", "remaining_time": "0:56:27", "throughput": 2317.7, "total_tokens": 30881984} {"current_steps": 53535, "total_steps": 67140, "loss": 0.6227, "lr": 5.998421448028854e-06, "epoch": 7.973637176050045, "percentage": 79.74, "elapsed_time": "3:42:05", "remaining_time": "0:56:26", "throughput": 2317.73, "total_tokens": 30885024} {"current_steps": 53540, "total_steps": 67140, "loss": 0.6268, "lr": 5.994198822048361e-06, "epoch": 7.974381888591004, "percentage": 79.74, "elapsed_time": "3:42:06", "remaining_time": "0:56:25", "throughput": 2317.76, "total_tokens": 30888096} {"current_steps": 53545, "total_steps": 67140, "loss": 0.5941, "lr": 5.989977480402648e-06, "epoch": 7.975126601131963, "percentage": 79.75, "elapsed_time": "3:42:07", "remaining_time": "0:56:23", "throughput": 2317.77, "total_tokens": 30890880} {"current_steps": 53550, "total_steps": 67140, "loss": 0.5851, "lr": 5.985757423376962e-06, "epoch": 7.975871313672922, "percentage": 79.76, "elapsed_time": "3:42:08", "remaining_time": "0:56:22", "throughput": 2317.78, "total_tokens": 30893568} {"current_steps": 53555, "total_steps": 67140, "loss": 0.6606, "lr": 5.98153865125648e-06, "epoch": 7.976616026213882, "percentage": 79.77, "elapsed_time": "3:42:10", "remaining_time": "0:56:21", "throughput": 2317.8, "total_tokens": 30896384} {"current_steps": 53560, "total_steps": 67140, "loss": 0.6937, "lr": 5.977321164326294e-06, "epoch": 7.97736073875484, "percentage": 79.77, "elapsed_time": "3:42:11", "remaining_time": "0:56:20", "throughput": 2317.82, "total_tokens": 30899328} {"current_steps": 53565, "total_steps": 67140, "loss": 0.4847, "lr": 5.973104962871403e-06, "epoch": 7.9781054512958, "percentage": 79.78, "elapsed_time": "3:42:12", "remaining_time": "0:56:18", "throughput": 2317.84, "total_tokens": 30902176} {"current_steps": 53570, "total_steps": 67140, "loss": 0.4366, "lr": 5.968890047176728e-06, "epoch": 7.978850163836759, "percentage": 79.79, "elapsed_time": "3:42:13", "remaining_time": "0:56:17", "throughput": 2317.85, "total_tokens": 30904800} {"current_steps": 53575, "total_steps": 67140, "loss": 0.6769, "lr": 5.964676417527082e-06, "epoch": 7.9795948763777185, "percentage": 79.8, "elapsed_time": "3:42:14", "remaining_time": "0:56:16", "throughput": 2317.87, "total_tokens": 30907872} {"current_steps": 53580, "total_steps": 67140, "loss": 0.4885, "lr": 5.960464074207217e-06, "epoch": 7.980339588918677, "percentage": 79.8, "elapsed_time": "3:42:15", "remaining_time": "0:56:14", "throughput": 2317.88, "total_tokens": 30910464} {"current_steps": 53585, "total_steps": 67140, "loss": 0.7113, "lr": 5.956253017501776e-06, "epoch": 7.981084301459637, "percentage": 79.81, "elapsed_time": "3:42:16", "remaining_time": "0:56:13", "throughput": 2317.9, "total_tokens": 30913312} {"current_steps": 53590, "total_steps": 67140, "loss": 0.3792, "lr": 5.95204324769533e-06, "epoch": 7.981829014000596, "percentage": 79.82, "elapsed_time": "3:42:17", "remaining_time": "0:56:12", "throughput": 2317.91, "total_tokens": 30916160} {"current_steps": 53595, "total_steps": 67140, "loss": 0.6306, "lr": 5.947834765072355e-06, "epoch": 7.982573726541555, "percentage": 79.83, "elapsed_time": "3:42:19", "remaining_time": "0:56:11", "throughput": 2317.92, "total_tokens": 30918688} {"current_steps": 53600, "total_steps": 67140, "loss": 0.5597, "lr": 5.943627569917248e-06, "epoch": 7.983318439082514, "percentage": 79.83, "elapsed_time": "3:42:20", "remaining_time": "0:56:09", "throughput": 2317.95, "total_tokens": 30921824} {"current_steps": 53605, "total_steps": 67140, "loss": 0.5908, "lr": 5.939421662514314e-06, "epoch": 7.984063151623474, "percentage": 79.84, "elapsed_time": "3:42:21", "remaining_time": "0:56:08", "throughput": 2317.96, "total_tokens": 30924704} {"current_steps": 53610, "total_steps": 67140, "loss": 0.5726, "lr": 5.9352170431477755e-06, "epoch": 7.9848078641644324, "percentage": 79.85, "elapsed_time": "3:42:22", "remaining_time": "0:56:07", "throughput": 2317.98, "total_tokens": 30927552} {"current_steps": 53615, "total_steps": 67140, "loss": 0.6028, "lr": 5.931013712101754e-06, "epoch": 7.985552576705392, "percentage": 79.86, "elapsed_time": "3:42:23", "remaining_time": "0:56:06", "throughput": 2318.0, "total_tokens": 30930432} {"current_steps": 53620, "total_steps": 67140, "loss": 0.5506, "lr": 5.926811669660296e-06, "epoch": 7.986297289246351, "percentage": 79.86, "elapsed_time": "3:42:24", "remaining_time": "0:56:04", "throughput": 2318.02, "total_tokens": 30933376} {"current_steps": 53625, "total_steps": 67140, "loss": 0.537, "lr": 5.922610916107355e-06, "epoch": 7.9870420017873105, "percentage": 79.87, "elapsed_time": "3:42:25", "remaining_time": "0:56:03", "throughput": 2318.03, "total_tokens": 30936096} {"current_steps": 53630, "total_steps": 67140, "loss": 0.5757, "lr": 5.918411451726804e-06, "epoch": 7.987786714328269, "percentage": 79.88, "elapsed_time": "3:42:26", "remaining_time": "0:56:02", "throughput": 2318.04, "total_tokens": 30938816} {"current_steps": 53635, "total_steps": 67140, "loss": 0.499, "lr": 5.91421327680243e-06, "epoch": 7.988531426869228, "percentage": 79.89, "elapsed_time": "3:42:28", "remaining_time": "0:56:00", "throughput": 2318.06, "total_tokens": 30941600} {"current_steps": 53640, "total_steps": 67140, "loss": 0.5684, "lr": 5.910016391617934e-06, "epoch": 7.989276139410188, "percentage": 79.89, "elapsed_time": "3:42:29", "remaining_time": "0:55:59", "throughput": 2318.08, "total_tokens": 30944608} {"current_steps": 53645, "total_steps": 67140, "loss": 0.4711, "lr": 5.905820796456906e-06, "epoch": 7.990020851951147, "percentage": 79.9, "elapsed_time": "3:42:30", "remaining_time": "0:55:58", "throughput": 2318.1, "total_tokens": 30947424} {"current_steps": 53650, "total_steps": 67140, "loss": 0.5031, "lr": 5.901626491602885e-06, "epoch": 7.990765564492106, "percentage": 79.91, "elapsed_time": "3:42:31", "remaining_time": "0:55:57", "throughput": 2318.11, "total_tokens": 30950176} {"current_steps": 53655, "total_steps": 67140, "loss": 0.5209, "lr": 5.8974334773392924e-06, "epoch": 7.991510277033065, "percentage": 79.92, "elapsed_time": "3:42:32", "remaining_time": "0:55:55", "throughput": 2318.14, "total_tokens": 30953216} {"current_steps": 53660, "total_steps": 67140, "loss": 0.5345, "lr": 5.893241753949477e-06, "epoch": 7.9922549895740245, "percentage": 79.92, "elapsed_time": "3:42:33", "remaining_time": "0:55:54", "throughput": 2318.15, "total_tokens": 30956000} {"current_steps": 53665, "total_steps": 67140, "loss": 0.5994, "lr": 5.889051321716702e-06, "epoch": 7.992999702114983, "percentage": 79.93, "elapsed_time": "3:42:34", "remaining_time": "0:55:53", "throughput": 2318.18, "total_tokens": 30958944} {"current_steps": 53670, "total_steps": 67140, "loss": 0.4604, "lr": 5.8848621809241415e-06, "epoch": 7.993744414655943, "percentage": 79.94, "elapsed_time": "3:42:36", "remaining_time": "0:55:52", "throughput": 2318.2, "total_tokens": 30961984} {"current_steps": 53675, "total_steps": 67140, "loss": 0.5957, "lr": 5.880674331854882e-06, "epoch": 7.994489127196902, "percentage": 79.94, "elapsed_time": "3:42:37", "remaining_time": "0:55:50", "throughput": 2318.22, "total_tokens": 30964928} {"current_steps": 53680, "total_steps": 67140, "loss": 0.5825, "lr": 5.876487774791914e-06, "epoch": 7.995233839737861, "percentage": 79.95, "elapsed_time": "3:42:38", "remaining_time": "0:55:49", "throughput": 2318.23, "total_tokens": 30967552} {"current_steps": 53685, "total_steps": 67140, "loss": 0.53, "lr": 5.872302510018149e-06, "epoch": 7.99597855227882, "percentage": 79.96, "elapsed_time": "3:42:39", "remaining_time": "0:55:48", "throughput": 2318.25, "total_tokens": 30970528} {"current_steps": 53690, "total_steps": 67140, "loss": 0.6082, "lr": 5.8681185378164224e-06, "epoch": 7.99672326481978, "percentage": 79.97, "elapsed_time": "3:42:40", "remaining_time": "0:55:46", "throughput": 2318.28, "total_tokens": 30973600} {"current_steps": 53695, "total_steps": 67140, "loss": 0.5779, "lr": 5.863935858469452e-06, "epoch": 7.9974679773607384, "percentage": 79.97, "elapsed_time": "3:42:41", "remaining_time": "0:55:45", "throughput": 2318.29, "total_tokens": 30976320} {"current_steps": 53700, "total_steps": 67140, "loss": 0.5796, "lr": 5.859754472259893e-06, "epoch": 7.998212689901698, "percentage": 79.98, "elapsed_time": "3:42:42", "remaining_time": "0:55:44", "throughput": 2318.29, "total_tokens": 30978880} {"current_steps": 53705, "total_steps": 67140, "loss": 0.7507, "lr": 5.855574379470311e-06, "epoch": 7.998957402442657, "percentage": 79.99, "elapsed_time": "3:42:43", "remaining_time": "0:55:43", "throughput": 2318.3, "total_tokens": 30981632} {"current_steps": 53710, "total_steps": 67140, "loss": 0.5107, "lr": 5.851395580383182e-06, "epoch": 7.9997021149836165, "percentage": 80.0, "elapsed_time": "3:42:45", "remaining_time": "0:55:41", "throughput": 2318.33, "total_tokens": 30984608} {"current_steps": 53712, "total_steps": 67140, "eval_loss": 0.6710728406906128, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "3:43:59", "remaining_time": "0:55:59", "throughput": 2305.49, "total_tokens": 30985288} {"current_steps": 53715, "total_steps": 67140, "loss": 0.4861, "lr": 5.8472180752808805e-06, "epoch": 8.000446827524575, "percentage": 80.0, "elapsed_time": "3:44:02", "remaining_time": "0:55:59", "throughput": 2305.15, "total_tokens": 30986824} {"current_steps": 53720, "total_steps": 67140, "loss": 0.6092, "lr": 5.843041864445714e-06, "epoch": 8.001191540065534, "percentage": 80.01, "elapsed_time": "3:44:03", "remaining_time": "0:55:58", "throughput": 2305.18, "total_tokens": 30989800} {"current_steps": 53725, "total_steps": 67140, "loss": 0.4512, "lr": 5.838866948159888e-06, "epoch": 8.001936252606495, "percentage": 80.02, "elapsed_time": "3:44:04", "remaining_time": "0:55:57", "throughput": 2305.19, "total_tokens": 30992520} {"current_steps": 53730, "total_steps": 67140, "loss": 0.5141, "lr": 5.8346933267055394e-06, "epoch": 8.002680965147453, "percentage": 80.03, "elapsed_time": "3:44:05", "remaining_time": "0:55:55", "throughput": 2305.2, "total_tokens": 30995336} {"current_steps": 53735, "total_steps": 67140, "loss": 0.6592, "lr": 5.830521000364689e-06, "epoch": 8.003425677688412, "percentage": 80.03, "elapsed_time": "3:44:06", "remaining_time": "0:55:54", "throughput": 2305.23, "total_tokens": 30998312} {"current_steps": 53740, "total_steps": 67140, "loss": 0.7474, "lr": 5.826349969419292e-06, "epoch": 8.00417039022937, "percentage": 80.04, "elapsed_time": "3:44:08", "remaining_time": "0:55:53", "throughput": 2305.26, "total_tokens": 31001480} {"current_steps": 53745, "total_steps": 67140, "loss": 0.6291, "lr": 5.822180234151214e-06, "epoch": 8.004915102770331, "percentage": 80.05, "elapsed_time": "3:44:09", "remaining_time": "0:55:51", "throughput": 2305.27, "total_tokens": 31004232} {"current_steps": 53750, "total_steps": 67140, "loss": 0.7795, "lr": 5.818011794842221e-06, "epoch": 8.00565981531129, "percentage": 80.06, "elapsed_time": "3:44:10", "remaining_time": "0:55:50", "throughput": 2305.3, "total_tokens": 31007176} {"current_steps": 53755, "total_steps": 67140, "loss": 0.7803, "lr": 5.8138446517740005e-06, "epoch": 8.006404527852249, "percentage": 80.06, "elapsed_time": "3:44:11", "remaining_time": "0:55:49", "throughput": 2305.32, "total_tokens": 31010184} {"current_steps": 53760, "total_steps": 67140, "loss": 0.441, "lr": 5.809678805228152e-06, "epoch": 8.007149240393208, "percentage": 80.07, "elapsed_time": "3:44:12", "remaining_time": "0:55:48", "throughput": 2305.34, "total_tokens": 31013192} {"current_steps": 53765, "total_steps": 67140, "loss": 0.5363, "lr": 5.805514255486191e-06, "epoch": 8.007893952934168, "percentage": 80.08, "elapsed_time": "3:44:13", "remaining_time": "0:55:46", "throughput": 2305.36, "total_tokens": 31016072} {"current_steps": 53770, "total_steps": 67140, "loss": 0.5745, "lr": 5.801351002829542e-06, "epoch": 8.008638665475127, "percentage": 80.09, "elapsed_time": "3:44:15", "remaining_time": "0:55:45", "throughput": 2305.38, "total_tokens": 31018952} {"current_steps": 53775, "total_steps": 67140, "loss": 0.6512, "lr": 5.797189047539531e-06, "epoch": 8.009383378016086, "percentage": 80.09, "elapsed_time": "3:44:16", "remaining_time": "0:55:44", "throughput": 2305.41, "total_tokens": 31021864} {"current_steps": 53780, "total_steps": 67140, "loss": 0.567, "lr": 5.793028389897418e-06, "epoch": 8.010128090557044, "percentage": 80.1, "elapsed_time": "3:44:17", "remaining_time": "0:55:43", "throughput": 2305.42, "total_tokens": 31024648} {"current_steps": 53785, "total_steps": 67140, "loss": 0.5447, "lr": 5.788869030184346e-06, "epoch": 8.010872803098005, "percentage": 80.11, "elapsed_time": "3:44:18", "remaining_time": "0:55:41", "throughput": 2305.44, "total_tokens": 31027528} {"current_steps": 53790, "total_steps": 67140, "loss": 0.7016, "lr": 5.784710968681403e-06, "epoch": 8.011617515638964, "percentage": 80.12, "elapsed_time": "3:44:19", "remaining_time": "0:55:40", "throughput": 2305.45, "total_tokens": 31030248} {"current_steps": 53795, "total_steps": 67140, "loss": 0.7551, "lr": 5.780554205669567e-06, "epoch": 8.012362228179922, "percentage": 80.12, "elapsed_time": "3:44:20", "remaining_time": "0:55:39", "throughput": 2305.46, "total_tokens": 31033000} {"current_steps": 53800, "total_steps": 67140, "loss": 0.5178, "lr": 5.776398741429737e-06, "epoch": 8.013106940720881, "percentage": 80.13, "elapsed_time": "3:44:21", "remaining_time": "0:55:37", "throughput": 2305.48, "total_tokens": 31035848} {"current_steps": 53805, "total_steps": 67140, "loss": 0.4399, "lr": 5.77224457624273e-06, "epoch": 8.013851653261842, "percentage": 80.14, "elapsed_time": "3:44:22", "remaining_time": "0:55:36", "throughput": 2305.51, "total_tokens": 31038952} {"current_steps": 53810, "total_steps": 67140, "loss": 0.65, "lr": 5.768091710389254e-06, "epoch": 8.0145963658028, "percentage": 80.15, "elapsed_time": "3:44:24", "remaining_time": "0:55:35", "throughput": 2305.54, "total_tokens": 31042088} {"current_steps": 53815, "total_steps": 67140, "loss": 0.7132, "lr": 5.763940144149954e-06, "epoch": 8.01534107834376, "percentage": 80.15, "elapsed_time": "3:44:25", "remaining_time": "0:55:34", "throughput": 2305.56, "total_tokens": 31044840} {"current_steps": 53820, "total_steps": 67140, "loss": 0.5554, "lr": 5.759789877805363e-06, "epoch": 8.016085790884718, "percentage": 80.16, "elapsed_time": "3:44:26", "remaining_time": "0:55:32", "throughput": 2305.58, "total_tokens": 31047752} {"current_steps": 53825, "total_steps": 67140, "loss": 0.6208, "lr": 5.755640911635951e-06, "epoch": 8.016830503425677, "percentage": 80.17, "elapsed_time": "3:44:27", "remaining_time": "0:55:31", "throughput": 2305.61, "total_tokens": 31050824} {"current_steps": 53830, "total_steps": 67140, "loss": 0.6471, "lr": 5.7514932459220825e-06, "epoch": 8.017575215966637, "percentage": 80.18, "elapsed_time": "3:44:28", "remaining_time": "0:55:30", "throughput": 2305.63, "total_tokens": 31053672} {"current_steps": 53835, "total_steps": 67140, "loss": 0.5333, "lr": 5.747346880944041e-06, "epoch": 8.018319928507596, "percentage": 80.18, "elapsed_time": "3:44:29", "remaining_time": "0:55:28", "throughput": 2305.63, "total_tokens": 31056232} {"current_steps": 53840, "total_steps": 67140, "loss": 0.5486, "lr": 5.743201816982027e-06, "epoch": 8.019064641048555, "percentage": 80.19, "elapsed_time": "3:44:30", "remaining_time": "0:55:27", "throughput": 2305.66, "total_tokens": 31059304} {"current_steps": 53845, "total_steps": 67140, "loss": 0.436, "lr": 5.739058054316138e-06, "epoch": 8.019809353589514, "percentage": 80.2, "elapsed_time": "3:44:32", "remaining_time": "0:55:26", "throughput": 2305.69, "total_tokens": 31062376} {"current_steps": 53850, "total_steps": 67140, "loss": 0.5934, "lr": 5.7349155932264035e-06, "epoch": 8.020554066130474, "percentage": 80.21, "elapsed_time": "3:44:33", "remaining_time": "0:55:25", "throughput": 2305.71, "total_tokens": 31065352} {"current_steps": 53855, "total_steps": 67140, "loss": 0.7285, "lr": 5.730774433992739e-06, "epoch": 8.021298778671433, "percentage": 80.21, "elapsed_time": "3:44:34", "remaining_time": "0:55:23", "throughput": 2305.73, "total_tokens": 31068168} {"current_steps": 53860, "total_steps": 67140, "loss": 0.6901, "lr": 5.726634576894993e-06, "epoch": 8.022043491212392, "percentage": 80.22, "elapsed_time": "3:44:35", "remaining_time": "0:55:22", "throughput": 2305.76, "total_tokens": 31071208} {"current_steps": 53865, "total_steps": 67140, "loss": 0.4738, "lr": 5.7224960222129255e-06, "epoch": 8.02278820375335, "percentage": 80.23, "elapsed_time": "3:44:36", "remaining_time": "0:55:21", "throughput": 2305.78, "total_tokens": 31074184} {"current_steps": 53870, "total_steps": 67140, "loss": 0.4762, "lr": 5.718358770226201e-06, "epoch": 8.023532916294311, "percentage": 80.24, "elapsed_time": "3:44:37", "remaining_time": "0:55:20", "throughput": 2305.79, "total_tokens": 31077032} {"current_steps": 53875, "total_steps": 67140, "loss": 0.5011, "lr": 5.714222821214402e-06, "epoch": 8.02427762883527, "percentage": 80.24, "elapsed_time": "3:44:38", "remaining_time": "0:55:18", "throughput": 2305.79, "total_tokens": 31079528} {"current_steps": 53880, "total_steps": 67140, "loss": 0.6267, "lr": 5.710088175457007e-06, "epoch": 8.025022341376228, "percentage": 80.25, "elapsed_time": "3:44:40", "remaining_time": "0:55:17", "throughput": 2305.81, "total_tokens": 31082408} {"current_steps": 53885, "total_steps": 67140, "loss": 0.5281, "lr": 5.705954833233429e-06, "epoch": 8.025767053917187, "percentage": 80.26, "elapsed_time": "3:44:41", "remaining_time": "0:55:16", "throughput": 2305.82, "total_tokens": 31085096} {"current_steps": 53890, "total_steps": 67140, "loss": 0.6034, "lr": 5.701822794822978e-06, "epoch": 8.026511766458148, "percentage": 80.27, "elapsed_time": "3:44:42", "remaining_time": "0:55:14", "throughput": 2305.86, "total_tokens": 31088296} {"current_steps": 53895, "total_steps": 67140, "loss": 0.6148, "lr": 5.6976920605048885e-06, "epoch": 8.027256478999107, "percentage": 80.27, "elapsed_time": "3:44:43", "remaining_time": "0:55:13", "throughput": 2305.89, "total_tokens": 31091432} {"current_steps": 53900, "total_steps": 67140, "loss": 0.7181, "lr": 5.6935626305582855e-06, "epoch": 8.028001191540065, "percentage": 80.28, "elapsed_time": "3:44:44", "remaining_time": "0:55:12", "throughput": 2305.92, "total_tokens": 31094536} {"current_steps": 53905, "total_steps": 67140, "loss": 0.5662, "lr": 5.6894345052622255e-06, "epoch": 8.028745904081024, "percentage": 80.29, "elapsed_time": "3:44:45", "remaining_time": "0:55:11", "throughput": 2305.95, "total_tokens": 31097512} {"current_steps": 53910, "total_steps": 67140, "loss": 0.6264, "lr": 5.685307684895677e-06, "epoch": 8.029490616621985, "percentage": 80.29, "elapsed_time": "3:44:46", "remaining_time": "0:55:09", "throughput": 2305.97, "total_tokens": 31100392} {"current_steps": 53915, "total_steps": 67140, "loss": 0.5211, "lr": 5.6811821697375005e-06, "epoch": 8.030235329162943, "percentage": 80.3, "elapsed_time": "3:44:48", "remaining_time": "0:55:08", "throughput": 2305.97, "total_tokens": 31103080} {"current_steps": 53920, "total_steps": 67140, "loss": 0.6749, "lr": 5.67705796006649e-06, "epoch": 8.030980041703902, "percentage": 80.31, "elapsed_time": "3:44:49", "remaining_time": "0:55:07", "throughput": 2306.01, "total_tokens": 31106344} {"current_steps": 53925, "total_steps": 67140, "loss": 0.5818, "lr": 5.672935056161338e-06, "epoch": 8.03172475424486, "percentage": 80.32, "elapsed_time": "3:44:50", "remaining_time": "0:55:05", "throughput": 2306.03, "total_tokens": 31109320} {"current_steps": 53930, "total_steps": 67140, "loss": 0.7112, "lr": 5.668813458300659e-06, "epoch": 8.032469466785821, "percentage": 80.32, "elapsed_time": "3:44:51", "remaining_time": "0:55:04", "throughput": 2306.05, "total_tokens": 31112072} {"current_steps": 53935, "total_steps": 67140, "loss": 0.7468, "lr": 5.664693166762977e-06, "epoch": 8.03321417932678, "percentage": 80.33, "elapsed_time": "3:44:52", "remaining_time": "0:55:03", "throughput": 2306.06, "total_tokens": 31114824} {"current_steps": 53940, "total_steps": 67140, "loss": 0.576, "lr": 5.660574181826714e-06, "epoch": 8.033958891867739, "percentage": 80.34, "elapsed_time": "3:44:53", "remaining_time": "0:55:02", "throughput": 2306.07, "total_tokens": 31117640} {"current_steps": 53945, "total_steps": 67140, "loss": 0.454, "lr": 5.656456503770227e-06, "epoch": 8.034703604408698, "percentage": 80.35, "elapsed_time": "3:44:54", "remaining_time": "0:55:00", "throughput": 2306.11, "total_tokens": 31120840} {"current_steps": 53950, "total_steps": 67140, "loss": 0.4329, "lr": 5.652340132871756e-06, "epoch": 8.035448316949658, "percentage": 80.35, "elapsed_time": "3:44:56", "remaining_time": "0:54:59", "throughput": 2306.15, "total_tokens": 31124104} {"current_steps": 53955, "total_steps": 67140, "loss": 0.635, "lr": 5.648225069409477e-06, "epoch": 8.036193029490617, "percentage": 80.36, "elapsed_time": "3:44:57", "remaining_time": "0:54:58", "throughput": 2306.15, "total_tokens": 31126728} {"current_steps": 53960, "total_steps": 67140, "loss": 0.5311, "lr": 5.644111313661471e-06, "epoch": 8.036937742031576, "percentage": 80.37, "elapsed_time": "3:44:58", "remaining_time": "0:54:57", "throughput": 2306.16, "total_tokens": 31129480} {"current_steps": 53965, "total_steps": 67140, "loss": 0.6615, "lr": 5.639998865905724e-06, "epoch": 8.037682454572534, "percentage": 80.38, "elapsed_time": "3:44:59", "remaining_time": "0:54:55", "throughput": 2306.2, "total_tokens": 31132584} {"current_steps": 53970, "total_steps": 67140, "loss": 0.7071, "lr": 5.63588772642015e-06, "epoch": 8.038427167113495, "percentage": 80.38, "elapsed_time": "3:45:00", "remaining_time": "0:54:54", "throughput": 2306.23, "total_tokens": 31135848} {"current_steps": 53975, "total_steps": 67140, "loss": 0.6542, "lr": 5.631777895482549e-06, "epoch": 8.039171879654454, "percentage": 80.39, "elapsed_time": "3:45:01", "remaining_time": "0:54:53", "throughput": 2306.25, "total_tokens": 31138792} {"current_steps": 53980, "total_steps": 67140, "loss": 0.632, "lr": 5.627669373370658e-06, "epoch": 8.039916592195413, "percentage": 80.4, "elapsed_time": "3:45:03", "remaining_time": "0:54:51", "throughput": 2306.27, "total_tokens": 31141704} {"current_steps": 53985, "total_steps": 67140, "loss": 0.5292, "lr": 5.6235621603621004e-06, "epoch": 8.040661304736371, "percentage": 80.41, "elapsed_time": "3:45:04", "remaining_time": "0:54:50", "throughput": 2306.29, "total_tokens": 31144552} {"current_steps": 53990, "total_steps": 67140, "loss": 0.4176, "lr": 5.619456256734434e-06, "epoch": 8.041406017277332, "percentage": 80.41, "elapsed_time": "3:45:05", "remaining_time": "0:54:49", "throughput": 2306.31, "total_tokens": 31147560} {"current_steps": 53995, "total_steps": 67140, "loss": 0.4966, "lr": 5.61535166276512e-06, "epoch": 8.04215072981829, "percentage": 80.42, "elapsed_time": "3:45:06", "remaining_time": "0:54:48", "throughput": 2306.34, "total_tokens": 31150568} {"current_steps": 54000, "total_steps": 67140, "loss": 0.5861, "lr": 5.611248378731526e-06, "epoch": 8.04289544235925, "percentage": 80.43, "elapsed_time": "3:45:07", "remaining_time": "0:54:46", "throughput": 2306.36, "total_tokens": 31153512} {"current_steps": 54005, "total_steps": 67140, "loss": 0.6458, "lr": 5.607146404910949e-06, "epoch": 8.043640154900208, "percentage": 80.44, "elapsed_time": "3:45:08", "remaining_time": "0:54:45", "throughput": 2306.37, "total_tokens": 31156232} {"current_steps": 54010, "total_steps": 67140, "loss": 0.7964, "lr": 5.603045741580559e-06, "epoch": 8.044384867441167, "percentage": 80.44, "elapsed_time": "3:45:09", "remaining_time": "0:54:44", "throughput": 2306.39, "total_tokens": 31159048} {"current_steps": 54015, "total_steps": 67140, "loss": 0.6374, "lr": 5.598946389017487e-06, "epoch": 8.045129579982127, "percentage": 80.45, "elapsed_time": "3:45:11", "remaining_time": "0:54:43", "throughput": 2306.41, "total_tokens": 31161928} {"current_steps": 54020, "total_steps": 67140, "loss": 0.6489, "lr": 5.59484834749873e-06, "epoch": 8.045874292523086, "percentage": 80.46, "elapsed_time": "3:45:12", "remaining_time": "0:54:41", "throughput": 2306.43, "total_tokens": 31164776} {"current_steps": 54025, "total_steps": 67140, "loss": 0.6038, "lr": 5.590751617301226e-06, "epoch": 8.046619005064045, "percentage": 80.47, "elapsed_time": "3:45:13", "remaining_time": "0:54:40", "throughput": 2306.46, "total_tokens": 31167944} {"current_steps": 54030, "total_steps": 67140, "loss": 0.4737, "lr": 5.5866561987018176e-06, "epoch": 8.047363717605004, "percentage": 80.47, "elapsed_time": "3:45:14", "remaining_time": "0:54:39", "throughput": 2306.47, "total_tokens": 31170536} {"current_steps": 54035, "total_steps": 67140, "loss": 0.6441, "lr": 5.582562091977253e-06, "epoch": 8.048108430145964, "percentage": 80.48, "elapsed_time": "3:45:15", "remaining_time": "0:54:37", "throughput": 2306.5, "total_tokens": 31173736} {"current_steps": 54040, "total_steps": 67140, "loss": 0.8055, "lr": 5.578469297404204e-06, "epoch": 8.048853142686923, "percentage": 80.49, "elapsed_time": "3:45:16", "remaining_time": "0:54:36", "throughput": 2306.53, "total_tokens": 31176872} {"current_steps": 54045, "total_steps": 67140, "loss": 0.6069, "lr": 5.574377815259229e-06, "epoch": 8.049597855227882, "percentage": 80.5, "elapsed_time": "3:45:17", "remaining_time": "0:54:35", "throughput": 2306.55, "total_tokens": 31179784} {"current_steps": 54050, "total_steps": 67140, "loss": 0.5411, "lr": 5.570287645818825e-06, "epoch": 8.05034256776884, "percentage": 80.5, "elapsed_time": "3:45:19", "remaining_time": "0:54:34", "throughput": 2306.57, "total_tokens": 31182536} {"current_steps": 54055, "total_steps": 67140, "loss": 0.6019, "lr": 5.566198789359392e-06, "epoch": 8.051087280309801, "percentage": 80.51, "elapsed_time": "3:45:20", "remaining_time": "0:54:32", "throughput": 2306.58, "total_tokens": 31185352} {"current_steps": 54060, "total_steps": 67140, "loss": 0.7081, "lr": 5.562111246157228e-06, "epoch": 8.05183199285076, "percentage": 80.52, "elapsed_time": "3:45:21", "remaining_time": "0:54:31", "throughput": 2306.61, "total_tokens": 31188360} {"current_steps": 54065, "total_steps": 67140, "loss": 0.6414, "lr": 5.558025016488555e-06, "epoch": 8.052576705391719, "percentage": 80.53, "elapsed_time": "3:45:22", "remaining_time": "0:54:30", "throughput": 2306.63, "total_tokens": 31191272} {"current_steps": 54070, "total_steps": 67140, "loss": 0.4632, "lr": 5.553940100629507e-06, "epoch": 8.053321417932677, "percentage": 80.53, "elapsed_time": "3:45:23", "remaining_time": "0:54:28", "throughput": 2306.64, "total_tokens": 31193992} {"current_steps": 54075, "total_steps": 67140, "loss": 0.3858, "lr": 5.549856498856129e-06, "epoch": 8.054066130473638, "percentage": 80.54, "elapsed_time": "3:45:24", "remaining_time": "0:54:27", "throughput": 2306.65, "total_tokens": 31196712} {"current_steps": 54080, "total_steps": 67140, "loss": 0.6632, "lr": 5.545774211444369e-06, "epoch": 8.054810843014597, "percentage": 80.55, "elapsed_time": "3:45:25", "remaining_time": "0:54:26", "throughput": 2306.69, "total_tokens": 31199848} {"current_steps": 54085, "total_steps": 67140, "loss": 0.6288, "lr": 5.541693238670087e-06, "epoch": 8.055555555555555, "percentage": 80.56, "elapsed_time": "3:45:26", "remaining_time": "0:54:25", "throughput": 2306.7, "total_tokens": 31202696} {"current_steps": 54090, "total_steps": 67140, "loss": 0.4712, "lr": 5.537613580809067e-06, "epoch": 8.056300268096514, "percentage": 80.56, "elapsed_time": "3:45:28", "remaining_time": "0:54:23", "throughput": 2306.71, "total_tokens": 31205320} {"current_steps": 54095, "total_steps": 67140, "loss": 0.6069, "lr": 5.533535238137e-06, "epoch": 8.057044980637475, "percentage": 80.57, "elapsed_time": "3:45:29", "remaining_time": "0:54:22", "throughput": 2306.75, "total_tokens": 31208584} {"current_steps": 54100, "total_steps": 67140, "loss": 0.4445, "lr": 5.5294582109294696e-06, "epoch": 8.057789693178433, "percentage": 80.58, "elapsed_time": "3:45:30", "remaining_time": "0:54:21", "throughput": 2306.78, "total_tokens": 31211624} {"current_steps": 54105, "total_steps": 67140, "loss": 0.5212, "lr": 5.525382499461993e-06, "epoch": 8.058534405719392, "percentage": 80.59, "elapsed_time": "3:45:31", "remaining_time": "0:54:20", "throughput": 2306.79, "total_tokens": 31214376} {"current_steps": 54110, "total_steps": 67140, "loss": 0.5874, "lr": 5.521308104009992e-06, "epoch": 8.059279118260351, "percentage": 80.59, "elapsed_time": "3:45:32", "remaining_time": "0:54:18", "throughput": 2306.81, "total_tokens": 31217288} {"current_steps": 54115, "total_steps": 67140, "loss": 0.5361, "lr": 5.517235024848791e-06, "epoch": 8.060023830801311, "percentage": 80.6, "elapsed_time": "3:45:33", "remaining_time": "0:54:17", "throughput": 2306.82, "total_tokens": 31220040} {"current_steps": 54120, "total_steps": 67140, "loss": 0.5367, "lr": 5.513163262253635e-06, "epoch": 8.06076854334227, "percentage": 80.61, "elapsed_time": "3:45:34", "remaining_time": "0:54:16", "throughput": 2306.85, "total_tokens": 31222984} {"current_steps": 54125, "total_steps": 67140, "loss": 0.4809, "lr": 5.509092816499678e-06, "epoch": 8.061513255883229, "percentage": 80.62, "elapsed_time": "3:45:36", "remaining_time": "0:54:14", "throughput": 2306.87, "total_tokens": 31225928} {"current_steps": 54130, "total_steps": 67140, "loss": 0.5171, "lr": 5.505023687861985e-06, "epoch": 8.062257968424188, "percentage": 80.62, "elapsed_time": "3:45:37", "remaining_time": "0:54:13", "throughput": 2306.91, "total_tokens": 31229192} {"current_steps": 54135, "total_steps": 67140, "loss": 0.4943, "lr": 5.500955876615538e-06, "epoch": 8.063002680965148, "percentage": 80.63, "elapsed_time": "3:45:38", "remaining_time": "0:54:12", "throughput": 2306.93, "total_tokens": 31232136} {"current_steps": 54140, "total_steps": 67140, "loss": 0.6409, "lr": 5.496889383035206e-06, "epoch": 8.063747393506107, "percentage": 80.64, "elapsed_time": "3:45:39", "remaining_time": "0:54:11", "throughput": 2306.95, "total_tokens": 31235080} {"current_steps": 54145, "total_steps": 67140, "loss": 0.5772, "lr": 5.492824207395805e-06, "epoch": 8.064492106047066, "percentage": 80.64, "elapsed_time": "3:45:40", "remaining_time": "0:54:09", "throughput": 2306.98, "total_tokens": 31238152} {"current_steps": 54150, "total_steps": 67140, "loss": 0.4736, "lr": 5.4887603499720244e-06, "epoch": 8.065236818588025, "percentage": 80.65, "elapsed_time": "3:45:41", "remaining_time": "0:54:08", "throughput": 2307.0, "total_tokens": 31240968} {"current_steps": 54155, "total_steps": 67140, "loss": 0.4971, "lr": 5.484697811038494e-06, "epoch": 8.065981531128985, "percentage": 80.66, "elapsed_time": "3:45:42", "remaining_time": "0:54:07", "throughput": 2307.02, "total_tokens": 31243880} {"current_steps": 54160, "total_steps": 67140, "loss": 0.7, "lr": 5.480636590869742e-06, "epoch": 8.066726243669944, "percentage": 80.67, "elapsed_time": "3:45:44", "remaining_time": "0:54:05", "throughput": 2307.05, "total_tokens": 31246888} {"current_steps": 54165, "total_steps": 67140, "loss": 0.5146, "lr": 5.476576689740209e-06, "epoch": 8.067470956210903, "percentage": 80.67, "elapsed_time": "3:45:45", "remaining_time": "0:54:04", "throughput": 2307.08, "total_tokens": 31250120} {"current_steps": 54170, "total_steps": 67140, "loss": 0.5803, "lr": 5.472518107924255e-06, "epoch": 8.068215668751861, "percentage": 80.68, "elapsed_time": "3:45:46", "remaining_time": "0:54:03", "throughput": 2307.11, "total_tokens": 31253128} {"current_steps": 54175, "total_steps": 67140, "loss": 0.6023, "lr": 5.468460845696133e-06, "epoch": 8.06896038129282, "percentage": 80.69, "elapsed_time": "3:45:47", "remaining_time": "0:54:02", "throughput": 2307.12, "total_tokens": 31255944} {"current_steps": 54180, "total_steps": 67140, "loss": 0.5415, "lr": 5.4644049033300085e-06, "epoch": 8.06970509383378, "percentage": 80.7, "elapsed_time": "3:45:48", "remaining_time": "0:54:00", "throughput": 2307.14, "total_tokens": 31258760} {"current_steps": 54185, "total_steps": 67140, "loss": 0.5231, "lr": 5.460350281099977e-06, "epoch": 8.07044980637474, "percentage": 80.7, "elapsed_time": "3:45:49", "remaining_time": "0:53:59", "throughput": 2307.16, "total_tokens": 31261672} {"current_steps": 54190, "total_steps": 67140, "loss": 0.5626, "lr": 5.4562969792800315e-06, "epoch": 8.071194518915698, "percentage": 80.71, "elapsed_time": "3:45:51", "remaining_time": "0:53:58", "throughput": 2307.18, "total_tokens": 31264552} {"current_steps": 54195, "total_steps": 67140, "loss": 0.5979, "lr": 5.452244998144076e-06, "epoch": 8.071939231456657, "percentage": 80.72, "elapsed_time": "3:45:52", "remaining_time": "0:53:57", "throughput": 2307.2, "total_tokens": 31267464} {"current_steps": 54200, "total_steps": 67140, "loss": 0.5026, "lr": 5.448194337965931e-06, "epoch": 8.072683943997617, "percentage": 80.73, "elapsed_time": "3:45:53", "remaining_time": "0:53:55", "throughput": 2307.2, "total_tokens": 31270024} {"current_steps": 54205, "total_steps": 67140, "loss": 0.6068, "lr": 5.444144999019324e-06, "epoch": 8.073428656538576, "percentage": 80.73, "elapsed_time": "3:45:54", "remaining_time": "0:53:54", "throughput": 2307.22, "total_tokens": 31272872} {"current_steps": 54210, "total_steps": 67140, "loss": 0.5757, "lr": 5.4400969815778854e-06, "epoch": 8.074173369079535, "percentage": 80.74, "elapsed_time": "3:45:55", "remaining_time": "0:53:53", "throughput": 2307.24, "total_tokens": 31275848} {"current_steps": 54215, "total_steps": 67140, "loss": 0.9031, "lr": 5.436050285915173e-06, "epoch": 8.074918081620494, "percentage": 80.75, "elapsed_time": "3:45:56", "remaining_time": "0:53:51", "throughput": 2307.27, "total_tokens": 31278824} {"current_steps": 54220, "total_steps": 67140, "loss": 0.6204, "lr": 5.432004912304636e-06, "epoch": 8.075662794161454, "percentage": 80.76, "elapsed_time": "3:45:57", "remaining_time": "0:53:50", "throughput": 2307.3, "total_tokens": 31282152} {"current_steps": 54225, "total_steps": 67140, "loss": 0.6366, "lr": 5.427960861019648e-06, "epoch": 8.076407506702413, "percentage": 80.76, "elapsed_time": "3:45:59", "remaining_time": "0:53:49", "throughput": 2307.32, "total_tokens": 31285032} {"current_steps": 54230, "total_steps": 67140, "loss": 0.4973, "lr": 5.423918132333491e-06, "epoch": 8.077152219243372, "percentage": 80.77, "elapsed_time": "3:46:00", "remaining_time": "0:53:48", "throughput": 2307.34, "total_tokens": 31287944} {"current_steps": 54235, "total_steps": 67140, "loss": 0.5077, "lr": 5.4198767265193574e-06, "epoch": 8.07789693178433, "percentage": 80.78, "elapsed_time": "3:46:01", "remaining_time": "0:53:46", "throughput": 2307.37, "total_tokens": 31290856} {"current_steps": 54240, "total_steps": 67140, "loss": 0.5528, "lr": 5.415836643850352e-06, "epoch": 8.078641644325291, "percentage": 80.79, "elapsed_time": "3:46:02", "remaining_time": "0:53:45", "throughput": 2307.38, "total_tokens": 31293704} {"current_steps": 54245, "total_steps": 67140, "loss": 0.5404, "lr": 5.411797884599479e-06, "epoch": 8.07938635686625, "percentage": 80.79, "elapsed_time": "3:46:03", "remaining_time": "0:53:44", "throughput": 2307.41, "total_tokens": 31296680} {"current_steps": 54250, "total_steps": 67140, "loss": 0.7356, "lr": 5.407760449039662e-06, "epoch": 8.080131069407209, "percentage": 80.8, "elapsed_time": "3:46:04", "remaining_time": "0:53:43", "throughput": 2307.43, "total_tokens": 31299528} {"current_steps": 54255, "total_steps": 67140, "loss": 0.7999, "lr": 5.403724337443747e-06, "epoch": 8.080875781948167, "percentage": 80.81, "elapsed_time": "3:46:05", "remaining_time": "0:53:41", "throughput": 2307.44, "total_tokens": 31302216} {"current_steps": 54260, "total_steps": 67140, "loss": 0.4748, "lr": 5.399689550084461e-06, "epoch": 8.081620494489128, "percentage": 80.82, "elapsed_time": "3:46:06", "remaining_time": "0:53:40", "throughput": 2307.46, "total_tokens": 31305128} {"current_steps": 54265, "total_steps": 67140, "loss": 0.5127, "lr": 5.395656087234466e-06, "epoch": 8.082365207030087, "percentage": 80.82, "elapsed_time": "3:46:08", "remaining_time": "0:53:39", "throughput": 2307.46, "total_tokens": 31307784} {"current_steps": 54270, "total_steps": 67140, "loss": 0.687, "lr": 5.391623949166327e-06, "epoch": 8.083109919571045, "percentage": 80.83, "elapsed_time": "3:46:09", "remaining_time": "0:53:37", "throughput": 2307.47, "total_tokens": 31310408} {"current_steps": 54275, "total_steps": 67140, "loss": 0.6292, "lr": 5.387593136152527e-06, "epoch": 8.083854632112004, "percentage": 80.84, "elapsed_time": "3:46:10", "remaining_time": "0:53:36", "throughput": 2307.5, "total_tokens": 31313576} {"current_steps": 54280, "total_steps": 67140, "loss": 0.6616, "lr": 5.383563648465437e-06, "epoch": 8.084599344652965, "percentage": 80.85, "elapsed_time": "3:46:11", "remaining_time": "0:53:35", "throughput": 2307.52, "total_tokens": 31316488} {"current_steps": 54285, "total_steps": 67140, "loss": 0.5666, "lr": 5.37953548637736e-06, "epoch": 8.085344057193923, "percentage": 80.85, "elapsed_time": "3:46:12", "remaining_time": "0:53:34", "throughput": 2307.54, "total_tokens": 31319336} {"current_steps": 54290, "total_steps": 67140, "loss": 0.3909, "lr": 5.375508650160507e-06, "epoch": 8.086088769734882, "percentage": 80.86, "elapsed_time": "3:46:13", "remaining_time": "0:53:32", "throughput": 2307.56, "total_tokens": 31322152} {"current_steps": 54295, "total_steps": 67140, "loss": 0.5012, "lr": 5.371483140086997e-06, "epoch": 8.086833482275841, "percentage": 80.87, "elapsed_time": "3:46:14", "remaining_time": "0:53:31", "throughput": 2307.58, "total_tokens": 31325064} {"current_steps": 54300, "total_steps": 67140, "loss": 0.3962, "lr": 5.367458956428845e-06, "epoch": 8.087578194816802, "percentage": 80.88, "elapsed_time": "3:46:16", "remaining_time": "0:53:30", "throughput": 2307.61, "total_tokens": 31328200} {"current_steps": 54305, "total_steps": 67140, "loss": 0.4704, "lr": 5.363436099457997e-06, "epoch": 8.08832290735776, "percentage": 80.88, "elapsed_time": "3:46:17", "remaining_time": "0:53:28", "throughput": 2307.63, "total_tokens": 31331176} {"current_steps": 54310, "total_steps": 67140, "loss": 0.5481, "lr": 5.359414569446308e-06, "epoch": 8.089067619898719, "percentage": 80.89, "elapsed_time": "3:46:18", "remaining_time": "0:53:27", "throughput": 2307.64, "total_tokens": 31333864} {"current_steps": 54315, "total_steps": 67140, "loss": 0.4411, "lr": 5.355394366665525e-06, "epoch": 8.089812332439678, "percentage": 80.9, "elapsed_time": "3:46:19", "remaining_time": "0:53:26", "throughput": 2307.66, "total_tokens": 31336648} {"current_steps": 54320, "total_steps": 67140, "loss": 0.4248, "lr": 5.35137549138732e-06, "epoch": 8.090557044980638, "percentage": 80.91, "elapsed_time": "3:46:20", "remaining_time": "0:53:25", "throughput": 2307.66, "total_tokens": 31339304} {"current_steps": 54325, "total_steps": 67140, "loss": 0.4012, "lr": 5.347357943883272e-06, "epoch": 8.091301757521597, "percentage": 80.91, "elapsed_time": "3:46:21", "remaining_time": "0:53:23", "throughput": 2307.68, "total_tokens": 31342024} {"current_steps": 54330, "total_steps": 67140, "loss": 0.611, "lr": 5.343341724424875e-06, "epoch": 8.092046470062556, "percentage": 80.92, "elapsed_time": "3:46:22", "remaining_time": "0:53:22", "throughput": 2307.7, "total_tokens": 31344968} {"current_steps": 54335, "total_steps": 67140, "loss": 0.5144, "lr": 5.339326833283531e-06, "epoch": 8.092791182603515, "percentage": 80.93, "elapsed_time": "3:46:23", "remaining_time": "0:53:21", "throughput": 2307.72, "total_tokens": 31347816} {"current_steps": 54340, "total_steps": 67140, "loss": 0.7245, "lr": 5.335313270730546e-06, "epoch": 8.093535895144473, "percentage": 80.94, "elapsed_time": "3:46:25", "remaining_time": "0:53:20", "throughput": 2307.73, "total_tokens": 31350536} {"current_steps": 54345, "total_steps": 67140, "loss": 0.5312, "lr": 5.331301037037132e-06, "epoch": 8.094280607685434, "percentage": 80.94, "elapsed_time": "3:46:26", "remaining_time": "0:53:18", "throughput": 2307.74, "total_tokens": 31353384} {"current_steps": 54350, "total_steps": 67140, "loss": 0.6679, "lr": 5.327290132474427e-06, "epoch": 8.095025320226393, "percentage": 80.95, "elapsed_time": "3:46:27", "remaining_time": "0:53:17", "throughput": 2307.78, "total_tokens": 31356584} {"current_steps": 54355, "total_steps": 67140, "loss": 0.5425, "lr": 5.323280557313473e-06, "epoch": 8.095770032767351, "percentage": 80.96, "elapsed_time": "3:46:28", "remaining_time": "0:53:16", "throughput": 2307.79, "total_tokens": 31359304} {"current_steps": 54360, "total_steps": 67140, "loss": 0.6401, "lr": 5.319272311825216e-06, "epoch": 8.09651474530831, "percentage": 80.97, "elapsed_time": "3:46:29", "remaining_time": "0:53:14", "throughput": 2307.81, "total_tokens": 31362216} {"current_steps": 54365, "total_steps": 67140, "loss": 0.7554, "lr": 5.315265396280522e-06, "epoch": 8.09725945784927, "percentage": 80.97, "elapsed_time": "3:46:30", "remaining_time": "0:53:13", "throughput": 2307.82, "total_tokens": 31364968} {"current_steps": 54370, "total_steps": 67140, "loss": 0.4816, "lr": 5.311259810950167e-06, "epoch": 8.09800417039023, "percentage": 80.98, "elapsed_time": "3:46:31", "remaining_time": "0:53:12", "throughput": 2307.85, "total_tokens": 31368072} {"current_steps": 54375, "total_steps": 67140, "loss": 0.5611, "lr": 5.3072555561048255e-06, "epoch": 8.098748882931188, "percentage": 80.99, "elapsed_time": "3:46:33", "remaining_time": "0:53:11", "throughput": 2307.86, "total_tokens": 31370728} {"current_steps": 54380, "total_steps": 67140, "loss": 0.5804, "lr": 5.303252632015082e-06, "epoch": 8.099493595472147, "percentage": 80.99, "elapsed_time": "3:46:34", "remaining_time": "0:53:09", "throughput": 2307.88, "total_tokens": 31373672} {"current_steps": 54385, "total_steps": 67140, "loss": 0.5411, "lr": 5.299251038951444e-06, "epoch": 8.100238308013108, "percentage": 81.0, "elapsed_time": "3:46:35", "remaining_time": "0:53:08", "throughput": 2307.9, "total_tokens": 31376616} {"current_steps": 54390, "total_steps": 67140, "loss": 0.5941, "lr": 5.295250777184324e-06, "epoch": 8.100983020554066, "percentage": 81.01, "elapsed_time": "3:46:36", "remaining_time": "0:53:07", "throughput": 2307.92, "total_tokens": 31379656} {"current_steps": 54395, "total_steps": 67140, "loss": 0.7539, "lr": 5.2912518469840436e-06, "epoch": 8.101727733095025, "percentage": 81.02, "elapsed_time": "3:46:37", "remaining_time": "0:53:05", "throughput": 2307.94, "total_tokens": 31382600} {"current_steps": 54400, "total_steps": 67140, "loss": 0.6445, "lr": 5.287254248620832e-06, "epoch": 8.102472445635984, "percentage": 81.02, "elapsed_time": "3:46:38", "remaining_time": "0:53:04", "throughput": 2307.96, "total_tokens": 31385352} {"current_steps": 54405, "total_steps": 67140, "loss": 0.4707, "lr": 5.283257982364839e-06, "epoch": 8.103217158176944, "percentage": 81.03, "elapsed_time": "3:46:39", "remaining_time": "0:53:03", "throughput": 2307.98, "total_tokens": 31388232} {"current_steps": 54410, "total_steps": 67140, "loss": 0.5514, "lr": 5.279263048486102e-06, "epoch": 8.103961870717903, "percentage": 81.04, "elapsed_time": "3:46:41", "remaining_time": "0:53:02", "throughput": 2307.99, "total_tokens": 31390952} {"current_steps": 54415, "total_steps": 67140, "loss": 0.4473, "lr": 5.275269447254597e-06, "epoch": 8.104706583258862, "percentage": 81.05, "elapsed_time": "3:46:42", "remaining_time": "0:53:00", "throughput": 2308.0, "total_tokens": 31393736} {"current_steps": 54420, "total_steps": 67140, "loss": 0.5122, "lr": 5.271277178940182e-06, "epoch": 8.10545129579982, "percentage": 81.05, "elapsed_time": "3:46:43", "remaining_time": "0:52:59", "throughput": 2308.03, "total_tokens": 31396776} {"current_steps": 54425, "total_steps": 67140, "loss": 0.5284, "lr": 5.267286243812641e-06, "epoch": 8.106196008340781, "percentage": 81.06, "elapsed_time": "3:46:44", "remaining_time": "0:52:58", "throughput": 2308.07, "total_tokens": 31400104} {"current_steps": 54430, "total_steps": 67140, "loss": 0.7258, "lr": 5.263296642141671e-06, "epoch": 8.10694072088174, "percentage": 81.07, "elapsed_time": "3:46:45", "remaining_time": "0:52:57", "throughput": 2308.09, "total_tokens": 31403016} {"current_steps": 54435, "total_steps": 67140, "loss": 0.4876, "lr": 5.25930837419687e-06, "epoch": 8.107685433422699, "percentage": 81.08, "elapsed_time": "3:46:46", "remaining_time": "0:52:55", "throughput": 2308.1, "total_tokens": 31405800} {"current_steps": 54440, "total_steps": 67140, "loss": 0.6273, "lr": 5.2553214402477565e-06, "epoch": 8.108430145963657, "percentage": 81.08, "elapsed_time": "3:46:47", "remaining_time": "0:52:54", "throughput": 2308.13, "total_tokens": 31408744} {"current_steps": 54445, "total_steps": 67140, "loss": 0.4779, "lr": 5.251335840563737e-06, "epoch": 8.109174858504618, "percentage": 81.09, "elapsed_time": "3:46:48", "remaining_time": "0:52:53", "throughput": 2308.14, "total_tokens": 31411432} {"current_steps": 54450, "total_steps": 67140, "loss": 0.654, "lr": 5.247351575414148e-06, "epoch": 8.109919571045577, "percentage": 81.1, "elapsed_time": "3:46:50", "remaining_time": "0:52:51", "throughput": 2308.16, "total_tokens": 31414408} {"current_steps": 54455, "total_steps": 67140, "loss": 0.5985, "lr": 5.243368645068239e-06, "epoch": 8.110664283586535, "percentage": 81.11, "elapsed_time": "3:46:51", "remaining_time": "0:52:50", "throughput": 2308.18, "total_tokens": 31417256} {"current_steps": 54460, "total_steps": 67140, "loss": 0.6721, "lr": 5.239387049795144e-06, "epoch": 8.111408996127494, "percentage": 81.11, "elapsed_time": "3:46:52", "remaining_time": "0:52:49", "throughput": 2308.19, "total_tokens": 31420040} {"current_steps": 54465, "total_steps": 67140, "loss": 0.5281, "lr": 5.235406789863934e-06, "epoch": 8.112153708668455, "percentage": 81.12, "elapsed_time": "3:46:53", "remaining_time": "0:52:48", "throughput": 2308.21, "total_tokens": 31422824} {"current_steps": 54470, "total_steps": 67140, "loss": 0.5513, "lr": 5.2314278655435726e-06, "epoch": 8.112898421209414, "percentage": 81.13, "elapsed_time": "3:46:54", "remaining_time": "0:52:46", "throughput": 2308.23, "total_tokens": 31425800} {"current_steps": 54475, "total_steps": 67140, "loss": 0.5725, "lr": 5.227450277102952e-06, "epoch": 8.113643133750372, "percentage": 81.14, "elapsed_time": "3:46:55", "remaining_time": "0:52:45", "throughput": 2308.25, "total_tokens": 31428744} {"current_steps": 54480, "total_steps": 67140, "loss": 0.6889, "lr": 5.223474024810846e-06, "epoch": 8.114387846291331, "percentage": 81.14, "elapsed_time": "3:46:56", "remaining_time": "0:52:44", "throughput": 2308.27, "total_tokens": 31431624} {"current_steps": 54485, "total_steps": 67140, "loss": 0.7407, "lr": 5.219499108935957e-06, "epoch": 8.115132558832292, "percentage": 81.15, "elapsed_time": "3:46:58", "remaining_time": "0:52:43", "throughput": 2308.29, "total_tokens": 31434536} {"current_steps": 54490, "total_steps": 67140, "loss": 0.483, "lr": 5.215525529746901e-06, "epoch": 8.11587727137325, "percentage": 81.16, "elapsed_time": "3:46:59", "remaining_time": "0:52:41", "throughput": 2308.31, "total_tokens": 31437416} {"current_steps": 54495, "total_steps": 67140, "loss": 0.6115, "lr": 5.211553287512189e-06, "epoch": 8.116621983914209, "percentage": 81.17, "elapsed_time": "3:47:00", "remaining_time": "0:52:40", "throughput": 2308.32, "total_tokens": 31440200} {"current_steps": 54500, "total_steps": 67140, "loss": 0.6815, "lr": 5.207582382500259e-06, "epoch": 8.117366696455168, "percentage": 81.17, "elapsed_time": "3:47:01", "remaining_time": "0:52:39", "throughput": 2308.35, "total_tokens": 31443240} {"current_steps": 54505, "total_steps": 67140, "loss": 0.6086, "lr": 5.203612814979442e-06, "epoch": 8.118111408996128, "percentage": 81.18, "elapsed_time": "3:47:02", "remaining_time": "0:52:37", "throughput": 2308.37, "total_tokens": 31446056} {"current_steps": 54510, "total_steps": 67140, "loss": 0.5897, "lr": 5.199644585217978e-06, "epoch": 8.118856121537087, "percentage": 81.19, "elapsed_time": "3:47:03", "remaining_time": "0:52:36", "throughput": 2308.39, "total_tokens": 31448968} {"current_steps": 54515, "total_steps": 67140, "loss": 0.6098, "lr": 5.19567769348403e-06, "epoch": 8.119600834078046, "percentage": 81.2, "elapsed_time": "3:47:04", "remaining_time": "0:52:35", "throughput": 2308.42, "total_tokens": 31452072} {"current_steps": 54520, "total_steps": 67140, "loss": 0.5041, "lr": 5.1917121400456654e-06, "epoch": 8.120345546619005, "percentage": 81.2, "elapsed_time": "3:47:06", "remaining_time": "0:52:34", "throughput": 2308.45, "total_tokens": 31455208} {"current_steps": 54525, "total_steps": 67140, "loss": 0.6462, "lr": 5.187747925170858e-06, "epoch": 8.121090259159963, "percentage": 81.21, "elapsed_time": "3:47:07", "remaining_time": "0:52:32", "throughput": 2308.47, "total_tokens": 31458120} {"current_steps": 54530, "total_steps": 67140, "loss": 0.5351, "lr": 5.1837850491274985e-06, "epoch": 8.121834971700924, "percentage": 81.22, "elapsed_time": "3:47:08", "remaining_time": "0:52:31", "throughput": 2308.48, "total_tokens": 31460712} {"current_steps": 54535, "total_steps": 67140, "loss": 0.5818, "lr": 5.179823512183382e-06, "epoch": 8.122579684241883, "percentage": 81.23, "elapsed_time": "3:47:09", "remaining_time": "0:52:30", "throughput": 2308.5, "total_tokens": 31463656} {"current_steps": 54540, "total_steps": 67140, "loss": 0.5297, "lr": 5.175863314606211e-06, "epoch": 8.123324396782841, "percentage": 81.23, "elapsed_time": "3:47:10", "remaining_time": "0:52:28", "throughput": 2308.51, "total_tokens": 31466504} {"current_steps": 54545, "total_steps": 67140, "loss": 0.5835, "lr": 5.171904456663592e-06, "epoch": 8.1240691093238, "percentage": 81.24, "elapsed_time": "3:47:11", "remaining_time": "0:52:27", "throughput": 2308.55, "total_tokens": 31469800} {"current_steps": 54550, "total_steps": 67140, "loss": 0.6853, "lr": 5.167946938623053e-06, "epoch": 8.12481382186476, "percentage": 81.25, "elapsed_time": "3:47:12", "remaining_time": "0:52:26", "throughput": 2308.57, "total_tokens": 31472680} {"current_steps": 54555, "total_steps": 67140, "loss": 0.3009, "lr": 5.16399076075203e-06, "epoch": 8.12555853440572, "percentage": 81.26, "elapsed_time": "3:47:14", "remaining_time": "0:52:25", "throughput": 2308.59, "total_tokens": 31475496} {"current_steps": 54560, "total_steps": 67140, "loss": 0.5461, "lr": 5.160035923317863e-06, "epoch": 8.126303246946678, "percentage": 81.26, "elapsed_time": "3:47:15", "remaining_time": "0:52:23", "throughput": 2308.61, "total_tokens": 31478408} {"current_steps": 54565, "total_steps": 67140, "loss": 0.7231, "lr": 5.156082426587808e-06, "epoch": 8.127047959487637, "percentage": 81.27, "elapsed_time": "3:47:16", "remaining_time": "0:52:22", "throughput": 2308.63, "total_tokens": 31481480} {"current_steps": 54570, "total_steps": 67140, "loss": 0.5589, "lr": 5.152130270829025e-06, "epoch": 8.127792672028598, "percentage": 81.28, "elapsed_time": "3:47:17", "remaining_time": "0:52:21", "throughput": 2308.65, "total_tokens": 31484232} {"current_steps": 54575, "total_steps": 67140, "loss": 0.61, "lr": 5.14817945630858e-06, "epoch": 8.128537384569556, "percentage": 81.29, "elapsed_time": "3:47:18", "remaining_time": "0:52:20", "throughput": 2308.66, "total_tokens": 31487080} {"current_steps": 54580, "total_steps": 67140, "loss": 0.5383, "lr": 5.144229983293461e-06, "epoch": 8.129282097110515, "percentage": 81.29, "elapsed_time": "3:47:19", "remaining_time": "0:52:18", "throughput": 2308.67, "total_tokens": 31489800} {"current_steps": 54585, "total_steps": 67140, "loss": 0.4732, "lr": 5.140281852050544e-06, "epoch": 8.130026809651474, "percentage": 81.3, "elapsed_time": "3:47:20", "remaining_time": "0:52:17", "throughput": 2308.7, "total_tokens": 31492936} {"current_steps": 54590, "total_steps": 67140, "loss": 0.5615, "lr": 5.136335062846636e-06, "epoch": 8.130771522192434, "percentage": 81.31, "elapsed_time": "3:47:22", "remaining_time": "0:52:16", "throughput": 2308.73, "total_tokens": 31495944} {"current_steps": 54595, "total_steps": 67140, "loss": 0.5976, "lr": 5.132389615948446e-06, "epoch": 8.131516234733393, "percentage": 81.32, "elapsed_time": "3:47:23", "remaining_time": "0:52:15", "throughput": 2308.78, "total_tokens": 31499496} {"current_steps": 54600, "total_steps": 67140, "loss": 0.6598, "lr": 5.12844551162259e-06, "epoch": 8.132260947274352, "percentage": 81.32, "elapsed_time": "3:47:24", "remaining_time": "0:52:13", "throughput": 2308.79, "total_tokens": 31502312} {"current_steps": 54605, "total_steps": 67140, "loss": 0.5363, "lr": 5.124502750135601e-06, "epoch": 8.13300565981531, "percentage": 81.33, "elapsed_time": "3:47:25", "remaining_time": "0:52:12", "throughput": 2308.83, "total_tokens": 31505480} {"current_steps": 54610, "total_steps": 67140, "loss": 0.6149, "lr": 5.120561331753901e-06, "epoch": 8.133750372356271, "percentage": 81.34, "elapsed_time": "3:47:26", "remaining_time": "0:52:11", "throughput": 2308.84, "total_tokens": 31508296} {"current_steps": 54615, "total_steps": 67140, "loss": 0.505, "lr": 5.116621256743842e-06, "epoch": 8.13449508489723, "percentage": 81.34, "elapsed_time": "3:47:27", "remaining_time": "0:52:09", "throughput": 2308.86, "total_tokens": 31511208} {"current_steps": 54620, "total_steps": 67140, "loss": 0.7251, "lr": 5.112682525371687e-06, "epoch": 8.135239797438189, "percentage": 81.35, "elapsed_time": "3:47:29", "remaining_time": "0:52:08", "throughput": 2308.9, "total_tokens": 31514440} {"current_steps": 54625, "total_steps": 67140, "loss": 0.6673, "lr": 5.108745137903584e-06, "epoch": 8.135984509979147, "percentage": 81.36, "elapsed_time": "3:47:30", "remaining_time": "0:52:07", "throughput": 2308.92, "total_tokens": 31517320} {"current_steps": 54630, "total_steps": 67140, "loss": 0.7101, "lr": 5.104809094605612e-06, "epoch": 8.136729222520108, "percentage": 81.37, "elapsed_time": "3:47:31", "remaining_time": "0:52:06", "throughput": 2308.94, "total_tokens": 31520360} {"current_steps": 54635, "total_steps": 67140, "loss": 0.4042, "lr": 5.100874395743752e-06, "epoch": 8.137473935061067, "percentage": 81.37, "elapsed_time": "3:47:32", "remaining_time": "0:52:04", "throughput": 2308.95, "total_tokens": 31522920} {"current_steps": 54640, "total_steps": 67140, "loss": 0.447, "lr": 5.0969410415839026e-06, "epoch": 8.138218647602026, "percentage": 81.38, "elapsed_time": "3:47:33", "remaining_time": "0:52:03", "throughput": 2308.97, "total_tokens": 31525832} {"current_steps": 54645, "total_steps": 67140, "loss": 0.4088, "lr": 5.093009032391854e-06, "epoch": 8.138963360142984, "percentage": 81.39, "elapsed_time": "3:47:34", "remaining_time": "0:52:02", "throughput": 2308.98, "total_tokens": 31528552} {"current_steps": 54650, "total_steps": 67140, "loss": 0.4459, "lr": 5.089078368433317e-06, "epoch": 8.139708072683945, "percentage": 81.4, "elapsed_time": "3:47:35", "remaining_time": "0:52:00", "throughput": 2309.0, "total_tokens": 31531368} {"current_steps": 54655, "total_steps": 67140, "loss": 0.6171, "lr": 5.0851490499739144e-06, "epoch": 8.140452785224904, "percentage": 81.4, "elapsed_time": "3:47:36", "remaining_time": "0:51:59", "throughput": 2309.01, "total_tokens": 31534120} {"current_steps": 54660, "total_steps": 67140, "loss": 0.6488, "lr": 5.081221077279174e-06, "epoch": 8.141197497765862, "percentage": 81.41, "elapsed_time": "3:47:38", "remaining_time": "0:51:58", "throughput": 2309.04, "total_tokens": 31537192} {"current_steps": 54665, "total_steps": 67140, "loss": 0.6331, "lr": 5.0772944506145254e-06, "epoch": 8.141942210306821, "percentage": 81.42, "elapsed_time": "3:47:39", "remaining_time": "0:51:57", "throughput": 2309.06, "total_tokens": 31540168} {"current_steps": 54670, "total_steps": 67140, "loss": 0.6532, "lr": 5.073369170245324e-06, "epoch": 8.142686922847782, "percentage": 81.43, "elapsed_time": "3:47:40", "remaining_time": "0:51:55", "throughput": 2309.07, "total_tokens": 31542888} {"current_steps": 54675, "total_steps": 67140, "loss": 0.6689, "lr": 5.069445236436813e-06, "epoch": 8.14343163538874, "percentage": 81.43, "elapsed_time": "3:47:41", "remaining_time": "0:51:54", "throughput": 2309.11, "total_tokens": 31546184} {"current_steps": 54680, "total_steps": 67140, "loss": 0.4496, "lr": 5.065522649454157e-06, "epoch": 8.1441763479297, "percentage": 81.44, "elapsed_time": "3:47:42", "remaining_time": "0:51:53", "throughput": 2309.13, "total_tokens": 31549192} {"current_steps": 54685, "total_steps": 67140, "loss": 0.6164, "lr": 5.061601409562436e-06, "epoch": 8.144921060470658, "percentage": 81.45, "elapsed_time": "3:47:43", "remaining_time": "0:51:52", "throughput": 2309.15, "total_tokens": 31552008} {"current_steps": 54690, "total_steps": 67140, "loss": 0.6849, "lr": 5.057681517026627e-06, "epoch": 8.145665773011617, "percentage": 81.46, "elapsed_time": "3:47:45", "remaining_time": "0:51:50", "throughput": 2309.18, "total_tokens": 31555016} {"current_steps": 54695, "total_steps": 67140, "loss": 0.7061, "lr": 5.053762972111623e-06, "epoch": 8.146410485552577, "percentage": 81.46, "elapsed_time": "3:47:46", "remaining_time": "0:51:49", "throughput": 2309.19, "total_tokens": 31557704} {"current_steps": 54700, "total_steps": 67140, "loss": 0.5779, "lr": 5.049845775082227e-06, "epoch": 8.147155198093536, "percentage": 81.47, "elapsed_time": "3:47:47", "remaining_time": "0:51:48", "throughput": 2309.2, "total_tokens": 31560456} {"current_steps": 54705, "total_steps": 67140, "loss": 0.3759, "lr": 5.045929926203144e-06, "epoch": 8.147899910634495, "percentage": 81.48, "elapsed_time": "3:47:48", "remaining_time": "0:51:46", "throughput": 2309.21, "total_tokens": 31563208} {"current_steps": 54710, "total_steps": 67140, "loss": 0.5617, "lr": 5.04201542573898e-06, "epoch": 8.148644623175453, "percentage": 81.49, "elapsed_time": "3:47:49", "remaining_time": "0:51:45", "throughput": 2309.24, "total_tokens": 31566216} {"current_steps": 54715, "total_steps": 67140, "loss": 0.6548, "lr": 5.0381022739542734e-06, "epoch": 8.149389335716414, "percentage": 81.49, "elapsed_time": "3:47:50", "remaining_time": "0:51:44", "throughput": 2309.25, "total_tokens": 31569032} {"current_steps": 54720, "total_steps": 67140, "loss": 0.5854, "lr": 5.034190471113453e-06, "epoch": 8.150134048257373, "percentage": 81.5, "elapsed_time": "3:47:51", "remaining_time": "0:51:43", "throughput": 2309.27, "total_tokens": 31571880} {"current_steps": 54725, "total_steps": 67140, "loss": 0.6869, "lr": 5.0302800174808654e-06, "epoch": 8.150878760798332, "percentage": 81.51, "elapsed_time": "3:47:52", "remaining_time": "0:51:41", "throughput": 2309.3, "total_tokens": 31574888} {"current_steps": 54730, "total_steps": 67140, "loss": 0.2865, "lr": 5.026370913320766e-06, "epoch": 8.15162347333929, "percentage": 81.52, "elapsed_time": "3:47:54", "remaining_time": "0:51:40", "throughput": 2309.32, "total_tokens": 31577800} {"current_steps": 54735, "total_steps": 67140, "loss": 0.5624, "lr": 5.022463158897317e-06, "epoch": 8.15236818588025, "percentage": 81.52, "elapsed_time": "3:47:55", "remaining_time": "0:51:39", "throughput": 2309.32, "total_tokens": 31580456} {"current_steps": 54740, "total_steps": 67140, "loss": 0.6366, "lr": 5.018556754474588e-06, "epoch": 8.15311289842121, "percentage": 81.53, "elapsed_time": "3:47:56", "remaining_time": "0:51:38", "throughput": 2309.35, "total_tokens": 31583496} {"current_steps": 54745, "total_steps": 67140, "loss": 0.4028, "lr": 5.014651700316547e-06, "epoch": 8.153857610962168, "percentage": 81.54, "elapsed_time": "3:47:57", "remaining_time": "0:51:36", "throughput": 2309.37, "total_tokens": 31586408} {"current_steps": 54750, "total_steps": 67140, "loss": 0.6275, "lr": 5.010747996687087e-06, "epoch": 8.154602323503127, "percentage": 81.55, "elapsed_time": "3:47:58", "remaining_time": "0:51:35", "throughput": 2309.38, "total_tokens": 31589192} {"current_steps": 54755, "total_steps": 67140, "loss": 0.3848, "lr": 5.006845643850011e-06, "epoch": 8.155347036044088, "percentage": 81.55, "elapsed_time": "3:47:59", "remaining_time": "0:51:34", "throughput": 2309.41, "total_tokens": 31592168} {"current_steps": 54760, "total_steps": 67140, "loss": 0.4662, "lr": 5.002944642069019e-06, "epoch": 8.156091748585046, "percentage": 81.56, "elapsed_time": "3:48:00", "remaining_time": "0:51:32", "throughput": 2309.42, "total_tokens": 31594952} {"current_steps": 54765, "total_steps": 67140, "loss": 0.4793, "lr": 4.9990449916077234e-06, "epoch": 8.156836461126005, "percentage": 81.57, "elapsed_time": "3:48:02", "remaining_time": "0:51:31", "throughput": 2309.45, "total_tokens": 31597960} {"current_steps": 54770, "total_steps": 67140, "loss": 0.7013, "lr": 4.995146692729661e-06, "epoch": 8.157581173666964, "percentage": 81.58, "elapsed_time": "3:48:03", "remaining_time": "0:51:30", "throughput": 2309.46, "total_tokens": 31600712} {"current_steps": 54775, "total_steps": 67140, "loss": 0.5456, "lr": 4.99124974569824e-06, "epoch": 8.158325886207924, "percentage": 81.58, "elapsed_time": "3:48:04", "remaining_time": "0:51:29", "throughput": 2309.49, "total_tokens": 31603816} {"current_steps": 54780, "total_steps": 67140, "loss": 0.4567, "lr": 4.987354150776819e-06, "epoch": 8.159070598748883, "percentage": 81.59, "elapsed_time": "3:48:05", "remaining_time": "0:51:27", "throughput": 2309.51, "total_tokens": 31606600} {"current_steps": 54785, "total_steps": 67140, "loss": 0.5978, "lr": 4.9834599082286325e-06, "epoch": 8.159815311289842, "percentage": 81.6, "elapsed_time": "3:48:06", "remaining_time": "0:51:26", "throughput": 2309.53, "total_tokens": 31609544} {"current_steps": 54790, "total_steps": 67140, "loss": 0.6638, "lr": 4.979567018316847e-06, "epoch": 8.1605600238308, "percentage": 81.61, "elapsed_time": "3:48:07", "remaining_time": "0:51:25", "throughput": 2309.57, "total_tokens": 31612904} {"current_steps": 54795, "total_steps": 67140, "loss": 0.6863, "lr": 4.975675481304523e-06, "epoch": 8.161304736371761, "percentage": 81.61, "elapsed_time": "3:48:08", "remaining_time": "0:51:24", "throughput": 2309.58, "total_tokens": 31615656} {"current_steps": 54800, "total_steps": 67140, "loss": 0.2363, "lr": 4.971785297454637e-06, "epoch": 8.16204944891272, "percentage": 81.62, "elapsed_time": "3:48:10", "remaining_time": "0:51:22", "throughput": 2309.6, "total_tokens": 31618536} {"current_steps": 54805, "total_steps": 67140, "loss": 0.709, "lr": 4.9678964670300785e-06, "epoch": 8.162794161453679, "percentage": 81.63, "elapsed_time": "3:48:11", "remaining_time": "0:51:21", "throughput": 2309.63, "total_tokens": 31621512} {"current_steps": 54810, "total_steps": 67140, "loss": 0.6039, "lr": 4.964008990293626e-06, "epoch": 8.163538873994638, "percentage": 81.64, "elapsed_time": "3:48:12", "remaining_time": "0:51:20", "throughput": 2309.64, "total_tokens": 31624296} {"current_steps": 54815, "total_steps": 67140, "loss": 0.562, "lr": 4.960122867507983e-06, "epoch": 8.164283586535598, "percentage": 81.64, "elapsed_time": "3:48:13", "remaining_time": "0:51:18", "throughput": 2309.67, "total_tokens": 31627400} {"current_steps": 54820, "total_steps": 67140, "loss": 0.4905, "lr": 4.95623809893577e-06, "epoch": 8.165028299076557, "percentage": 81.65, "elapsed_time": "3:48:14", "remaining_time": "0:51:17", "throughput": 2309.7, "total_tokens": 31630408} {"current_steps": 54825, "total_steps": 67140, "loss": 0.5379, "lr": 4.952354684839486e-06, "epoch": 8.165773011617516, "percentage": 81.66, "elapsed_time": "3:48:15", "remaining_time": "0:51:16", "throughput": 2309.72, "total_tokens": 31633352} {"current_steps": 54830, "total_steps": 67140, "loss": 0.6845, "lr": 4.948472625481565e-06, "epoch": 8.166517724158474, "percentage": 81.67, "elapsed_time": "3:48:16", "remaining_time": "0:51:15", "throughput": 2309.74, "total_tokens": 31636264} {"current_steps": 54835, "total_steps": 67140, "loss": 0.4958, "lr": 4.944591921124348e-06, "epoch": 8.167262436699435, "percentage": 81.67, "elapsed_time": "3:48:18", "remaining_time": "0:51:13", "throughput": 2309.75, "total_tokens": 31638920} {"current_steps": 54840, "total_steps": 67140, "loss": 0.7305, "lr": 4.940712572030062e-06, "epoch": 8.168007149240394, "percentage": 81.68, "elapsed_time": "3:48:19", "remaining_time": "0:51:12", "throughput": 2309.77, "total_tokens": 31641896} {"current_steps": 54845, "total_steps": 67140, "loss": 0.5176, "lr": 4.936834578460867e-06, "epoch": 8.168751861781352, "percentage": 81.69, "elapsed_time": "3:48:20", "remaining_time": "0:51:11", "throughput": 2309.78, "total_tokens": 31644712} {"current_steps": 54850, "total_steps": 67140, "loss": 0.6726, "lr": 4.932957940678818e-06, "epoch": 8.169496574322311, "percentage": 81.69, "elapsed_time": "3:48:21", "remaining_time": "0:51:10", "throughput": 2309.81, "total_tokens": 31647688} {"current_steps": 54855, "total_steps": 67140, "loss": 0.5831, "lr": 4.9290826589458854e-06, "epoch": 8.17024128686327, "percentage": 81.7, "elapsed_time": "3:48:22", "remaining_time": "0:51:08", "throughput": 2309.81, "total_tokens": 31650280} {"current_steps": 54860, "total_steps": 67140, "loss": 0.5904, "lr": 4.92520873352395e-06, "epoch": 8.17098599940423, "percentage": 81.71, "elapsed_time": "3:48:23", "remaining_time": "0:51:07", "throughput": 2309.84, "total_tokens": 31653224} {"current_steps": 54865, "total_steps": 67140, "loss": 0.591, "lr": 4.921336164674786e-06, "epoch": 8.17173071194519, "percentage": 81.72, "elapsed_time": "3:48:24", "remaining_time": "0:51:06", "throughput": 2309.87, "total_tokens": 31656392} {"current_steps": 54870, "total_steps": 67140, "loss": 0.3899, "lr": 4.917464952660094e-06, "epoch": 8.172475424486148, "percentage": 81.72, "elapsed_time": "3:48:25", "remaining_time": "0:51:04", "throughput": 2309.88, "total_tokens": 31659272} {"current_steps": 54875, "total_steps": 67140, "loss": 0.7127, "lr": 4.9135950977414666e-06, "epoch": 8.173220137027107, "percentage": 81.73, "elapsed_time": "3:48:27", "remaining_time": "0:51:03", "throughput": 2309.9, "total_tokens": 31662056} {"current_steps": 54880, "total_steps": 67140, "loss": 0.5168, "lr": 4.909726600180417e-06, "epoch": 8.173964849568067, "percentage": 81.74, "elapsed_time": "3:48:28", "remaining_time": "0:51:02", "throughput": 2309.93, "total_tokens": 31665128} {"current_steps": 54885, "total_steps": 67140, "loss": 0.4869, "lr": 4.9058594602383625e-06, "epoch": 8.174709562109026, "percentage": 81.75, "elapsed_time": "3:48:29", "remaining_time": "0:51:01", "throughput": 2309.96, "total_tokens": 31668232} {"current_steps": 54890, "total_steps": 67140, "loss": 0.5937, "lr": 4.9019936781766275e-06, "epoch": 8.175454274649985, "percentage": 81.75, "elapsed_time": "3:48:30", "remaining_time": "0:50:59", "throughput": 2309.98, "total_tokens": 31671112} {"current_steps": 54895, "total_steps": 67140, "loss": 0.6242, "lr": 4.898129254256448e-06, "epoch": 8.176198987190944, "percentage": 81.76, "elapsed_time": "3:48:31", "remaining_time": "0:50:58", "throughput": 2310.0, "total_tokens": 31674088} {"current_steps": 54900, "total_steps": 67140, "loss": 0.4797, "lr": 4.8942661887389715e-06, "epoch": 8.176943699731904, "percentage": 81.77, "elapsed_time": "3:48:32", "remaining_time": "0:50:57", "throughput": 2310.01, "total_tokens": 31676680} {"current_steps": 54905, "total_steps": 67140, "loss": 0.6242, "lr": 4.890404481885244e-06, "epoch": 8.177688412272863, "percentage": 81.78, "elapsed_time": "3:48:33", "remaining_time": "0:50:56", "throughput": 2310.03, "total_tokens": 31679624} {"current_steps": 54910, "total_steps": 67140, "loss": 0.7408, "lr": 4.886544133956211e-06, "epoch": 8.178433124813822, "percentage": 81.78, "elapsed_time": "3:48:35", "remaining_time": "0:50:54", "throughput": 2310.05, "total_tokens": 31682568} {"current_steps": 54915, "total_steps": 67140, "loss": 0.6177, "lr": 4.882685145212754e-06, "epoch": 8.17917783735478, "percentage": 81.79, "elapsed_time": "3:48:36", "remaining_time": "0:50:53", "throughput": 2310.07, "total_tokens": 31685448} {"current_steps": 54920, "total_steps": 67140, "loss": 0.6637, "lr": 4.878827515915643e-06, "epoch": 8.17992254989574, "percentage": 81.8, "elapsed_time": "3:48:37", "remaining_time": "0:50:52", "throughput": 2310.09, "total_tokens": 31688264} {"current_steps": 54925, "total_steps": 67140, "loss": 0.4588, "lr": 4.8749712463255605e-06, "epoch": 8.1806672624367, "percentage": 81.81, "elapsed_time": "3:48:38", "remaining_time": "0:50:50", "throughput": 2310.11, "total_tokens": 31691336} {"current_steps": 54930, "total_steps": 67140, "loss": 0.4087, "lr": 4.871116336703099e-06, "epoch": 8.181411974977658, "percentage": 81.81, "elapsed_time": "3:48:39", "remaining_time": "0:50:49", "throughput": 2310.14, "total_tokens": 31694376} {"current_steps": 54935, "total_steps": 67140, "loss": 0.4979, "lr": 4.867262787308765e-06, "epoch": 8.182156687518617, "percentage": 81.82, "elapsed_time": "3:48:40", "remaining_time": "0:50:48", "throughput": 2310.16, "total_tokens": 31697352} {"current_steps": 54940, "total_steps": 67140, "loss": 0.7327, "lr": 4.863410598402959e-06, "epoch": 8.182901400059578, "percentage": 81.83, "elapsed_time": "3:48:41", "remaining_time": "0:50:47", "throughput": 2310.18, "total_tokens": 31700232} {"current_steps": 54945, "total_steps": 67140, "loss": 0.6141, "lr": 4.859559770245986e-06, "epoch": 8.183646112600536, "percentage": 81.84, "elapsed_time": "3:48:43", "remaining_time": "0:50:45", "throughput": 2310.21, "total_tokens": 31703240} {"current_steps": 54950, "total_steps": 67140, "loss": 0.4703, "lr": 4.855710303098082e-06, "epoch": 8.184390825141495, "percentage": 81.84, "elapsed_time": "3:48:44", "remaining_time": "0:50:44", "throughput": 2310.22, "total_tokens": 31705992} {"current_steps": 54955, "total_steps": 67140, "loss": 0.5905, "lr": 4.851862197219373e-06, "epoch": 8.185135537682454, "percentage": 81.85, "elapsed_time": "3:48:45", "remaining_time": "0:50:43", "throughput": 2310.26, "total_tokens": 31709192} {"current_steps": 54960, "total_steps": 67140, "loss": 0.4461, "lr": 4.8480154528699e-06, "epoch": 8.185880250223414, "percentage": 81.86, "elapsed_time": "3:48:46", "remaining_time": "0:50:42", "throughput": 2310.26, "total_tokens": 31711880} {"current_steps": 54965, "total_steps": 67140, "loss": 0.4488, "lr": 4.844170070309612e-06, "epoch": 8.186624962764373, "percentage": 81.87, "elapsed_time": "3:48:47", "remaining_time": "0:50:40", "throughput": 2310.28, "total_tokens": 31714568} {"current_steps": 54970, "total_steps": 67140, "loss": 0.5798, "lr": 4.840326049798369e-06, "epoch": 8.187369675305332, "percentage": 81.87, "elapsed_time": "3:48:48", "remaining_time": "0:50:39", "throughput": 2310.3, "total_tokens": 31717480} {"current_steps": 54975, "total_steps": 67140, "loss": 0.6726, "lr": 4.83648339159592e-06, "epoch": 8.18811438784629, "percentage": 81.88, "elapsed_time": "3:48:49", "remaining_time": "0:50:38", "throughput": 2310.32, "total_tokens": 31720488} {"current_steps": 54980, "total_steps": 67140, "loss": 0.5621, "lr": 4.832642095961953e-06, "epoch": 8.188859100387251, "percentage": 81.89, "elapsed_time": "3:48:51", "remaining_time": "0:50:36", "throughput": 2310.34, "total_tokens": 31723368} {"current_steps": 54985, "total_steps": 67140, "loss": 0.5326, "lr": 4.828802163156032e-06, "epoch": 8.18960381292821, "percentage": 81.9, "elapsed_time": "3:48:52", "remaining_time": "0:50:35", "throughput": 2310.36, "total_tokens": 31726344} {"current_steps": 54990, "total_steps": 67140, "loss": 0.673, "lr": 4.824963593437648e-06, "epoch": 8.190348525469169, "percentage": 81.9, "elapsed_time": "3:48:53", "remaining_time": "0:50:34", "throughput": 2310.38, "total_tokens": 31729096} {"current_steps": 54995, "total_steps": 67140, "loss": 0.6295, "lr": 4.821126387066202e-06, "epoch": 8.191093238010128, "percentage": 81.91, "elapsed_time": "3:48:54", "remaining_time": "0:50:33", "throughput": 2310.39, "total_tokens": 31731976} {"current_steps": 55000, "total_steps": 67140, "loss": 0.6714, "lr": 4.817290544300998e-06, "epoch": 8.191837950551088, "percentage": 81.92, "elapsed_time": "3:48:55", "remaining_time": "0:50:31", "throughput": 2310.43, "total_tokens": 31735304} {"current_steps": 55005, "total_steps": 67140, "loss": 0.8633, "lr": 4.813456065401237e-06, "epoch": 8.192582663092047, "percentage": 81.93, "elapsed_time": "3:48:56", "remaining_time": "0:50:30", "throughput": 2310.44, "total_tokens": 31737928} {"current_steps": 55010, "total_steps": 67140, "loss": 0.4618, "lr": 4.809622950626041e-06, "epoch": 8.193327375633006, "percentage": 81.93, "elapsed_time": "3:48:57", "remaining_time": "0:50:29", "throughput": 2310.46, "total_tokens": 31740776} {"current_steps": 55015, "total_steps": 67140, "loss": 0.5415, "lr": 4.805791200234441e-06, "epoch": 8.194072088173964, "percentage": 81.94, "elapsed_time": "3:48:58", "remaining_time": "0:50:27", "throughput": 2310.47, "total_tokens": 31743432} {"current_steps": 55020, "total_steps": 67140, "loss": 0.6147, "lr": 4.801960814485373e-06, "epoch": 8.194816800714925, "percentage": 81.95, "elapsed_time": "3:49:00", "remaining_time": "0:50:26", "throughput": 2310.49, "total_tokens": 31746376} {"current_steps": 55025, "total_steps": 67140, "loss": 0.5539, "lr": 4.798131793637667e-06, "epoch": 8.195561513255884, "percentage": 81.96, "elapsed_time": "3:49:01", "remaining_time": "0:50:25", "throughput": 2310.5, "total_tokens": 31749256} {"current_steps": 55030, "total_steps": 67140, "loss": 0.566, "lr": 4.794304137950079e-06, "epoch": 8.196306225796842, "percentage": 81.96, "elapsed_time": "3:49:02", "remaining_time": "0:50:24", "throughput": 2310.52, "total_tokens": 31752072} {"current_steps": 55035, "total_steps": 67140, "loss": 0.4793, "lr": 4.790477847681274e-06, "epoch": 8.197050938337801, "percentage": 81.97, "elapsed_time": "3:49:03", "remaining_time": "0:50:22", "throughput": 2310.54, "total_tokens": 31754920} {"current_steps": 55040, "total_steps": 67140, "loss": 0.5862, "lr": 4.786652923089804e-06, "epoch": 8.19779565087876, "percentage": 81.98, "elapsed_time": "3:49:04", "remaining_time": "0:50:21", "throughput": 2310.55, "total_tokens": 31757672} {"current_steps": 55045, "total_steps": 67140, "loss": 0.4843, "lr": 4.782829364434146e-06, "epoch": 8.19854036341972, "percentage": 81.99, "elapsed_time": "3:49:05", "remaining_time": "0:50:20", "throughput": 2310.57, "total_tokens": 31760712} {"current_steps": 55050, "total_steps": 67140, "loss": 0.6304, "lr": 4.779007171972685e-06, "epoch": 8.19928507596068, "percentage": 81.99, "elapsed_time": "3:49:06", "remaining_time": "0:50:19", "throughput": 2310.59, "total_tokens": 31763560} {"current_steps": 55055, "total_steps": 67140, "loss": 0.4804, "lr": 4.775186345963706e-06, "epoch": 8.200029788501638, "percentage": 82.0, "elapsed_time": "3:49:08", "remaining_time": "0:50:17", "throughput": 2310.59, "total_tokens": 31766056} {"current_steps": 55060, "total_steps": 67140, "loss": 0.4404, "lr": 4.771366886665412e-06, "epoch": 8.200774501042597, "percentage": 82.01, "elapsed_time": "3:49:09", "remaining_time": "0:50:16", "throughput": 2310.6, "total_tokens": 31768712} {"current_steps": 55065, "total_steps": 67140, "loss": 0.5441, "lr": 4.767548794335894e-06, "epoch": 8.201519213583557, "percentage": 82.02, "elapsed_time": "3:49:10", "remaining_time": "0:50:15", "throughput": 2310.62, "total_tokens": 31771656} {"current_steps": 55070, "total_steps": 67140, "loss": 0.6564, "lr": 4.763732069233173e-06, "epoch": 8.202263926124516, "percentage": 82.02, "elapsed_time": "3:49:11", "remaining_time": "0:50:13", "throughput": 2310.64, "total_tokens": 31774600} {"current_steps": 55075, "total_steps": 67140, "loss": 0.4663, "lr": 4.759916711615162e-06, "epoch": 8.203008638665475, "percentage": 82.03, "elapsed_time": "3:49:12", "remaining_time": "0:50:12", "throughput": 2310.66, "total_tokens": 31777384} {"current_steps": 55080, "total_steps": 67140, "loss": 0.5517, "lr": 4.756102721739686e-06, "epoch": 8.203753351206434, "percentage": 82.04, "elapsed_time": "3:49:13", "remaining_time": "0:50:11", "throughput": 2310.66, "total_tokens": 31780008} {"current_steps": 55085, "total_steps": 67140, "loss": 0.5349, "lr": 4.752290099864484e-06, "epoch": 8.204498063747394, "percentage": 82.04, "elapsed_time": "3:49:14", "remaining_time": "0:50:10", "throughput": 2310.68, "total_tokens": 31782728} {"current_steps": 55090, "total_steps": 67140, "loss": 0.5345, "lr": 4.748478846247198e-06, "epoch": 8.205242776288353, "percentage": 82.05, "elapsed_time": "3:49:15", "remaining_time": "0:50:08", "throughput": 2310.7, "total_tokens": 31785672} {"current_steps": 55095, "total_steps": 67140, "loss": 0.519, "lr": 4.744668961145371e-06, "epoch": 8.205987488829312, "percentage": 82.06, "elapsed_time": "3:49:16", "remaining_time": "0:50:07", "throughput": 2310.71, "total_tokens": 31788328} {"current_steps": 55100, "total_steps": 67140, "loss": 0.502, "lr": 4.740860444816472e-06, "epoch": 8.20673220137027, "percentage": 82.07, "elapsed_time": "3:49:18", "remaining_time": "0:50:06", "throughput": 2310.72, "total_tokens": 31791048} {"current_steps": 55105, "total_steps": 67140, "loss": 0.4489, "lr": 4.7370532975178575e-06, "epoch": 8.207476913911231, "percentage": 82.07, "elapsed_time": "3:49:19", "remaining_time": "0:50:05", "throughput": 2310.73, "total_tokens": 31793768} {"current_steps": 55110, "total_steps": 67140, "loss": 0.5642, "lr": 4.733247519506789e-06, "epoch": 8.20822162645219, "percentage": 82.08, "elapsed_time": "3:49:20", "remaining_time": "0:50:03", "throughput": 2310.76, "total_tokens": 31796840} {"current_steps": 55115, "total_steps": 67140, "loss": 0.3814, "lr": 4.7294431110404545e-06, "epoch": 8.208966338993148, "percentage": 82.09, "elapsed_time": "3:49:21", "remaining_time": "0:50:02", "throughput": 2310.77, "total_tokens": 31799624} {"current_steps": 55120, "total_steps": 67140, "loss": 0.421, "lr": 4.725640072375942e-06, "epoch": 8.209711051534107, "percentage": 82.1, "elapsed_time": "3:49:22", "remaining_time": "0:50:01", "throughput": 2310.78, "total_tokens": 31802344} {"current_steps": 55125, "total_steps": 67140, "loss": 0.4468, "lr": 4.7218384037702425e-06, "epoch": 8.210455764075068, "percentage": 82.1, "elapsed_time": "3:49:23", "remaining_time": "0:49:59", "throughput": 2310.81, "total_tokens": 31805384} {"current_steps": 55130, "total_steps": 67140, "loss": 0.6166, "lr": 4.71803810548026e-06, "epoch": 8.211200476616026, "percentage": 82.11, "elapsed_time": "3:49:24", "remaining_time": "0:49:58", "throughput": 2310.83, "total_tokens": 31808328} {"current_steps": 55135, "total_steps": 67140, "loss": 0.5572, "lr": 4.714239177762808e-06, "epoch": 8.211945189156985, "percentage": 82.12, "elapsed_time": "3:49:25", "remaining_time": "0:49:57", "throughput": 2310.84, "total_tokens": 31810952} {"current_steps": 55140, "total_steps": 67140, "loss": 0.5395, "lr": 4.710441620874589e-06, "epoch": 8.212689901697944, "percentage": 82.13, "elapsed_time": "3:49:27", "remaining_time": "0:49:56", "throughput": 2310.87, "total_tokens": 31814120} {"current_steps": 55145, "total_steps": 67140, "loss": 0.6107, "lr": 4.706645435072243e-06, "epoch": 8.213434614238905, "percentage": 82.13, "elapsed_time": "3:49:28", "remaining_time": "0:49:54", "throughput": 2310.91, "total_tokens": 31817448} {"current_steps": 55150, "total_steps": 67140, "loss": 0.4927, "lr": 4.702850620612284e-06, "epoch": 8.214179326779863, "percentage": 82.14, "elapsed_time": "3:49:29", "remaining_time": "0:49:53", "throughput": 2310.92, "total_tokens": 31820264} {"current_steps": 55155, "total_steps": 67140, "loss": 0.6275, "lr": 4.699057177751157e-06, "epoch": 8.214924039320822, "percentage": 82.15, "elapsed_time": "3:49:30", "remaining_time": "0:49:52", "throughput": 2310.94, "total_tokens": 31823112} {"current_steps": 55160, "total_steps": 67140, "loss": 0.585, "lr": 4.695265106745209e-06, "epoch": 8.21566875186178, "percentage": 82.16, "elapsed_time": "3:49:31", "remaining_time": "0:49:51", "throughput": 2310.96, "total_tokens": 31825864} {"current_steps": 55165, "total_steps": 67140, "loss": 0.3362, "lr": 4.691474407850699e-06, "epoch": 8.216413464402741, "percentage": 82.16, "elapsed_time": "3:49:32", "remaining_time": "0:49:49", "throughput": 2310.99, "total_tokens": 31829000} {"current_steps": 55170, "total_steps": 67140, "loss": 0.5771, "lr": 4.687685081323773e-06, "epoch": 8.2171581769437, "percentage": 82.17, "elapsed_time": "3:49:34", "remaining_time": "0:49:48", "throughput": 2311.0, "total_tokens": 31831752} {"current_steps": 55175, "total_steps": 67140, "loss": 0.5851, "lr": 4.683897127420503e-06, "epoch": 8.217902889484659, "percentage": 82.18, "elapsed_time": "3:49:35", "remaining_time": "0:49:47", "throughput": 2311.02, "total_tokens": 31834568} {"current_steps": 55180, "total_steps": 67140, "loss": 0.7737, "lr": 4.680110546396868e-06, "epoch": 8.218647602025618, "percentage": 82.19, "elapsed_time": "3:49:36", "remaining_time": "0:49:45", "throughput": 2311.05, "total_tokens": 31837640} {"current_steps": 55185, "total_steps": 67140, "loss": 0.6591, "lr": 4.676325338508755e-06, "epoch": 8.219392314566578, "percentage": 82.19, "elapsed_time": "3:49:37", "remaining_time": "0:49:44", "throughput": 2311.07, "total_tokens": 31840520} {"current_steps": 55190, "total_steps": 67140, "loss": 0.6485, "lr": 4.672541504011938e-06, "epoch": 8.220137027107537, "percentage": 82.2, "elapsed_time": "3:49:38", "remaining_time": "0:49:43", "throughput": 2311.09, "total_tokens": 31843528} {"current_steps": 55195, "total_steps": 67140, "loss": 0.5249, "lr": 4.668759043162121e-06, "epoch": 8.220881739648496, "percentage": 82.21, "elapsed_time": "3:49:39", "remaining_time": "0:49:42", "throughput": 2311.09, "total_tokens": 31846152} {"current_steps": 55200, "total_steps": 67140, "loss": 0.4846, "lr": 4.664977956214914e-06, "epoch": 8.221626452189454, "percentage": 82.22, "elapsed_time": "3:49:40", "remaining_time": "0:49:40", "throughput": 2311.12, "total_tokens": 31849096} {"current_steps": 55205, "total_steps": 67140, "loss": 0.625, "lr": 4.661198243425813e-06, "epoch": 8.222371164730415, "percentage": 82.22, "elapsed_time": "3:49:41", "remaining_time": "0:49:39", "throughput": 2311.12, "total_tokens": 31851688} {"current_steps": 55210, "total_steps": 67140, "loss": 0.4971, "lr": 4.6574199050502445e-06, "epoch": 8.223115877271374, "percentage": 82.23, "elapsed_time": "3:49:43", "remaining_time": "0:49:38", "throughput": 2311.13, "total_tokens": 31854408} {"current_steps": 55215, "total_steps": 67140, "loss": 0.6712, "lr": 4.653642941343531e-06, "epoch": 8.223860589812332, "percentage": 82.24, "elapsed_time": "3:49:44", "remaining_time": "0:49:37", "throughput": 2311.15, "total_tokens": 31857352} {"current_steps": 55220, "total_steps": 67140, "loss": 0.4981, "lr": 4.649867352560905e-06, "epoch": 8.224605302353291, "percentage": 82.25, "elapsed_time": "3:49:45", "remaining_time": "0:49:35", "throughput": 2311.16, "total_tokens": 31860104} {"current_steps": 55225, "total_steps": 67140, "loss": 0.5455, "lr": 4.646093138957514e-06, "epoch": 8.22535001489425, "percentage": 82.25, "elapsed_time": "3:49:46", "remaining_time": "0:49:34", "throughput": 2311.18, "total_tokens": 31862856} {"current_steps": 55230, "total_steps": 67140, "loss": 0.6291, "lr": 4.6423203007883886e-06, "epoch": 8.22609472743521, "percentage": 82.26, "elapsed_time": "3:49:47", "remaining_time": "0:49:33", "throughput": 2311.19, "total_tokens": 31865576} {"current_steps": 55235, "total_steps": 67140, "loss": 0.5598, "lr": 4.638548838308493e-06, "epoch": 8.22683943997617, "percentage": 82.27, "elapsed_time": "3:49:48", "remaining_time": "0:49:31", "throughput": 2311.21, "total_tokens": 31868584} {"current_steps": 55240, "total_steps": 67140, "loss": 0.4233, "lr": 4.6347787517726785e-06, "epoch": 8.227584152517128, "percentage": 82.28, "elapsed_time": "3:49:49", "remaining_time": "0:49:30", "throughput": 2311.22, "total_tokens": 31871304} {"current_steps": 55245, "total_steps": 67140, "loss": 0.4459, "lr": 4.6310100414357185e-06, "epoch": 8.228328865058087, "percentage": 82.28, "elapsed_time": "3:49:50", "remaining_time": "0:49:29", "throughput": 2311.23, "total_tokens": 31874056} {"current_steps": 55250, "total_steps": 67140, "loss": 0.7462, "lr": 4.6272427075522845e-06, "epoch": 8.229073577599047, "percentage": 82.29, "elapsed_time": "3:49:52", "remaining_time": "0:49:28", "throughput": 2311.25, "total_tokens": 31876968} {"current_steps": 55255, "total_steps": 67140, "loss": 0.5259, "lr": 4.623476750376956e-06, "epoch": 8.229818290140006, "percentage": 82.3, "elapsed_time": "3:49:53", "remaining_time": "0:49:26", "throughput": 2311.28, "total_tokens": 31880008} {"current_steps": 55260, "total_steps": 67140, "loss": 0.5988, "lr": 4.6197121701642286e-06, "epoch": 8.230563002680965, "percentage": 82.31, "elapsed_time": "3:49:54", "remaining_time": "0:49:25", "throughput": 2311.31, "total_tokens": 31883240} {"current_steps": 55265, "total_steps": 67140, "loss": 0.7376, "lr": 4.615948967168496e-06, "epoch": 8.231307715221924, "percentage": 82.31, "elapsed_time": "3:49:55", "remaining_time": "0:49:24", "throughput": 2311.33, "total_tokens": 31886120} {"current_steps": 55270, "total_steps": 67140, "loss": 0.7867, "lr": 4.612187141644056e-06, "epoch": 8.232052427762884, "percentage": 82.32, "elapsed_time": "3:49:56", "remaining_time": "0:49:23", "throughput": 2311.36, "total_tokens": 31889192} {"current_steps": 55275, "total_steps": 67140, "loss": 0.5798, "lr": 4.6084266938451135e-06, "epoch": 8.232797140303843, "percentage": 82.33, "elapsed_time": "3:49:57", "remaining_time": "0:49:21", "throughput": 2311.37, "total_tokens": 31891880} {"current_steps": 55280, "total_steps": 67140, "loss": 0.5971, "lr": 4.604667624025788e-06, "epoch": 8.233541852844802, "percentage": 82.34, "elapsed_time": "3:49:58", "remaining_time": "0:49:20", "throughput": 2311.37, "total_tokens": 31894472} {"current_steps": 55285, "total_steps": 67140, "loss": 0.3335, "lr": 4.600909932440103e-06, "epoch": 8.23428656538576, "percentage": 82.34, "elapsed_time": "3:50:00", "remaining_time": "0:49:19", "throughput": 2311.4, "total_tokens": 31897448} {"current_steps": 55290, "total_steps": 67140, "loss": 0.5397, "lr": 4.59715361934199e-06, "epoch": 8.235031277926721, "percentage": 82.35, "elapsed_time": "3:50:01", "remaining_time": "0:49:17", "throughput": 2311.4, "total_tokens": 31900040} {"current_steps": 55295, "total_steps": 67140, "loss": 0.5339, "lr": 4.593398684985281e-06, "epoch": 8.23577599046768, "percentage": 82.36, "elapsed_time": "3:50:02", "remaining_time": "0:49:16", "throughput": 2311.41, "total_tokens": 31902856} {"current_steps": 55300, "total_steps": 67140, "loss": 0.4666, "lr": 4.589645129623729e-06, "epoch": 8.236520703008638, "percentage": 82.37, "elapsed_time": "3:50:03", "remaining_time": "0:49:15", "throughput": 2311.43, "total_tokens": 31905672} {"current_steps": 55305, "total_steps": 67140, "loss": 0.4718, "lr": 4.585892953510978e-06, "epoch": 8.237265415549597, "percentage": 82.37, "elapsed_time": "3:50:04", "remaining_time": "0:49:14", "throughput": 2311.45, "total_tokens": 31908552} {"current_steps": 55310, "total_steps": 67140, "loss": 0.5711, "lr": 4.582142156900576e-06, "epoch": 8.238010128090558, "percentage": 82.38, "elapsed_time": "3:50:05", "remaining_time": "0:49:12", "throughput": 2311.46, "total_tokens": 31911400} {"current_steps": 55315, "total_steps": 67140, "loss": 0.449, "lr": 4.578392740045994e-06, "epoch": 8.238754840631517, "percentage": 82.39, "elapsed_time": "3:50:06", "remaining_time": "0:49:11", "throughput": 2311.47, "total_tokens": 31914024} {"current_steps": 55320, "total_steps": 67140, "loss": 0.822, "lr": 4.5746447032006005e-06, "epoch": 8.239499553172475, "percentage": 82.39, "elapsed_time": "3:50:07", "remaining_time": "0:49:10", "throughput": 2311.49, "total_tokens": 31916968} {"current_steps": 55325, "total_steps": 67140, "loss": 0.5795, "lr": 4.570898046617677e-06, "epoch": 8.240244265713434, "percentage": 82.4, "elapsed_time": "3:50:09", "remaining_time": "0:49:09", "throughput": 2311.5, "total_tokens": 31919624} {"current_steps": 55330, "total_steps": 67140, "loss": 0.4951, "lr": 4.567152770550412e-06, "epoch": 8.240988978254395, "percentage": 82.41, "elapsed_time": "3:50:10", "remaining_time": "0:49:07", "throughput": 2311.52, "total_tokens": 31922472} {"current_steps": 55335, "total_steps": 67140, "loss": 0.5741, "lr": 4.563408875251882e-06, "epoch": 8.241733690795353, "percentage": 82.42, "elapsed_time": "3:50:11", "remaining_time": "0:49:06", "throughput": 2311.53, "total_tokens": 31925128} {"current_steps": 55340, "total_steps": 67140, "loss": 0.6572, "lr": 4.5596663609750904e-06, "epoch": 8.242478403336312, "percentage": 82.42, "elapsed_time": "3:50:12", "remaining_time": "0:49:05", "throughput": 2311.55, "total_tokens": 31928136} {"current_steps": 55345, "total_steps": 67140, "loss": 0.7077, "lr": 4.555925227972946e-06, "epoch": 8.24322311587727, "percentage": 82.43, "elapsed_time": "3:50:13", "remaining_time": "0:49:03", "throughput": 2311.56, "total_tokens": 31930856} {"current_steps": 55350, "total_steps": 67140, "loss": 0.5317, "lr": 4.552185476498252e-06, "epoch": 8.243967828418231, "percentage": 82.44, "elapsed_time": "3:50:14", "remaining_time": "0:49:02", "throughput": 2311.58, "total_tokens": 31933640} {"current_steps": 55355, "total_steps": 67140, "loss": 0.4824, "lr": 4.5484471068037275e-06, "epoch": 8.24471254095919, "percentage": 82.45, "elapsed_time": "3:50:15", "remaining_time": "0:49:01", "throughput": 2311.6, "total_tokens": 31936744} {"current_steps": 55360, "total_steps": 67140, "loss": 0.3992, "lr": 4.544710119141996e-06, "epoch": 8.245457253500149, "percentage": 82.45, "elapsed_time": "3:50:16", "remaining_time": "0:49:00", "throughput": 2311.62, "total_tokens": 31939624} {"current_steps": 55365, "total_steps": 67140, "loss": 0.5561, "lr": 4.540974513765597e-06, "epoch": 8.246201966041108, "percentage": 82.46, "elapsed_time": "3:50:18", "remaining_time": "0:48:58", "throughput": 2311.65, "total_tokens": 31942696} {"current_steps": 55370, "total_steps": 67140, "loss": 0.6425, "lr": 4.537240290926955e-06, "epoch": 8.246946678582066, "percentage": 82.47, "elapsed_time": "3:50:19", "remaining_time": "0:48:57", "throughput": 2311.68, "total_tokens": 31945736} {"current_steps": 55375, "total_steps": 67140, "loss": 0.4568, "lr": 4.5335074508784185e-06, "epoch": 8.247691391123027, "percentage": 82.48, "elapsed_time": "3:50:20", "remaining_time": "0:48:56", "throughput": 2311.69, "total_tokens": 31948456} {"current_steps": 55380, "total_steps": 67140, "loss": 0.6621, "lr": 4.529775993872237e-06, "epoch": 8.248436103663986, "percentage": 82.48, "elapsed_time": "3:50:21", "remaining_time": "0:48:55", "throughput": 2311.72, "total_tokens": 31951496} {"current_steps": 55385, "total_steps": 67140, "loss": 0.5752, "lr": 4.526045920160574e-06, "epoch": 8.249180816204944, "percentage": 82.49, "elapsed_time": "3:50:22", "remaining_time": "0:48:53", "throughput": 2311.72, "total_tokens": 31954152} {"current_steps": 55390, "total_steps": 67140, "loss": 0.5557, "lr": 4.522317229995479e-06, "epoch": 8.249925528745903, "percentage": 82.5, "elapsed_time": "3:50:23", "remaining_time": "0:48:52", "throughput": 2311.74, "total_tokens": 31956968} {"current_steps": 55395, "total_steps": 67140, "loss": 0.5859, "lr": 4.518589923628932e-06, "epoch": 8.250670241286864, "percentage": 82.51, "elapsed_time": "3:50:24", "remaining_time": "0:48:51", "throughput": 2311.76, "total_tokens": 31959784} {"current_steps": 55400, "total_steps": 67140, "loss": 0.687, "lr": 4.514864001312813e-06, "epoch": 8.251414953827823, "percentage": 82.51, "elapsed_time": "3:50:26", "remaining_time": "0:48:49", "throughput": 2311.77, "total_tokens": 31962600} {"current_steps": 55405, "total_steps": 67140, "loss": 0.5384, "lr": 4.511139463298891e-06, "epoch": 8.252159666368781, "percentage": 82.52, "elapsed_time": "3:50:27", "remaining_time": "0:48:48", "throughput": 2311.79, "total_tokens": 31965544} {"current_steps": 55410, "total_steps": 67140, "loss": 0.4831, "lr": 4.507416309838861e-06, "epoch": 8.25290437890974, "percentage": 82.53, "elapsed_time": "3:50:28", "remaining_time": "0:48:47", "throughput": 2311.8, "total_tokens": 31968264} {"current_steps": 55415, "total_steps": 67140, "loss": 0.8099, "lr": 4.503694541184322e-06, "epoch": 8.2536490914507, "percentage": 82.54, "elapsed_time": "3:50:29", "remaining_time": "0:48:46", "throughput": 2311.82, "total_tokens": 31971016} {"current_steps": 55420, "total_steps": 67140, "loss": 0.5361, "lr": 4.499974157586773e-06, "epoch": 8.25439380399166, "percentage": 82.54, "elapsed_time": "3:50:30", "remaining_time": "0:48:44", "throughput": 2311.85, "total_tokens": 31974152} {"current_steps": 55425, "total_steps": 67140, "loss": 0.5068, "lr": 4.49625515929763e-06, "epoch": 8.255138516532618, "percentage": 82.55, "elapsed_time": "3:50:31", "remaining_time": "0:48:43", "throughput": 2311.86, "total_tokens": 31976936} {"current_steps": 55430, "total_steps": 67140, "loss": 0.5122, "lr": 4.492537546568196e-06, "epoch": 8.255883229073577, "percentage": 82.56, "elapsed_time": "3:50:32", "remaining_time": "0:48:42", "throughput": 2311.88, "total_tokens": 31979784} {"current_steps": 55435, "total_steps": 67140, "loss": 0.447, "lr": 4.488821319649702e-06, "epoch": 8.256627941614537, "percentage": 82.57, "elapsed_time": "3:50:33", "remaining_time": "0:48:41", "throughput": 2311.89, "total_tokens": 31982440} {"current_steps": 55440, "total_steps": 67140, "loss": 0.5195, "lr": 4.485106478793266e-06, "epoch": 8.257372654155496, "percentage": 82.57, "elapsed_time": "3:50:35", "remaining_time": "0:48:39", "throughput": 2311.91, "total_tokens": 31985448} {"current_steps": 55445, "total_steps": 67140, "loss": 0.471, "lr": 4.481393024249925e-06, "epoch": 8.258117366696455, "percentage": 82.58, "elapsed_time": "3:50:36", "remaining_time": "0:48:38", "throughput": 2311.94, "total_tokens": 31988488} {"current_steps": 55450, "total_steps": 67140, "loss": 0.6228, "lr": 4.477680956270621e-06, "epoch": 8.258862079237414, "percentage": 82.59, "elapsed_time": "3:50:37", "remaining_time": "0:48:37", "throughput": 2311.96, "total_tokens": 31991432} {"current_steps": 55455, "total_steps": 67140, "loss": 0.5691, "lr": 4.4739702751062015e-06, "epoch": 8.259606791778374, "percentage": 82.6, "elapsed_time": "3:50:38", "remaining_time": "0:48:35", "throughput": 2311.99, "total_tokens": 31994408} {"current_steps": 55460, "total_steps": 67140, "loss": 0.7098, "lr": 4.470260981007418e-06, "epoch": 8.260351504319333, "percentage": 82.6, "elapsed_time": "3:50:39", "remaining_time": "0:48:34", "throughput": 2312.0, "total_tokens": 31997192} {"current_steps": 55465, "total_steps": 67140, "loss": 0.6736, "lr": 4.466553074224936e-06, "epoch": 8.261096216860292, "percentage": 82.61, "elapsed_time": "3:50:40", "remaining_time": "0:48:33", "throughput": 2312.01, "total_tokens": 31999848} {"current_steps": 55470, "total_steps": 67140, "loss": 0.7255, "lr": 4.462846555009312e-06, "epoch": 8.26184092940125, "percentage": 82.62, "elapsed_time": "3:50:41", "remaining_time": "0:48:32", "throughput": 2312.03, "total_tokens": 32002856} {"current_steps": 55475, "total_steps": 67140, "loss": 0.4939, "lr": 4.459141423611016e-06, "epoch": 8.262585641942211, "percentage": 82.63, "elapsed_time": "3:50:42", "remaining_time": "0:48:30", "throughput": 2312.05, "total_tokens": 32005640} {"current_steps": 55480, "total_steps": 67140, "loss": 0.6014, "lr": 4.455437680280427e-06, "epoch": 8.26333035448317, "percentage": 82.63, "elapsed_time": "3:50:44", "remaining_time": "0:48:29", "throughput": 2312.06, "total_tokens": 32008488} {"current_steps": 55485, "total_steps": 67140, "loss": 0.6246, "lr": 4.451735325267836e-06, "epoch": 8.264075067024129, "percentage": 82.64, "elapsed_time": "3:50:45", "remaining_time": "0:48:28", "throughput": 2312.08, "total_tokens": 32011368} {"current_steps": 55490, "total_steps": 67140, "loss": 0.5814, "lr": 4.448034358823424e-06, "epoch": 8.264819779565087, "percentage": 82.65, "elapsed_time": "3:50:46", "remaining_time": "0:48:27", "throughput": 2312.1, "total_tokens": 32014312} {"current_steps": 55495, "total_steps": 67140, "loss": 0.5576, "lr": 4.444334781197301e-06, "epoch": 8.265564492106048, "percentage": 82.66, "elapsed_time": "3:50:47", "remaining_time": "0:48:25", "throughput": 2312.13, "total_tokens": 32017480} {"current_steps": 55500, "total_steps": 67140, "loss": 0.553, "lr": 4.440636592639452e-06, "epoch": 8.266309204647007, "percentage": 82.66, "elapsed_time": "3:50:48", "remaining_time": "0:48:24", "throughput": 2312.18, "total_tokens": 32020936} {"current_steps": 55505, "total_steps": 67140, "loss": 0.4656, "lr": 4.436939793399803e-06, "epoch": 8.267053917187965, "percentage": 82.67, "elapsed_time": "3:50:49", "remaining_time": "0:48:23", "throughput": 2312.19, "total_tokens": 32023656} {"current_steps": 55510, "total_steps": 67140, "loss": 0.4249, "lr": 4.433244383728149e-06, "epoch": 8.267798629728924, "percentage": 82.68, "elapsed_time": "3:50:51", "remaining_time": "0:48:21", "throughput": 2312.22, "total_tokens": 32026760} {"current_steps": 55515, "total_steps": 67140, "loss": 0.6637, "lr": 4.429550363874224e-06, "epoch": 8.268543342269885, "percentage": 82.69, "elapsed_time": "3:50:52", "remaining_time": "0:48:20", "throughput": 2312.24, "total_tokens": 32029544} {"current_steps": 55520, "total_steps": 67140, "loss": 0.5189, "lr": 4.4258577340876514e-06, "epoch": 8.269288054810843, "percentage": 82.69, "elapsed_time": "3:50:53", "remaining_time": "0:48:19", "throughput": 2312.26, "total_tokens": 32032488} {"current_steps": 55525, "total_steps": 67140, "loss": 0.7053, "lr": 4.422166494617966e-06, "epoch": 8.270032767351802, "percentage": 82.7, "elapsed_time": "3:50:54", "remaining_time": "0:48:18", "throughput": 2312.28, "total_tokens": 32035528} {"current_steps": 55530, "total_steps": 67140, "loss": 0.6664, "lr": 4.418476645714609e-06, "epoch": 8.270777479892761, "percentage": 82.71, "elapsed_time": "3:50:55", "remaining_time": "0:48:16", "throughput": 2312.32, "total_tokens": 32038696} {"current_steps": 55535, "total_steps": 67140, "loss": 0.6017, "lr": 4.414788187626917e-06, "epoch": 8.271522192433721, "percentage": 82.72, "elapsed_time": "3:50:56", "remaining_time": "0:48:15", "throughput": 2312.34, "total_tokens": 32041640} {"current_steps": 55540, "total_steps": 67140, "loss": 0.5, "lr": 4.411101120604147e-06, "epoch": 8.27226690497468, "percentage": 82.72, "elapsed_time": "3:50:57", "remaining_time": "0:48:14", "throughput": 2312.36, "total_tokens": 32044520} {"current_steps": 55545, "total_steps": 67140, "loss": 0.6308, "lr": 4.40741544489546e-06, "epoch": 8.273011617515639, "percentage": 82.73, "elapsed_time": "3:50:59", "remaining_time": "0:48:13", "throughput": 2312.38, "total_tokens": 32047592} {"current_steps": 55550, "total_steps": 67140, "loss": 0.6417, "lr": 4.403731160749907e-06, "epoch": 8.273756330056598, "percentage": 82.74, "elapsed_time": "3:51:00", "remaining_time": "0:48:11", "throughput": 2312.39, "total_tokens": 32050120} {"current_steps": 55555, "total_steps": 67140, "loss": 0.4822, "lr": 4.400048268416465e-06, "epoch": 8.274501042597556, "percentage": 82.75, "elapsed_time": "3:51:01", "remaining_time": "0:48:10", "throughput": 2312.41, "total_tokens": 32053160} {"current_steps": 55560, "total_steps": 67140, "loss": 0.5794, "lr": 4.396366768144009e-06, "epoch": 8.275245755138517, "percentage": 82.75, "elapsed_time": "3:51:02", "remaining_time": "0:48:09", "throughput": 2312.42, "total_tokens": 32055848} {"current_steps": 55565, "total_steps": 67140, "loss": 0.7086, "lr": 4.3926866601813224e-06, "epoch": 8.275990467679476, "percentage": 82.76, "elapsed_time": "3:51:03", "remaining_time": "0:48:07", "throughput": 2312.44, "total_tokens": 32058632} {"current_steps": 55570, "total_steps": 67140, "loss": 0.7887, "lr": 4.389007944777082e-06, "epoch": 8.276735180220435, "percentage": 82.77, "elapsed_time": "3:51:04", "remaining_time": "0:48:06", "throughput": 2312.44, "total_tokens": 32061256} {"current_steps": 55575, "total_steps": 67140, "loss": 0.4663, "lr": 4.385330622179887e-06, "epoch": 8.277479892761393, "percentage": 82.77, "elapsed_time": "3:51:05", "remaining_time": "0:48:05", "throughput": 2312.47, "total_tokens": 32064392} {"current_steps": 55580, "total_steps": 67140, "loss": 0.6746, "lr": 4.3816546926382345e-06, "epoch": 8.278224605302354, "percentage": 82.78, "elapsed_time": "3:51:07", "remaining_time": "0:48:04", "throughput": 2312.49, "total_tokens": 32067368} {"current_steps": 55585, "total_steps": 67140, "loss": 0.7819, "lr": 4.377980156400538e-06, "epoch": 8.278969317843313, "percentage": 82.79, "elapsed_time": "3:51:08", "remaining_time": "0:48:02", "throughput": 2312.52, "total_tokens": 32070344} {"current_steps": 55590, "total_steps": 67140, "loss": 0.7002, "lr": 4.374307013715093e-06, "epoch": 8.279714030384271, "percentage": 82.8, "elapsed_time": "3:51:09", "remaining_time": "0:48:01", "throughput": 2312.53, "total_tokens": 32073096} {"current_steps": 55595, "total_steps": 67140, "loss": 0.5081, "lr": 4.370635264830122e-06, "epoch": 8.28045874292523, "percentage": 82.8, "elapsed_time": "3:51:10", "remaining_time": "0:48:00", "throughput": 2312.56, "total_tokens": 32076296} {"current_steps": 55600, "total_steps": 67140, "loss": 0.6206, "lr": 4.366964909993751e-06, "epoch": 8.28120345546619, "percentage": 82.81, "elapsed_time": "3:51:11", "remaining_time": "0:47:59", "throughput": 2312.57, "total_tokens": 32078984} {"current_steps": 55605, "total_steps": 67140, "loss": 0.3788, "lr": 4.363295949453999e-06, "epoch": 8.28194816800715, "percentage": 82.82, "elapsed_time": "3:51:12", "remaining_time": "0:47:57", "throughput": 2312.58, "total_tokens": 32081736} {"current_steps": 55610, "total_steps": 67140, "loss": 0.5751, "lr": 4.3596283834588054e-06, "epoch": 8.282692880548108, "percentage": 82.83, "elapsed_time": "3:51:13", "remaining_time": "0:47:56", "throughput": 2312.6, "total_tokens": 32084744} {"current_steps": 55615, "total_steps": 67140, "loss": 0.6418, "lr": 4.355962212256006e-06, "epoch": 8.283437593089067, "percentage": 82.83, "elapsed_time": "3:51:15", "remaining_time": "0:47:55", "throughput": 2312.63, "total_tokens": 32087720} {"current_steps": 55620, "total_steps": 67140, "loss": 0.6915, "lr": 4.3522974360933475e-06, "epoch": 8.284182305630027, "percentage": 82.84, "elapsed_time": "3:51:16", "remaining_time": "0:47:54", "throughput": 2312.64, "total_tokens": 32090504} {"current_steps": 55625, "total_steps": 67140, "loss": 0.5437, "lr": 4.348634055218489e-06, "epoch": 8.284927018170986, "percentage": 82.85, "elapsed_time": "3:51:17", "remaining_time": "0:47:52", "throughput": 2312.67, "total_tokens": 32093640} {"current_steps": 55630, "total_steps": 67140, "loss": 0.5182, "lr": 4.34497206987897e-06, "epoch": 8.285671730711945, "percentage": 82.86, "elapsed_time": "3:51:18", "remaining_time": "0:47:51", "throughput": 2312.69, "total_tokens": 32096552} {"current_steps": 55635, "total_steps": 67140, "loss": 0.5916, "lr": 4.3413114803222685e-06, "epoch": 8.286416443252904, "percentage": 82.86, "elapsed_time": "3:51:19", "remaining_time": "0:47:50", "throughput": 2312.71, "total_tokens": 32099368} {"current_steps": 55640, "total_steps": 67140, "loss": 0.5321, "lr": 4.33765228679574e-06, "epoch": 8.287161155793864, "percentage": 82.87, "elapsed_time": "3:51:20", "remaining_time": "0:47:48", "throughput": 2312.72, "total_tokens": 32102152} {"current_steps": 55645, "total_steps": 67140, "loss": 0.6225, "lr": 4.333994489546661e-06, "epoch": 8.287905868334823, "percentage": 82.88, "elapsed_time": "3:51:21", "remaining_time": "0:47:47", "throughput": 2312.75, "total_tokens": 32105192} {"current_steps": 55650, "total_steps": 67140, "loss": 0.6945, "lr": 4.330338088822214e-06, "epoch": 8.288650580875782, "percentage": 82.89, "elapsed_time": "3:51:23", "remaining_time": "0:47:46", "throughput": 2312.77, "total_tokens": 32108264} {"current_steps": 55655, "total_steps": 67140, "loss": 0.641, "lr": 4.3266830848694815e-06, "epoch": 8.28939529341674, "percentage": 82.89, "elapsed_time": "3:51:24", "remaining_time": "0:47:45", "throughput": 2312.79, "total_tokens": 32111112} {"current_steps": 55660, "total_steps": 67140, "loss": 0.3633, "lr": 4.3230294779354615e-06, "epoch": 8.290140005957701, "percentage": 82.9, "elapsed_time": "3:51:25", "remaining_time": "0:47:43", "throughput": 2312.83, "total_tokens": 32114472} {"current_steps": 55665, "total_steps": 67140, "loss": 0.5597, "lr": 4.319377268267035e-06, "epoch": 8.29088471849866, "percentage": 82.91, "elapsed_time": "3:51:26", "remaining_time": "0:47:42", "throughput": 2312.86, "total_tokens": 32117544} {"current_steps": 55670, "total_steps": 67140, "loss": 0.6796, "lr": 4.315726456111022e-06, "epoch": 8.291629431039619, "percentage": 82.92, "elapsed_time": "3:51:27", "remaining_time": "0:47:41", "throughput": 2312.88, "total_tokens": 32120360} {"current_steps": 55675, "total_steps": 67140, "loss": 0.7119, "lr": 4.312077041714108e-06, "epoch": 8.292374143580577, "percentage": 82.92, "elapsed_time": "3:51:28", "remaining_time": "0:47:40", "throughput": 2312.9, "total_tokens": 32123304} {"current_steps": 55680, "total_steps": 67140, "loss": 0.4746, "lr": 4.3084290253229185e-06, "epoch": 8.293118856121538, "percentage": 82.93, "elapsed_time": "3:51:29", "remaining_time": "0:47:38", "throughput": 2312.93, "total_tokens": 32126568} {"current_steps": 55685, "total_steps": 67140, "loss": 0.6076, "lr": 4.304782407183971e-06, "epoch": 8.293863568662497, "percentage": 82.94, "elapsed_time": "3:51:31", "remaining_time": "0:47:37", "throughput": 2312.95, "total_tokens": 32129416} {"current_steps": 55690, "total_steps": 67140, "loss": 0.4903, "lr": 4.3011371875436856e-06, "epoch": 8.294608281203455, "percentage": 82.95, "elapsed_time": "3:51:32", "remaining_time": "0:47:36", "throughput": 2312.97, "total_tokens": 32132232} {"current_steps": 55695, "total_steps": 67140, "loss": 0.6045, "lr": 4.2974933666484e-06, "epoch": 8.295352993744414, "percentage": 82.95, "elapsed_time": "3:51:33", "remaining_time": "0:47:35", "throughput": 2313.0, "total_tokens": 32135400} {"current_steps": 55700, "total_steps": 67140, "loss": 0.5914, "lr": 4.293850944744337e-06, "epoch": 8.296097706285375, "percentage": 82.96, "elapsed_time": "3:51:34", "remaining_time": "0:47:33", "throughput": 2313.01, "total_tokens": 32138088} {"current_steps": 55705, "total_steps": 67140, "loss": 0.9033, "lr": 4.290209922077643e-06, "epoch": 8.296842418826333, "percentage": 82.97, "elapsed_time": "3:51:35", "remaining_time": "0:47:32", "throughput": 2313.03, "total_tokens": 32141064} {"current_steps": 55710, "total_steps": 67140, "loss": 0.5131, "lr": 4.286570298894365e-06, "epoch": 8.297587131367292, "percentage": 82.98, "elapsed_time": "3:51:36", "remaining_time": "0:47:31", "throughput": 2313.05, "total_tokens": 32143848} {"current_steps": 55715, "total_steps": 67140, "loss": 0.4981, "lr": 4.282932075440449e-06, "epoch": 8.298331843908251, "percentage": 82.98, "elapsed_time": "3:51:37", "remaining_time": "0:47:29", "throughput": 2313.06, "total_tokens": 32146696} {"current_steps": 55720, "total_steps": 67140, "loss": 0.5547, "lr": 4.279295251961754e-06, "epoch": 8.299076556449211, "percentage": 82.99, "elapsed_time": "3:51:39", "remaining_time": "0:47:28", "throughput": 2313.09, "total_tokens": 32149896} {"current_steps": 55725, "total_steps": 67140, "loss": 0.6984, "lr": 4.27565982870404e-06, "epoch": 8.29982126899017, "percentage": 83.0, "elapsed_time": "3:51:40", "remaining_time": "0:47:27", "throughput": 2313.12, "total_tokens": 32152872} {"current_steps": 55730, "total_steps": 67140, "loss": 0.6577, "lr": 4.272025805912982e-06, "epoch": 8.300565981531129, "percentage": 83.01, "elapsed_time": "3:51:41", "remaining_time": "0:47:26", "throughput": 2313.13, "total_tokens": 32155592} {"current_steps": 55735, "total_steps": 67140, "loss": 0.4833, "lr": 4.26839318383414e-06, "epoch": 8.301310694072088, "percentage": 83.01, "elapsed_time": "3:51:42", "remaining_time": "0:47:24", "throughput": 2313.14, "total_tokens": 32158312} {"current_steps": 55740, "total_steps": 67140, "loss": 0.4951, "lr": 4.2647619627129986e-06, "epoch": 8.302055406613047, "percentage": 83.02, "elapsed_time": "3:51:43", "remaining_time": "0:47:23", "throughput": 2313.15, "total_tokens": 32161096} {"current_steps": 55745, "total_steps": 67140, "loss": 0.587, "lr": 4.261132142794941e-06, "epoch": 8.302800119154007, "percentage": 83.03, "elapsed_time": "3:51:44", "remaining_time": "0:47:22", "throughput": 2313.17, "total_tokens": 32163880} {"current_steps": 55750, "total_steps": 67140, "loss": 0.6583, "lr": 4.25750372432526e-06, "epoch": 8.303544831694966, "percentage": 83.04, "elapsed_time": "3:51:45", "remaining_time": "0:47:21", "throughput": 2313.18, "total_tokens": 32166696} {"current_steps": 55755, "total_steps": 67140, "loss": 0.3958, "lr": 4.2538767075491394e-06, "epoch": 8.304289544235925, "percentage": 83.04, "elapsed_time": "3:51:46", "remaining_time": "0:47:19", "throughput": 2313.2, "total_tokens": 32169512} {"current_steps": 55760, "total_steps": 67140, "loss": 0.5294, "lr": 4.250251092711682e-06, "epoch": 8.305034256776883, "percentage": 83.05, "elapsed_time": "3:51:48", "remaining_time": "0:47:18", "throughput": 2313.2, "total_tokens": 32172200} {"current_steps": 55765, "total_steps": 67140, "loss": 0.605, "lr": 4.2466268800579026e-06, "epoch": 8.305778969317844, "percentage": 83.06, "elapsed_time": "3:51:49", "remaining_time": "0:47:17", "throughput": 2313.21, "total_tokens": 32174952} {"current_steps": 55770, "total_steps": 67140, "loss": 0.6107, "lr": 4.243004069832693e-06, "epoch": 8.306523681858803, "percentage": 83.07, "elapsed_time": "3:51:50", "remaining_time": "0:47:15", "throughput": 2313.23, "total_tokens": 32177768} {"current_steps": 55775, "total_steps": 67140, "loss": 0.4727, "lr": 4.239382662280875e-06, "epoch": 8.307268394399761, "percentage": 83.07, "elapsed_time": "3:51:51", "remaining_time": "0:47:14", "throughput": 2313.25, "total_tokens": 32180648} {"current_steps": 55780, "total_steps": 67140, "loss": 0.6771, "lr": 4.235762657647172e-06, "epoch": 8.30801310694072, "percentage": 83.08, "elapsed_time": "3:51:52", "remaining_time": "0:47:13", "throughput": 2313.26, "total_tokens": 32183400} {"current_steps": 55785, "total_steps": 67140, "loss": 0.772, "lr": 4.232144056176207e-06, "epoch": 8.30875781948168, "percentage": 83.09, "elapsed_time": "3:51:53", "remaining_time": "0:47:12", "throughput": 2313.27, "total_tokens": 32186120} {"current_steps": 55790, "total_steps": 67140, "loss": 0.6762, "lr": 4.2285268581125165e-06, "epoch": 8.30950253202264, "percentage": 83.1, "elapsed_time": "3:51:54", "remaining_time": "0:47:10", "throughput": 2313.28, "total_tokens": 32188776} {"current_steps": 55795, "total_steps": 67140, "loss": 0.5605, "lr": 4.224911063700526e-06, "epoch": 8.310247244563598, "percentage": 83.1, "elapsed_time": "3:51:55", "remaining_time": "0:47:09", "throughput": 2313.3, "total_tokens": 32191752} {"current_steps": 55800, "total_steps": 67140, "loss": 0.6045, "lr": 4.221296673184585e-06, "epoch": 8.310991957104557, "percentage": 83.11, "elapsed_time": "3:51:57", "remaining_time": "0:47:08", "throughput": 2313.32, "total_tokens": 32194664} {"current_steps": 55805, "total_steps": 67140, "loss": 0.644, "lr": 4.217683686808929e-06, "epoch": 8.311736669645517, "percentage": 83.12, "elapsed_time": "3:51:58", "remaining_time": "0:47:07", "throughput": 2313.33, "total_tokens": 32197384} {"current_steps": 55810, "total_steps": 67140, "loss": 0.4391, "lr": 4.214072104817715e-06, "epoch": 8.312481382186476, "percentage": 83.12, "elapsed_time": "3:51:59", "remaining_time": "0:47:05", "throughput": 2313.35, "total_tokens": 32200360} {"current_steps": 55815, "total_steps": 67140, "loss": 0.4164, "lr": 4.2104619274549975e-06, "epoch": 8.313226094727435, "percentage": 83.13, "elapsed_time": "3:52:00", "remaining_time": "0:47:04", "throughput": 2313.37, "total_tokens": 32203304} {"current_steps": 55820, "total_steps": 67140, "loss": 0.6864, "lr": 4.2068531549647405e-06, "epoch": 8.313970807268394, "percentage": 83.14, "elapsed_time": "3:52:01", "remaining_time": "0:47:03", "throughput": 2313.39, "total_tokens": 32206152} {"current_steps": 55825, "total_steps": 67140, "loss": 0.3545, "lr": 4.203245787590815e-06, "epoch": 8.314715519809354, "percentage": 83.15, "elapsed_time": "3:52:02", "remaining_time": "0:47:01", "throughput": 2313.4, "total_tokens": 32208968} {"current_steps": 55830, "total_steps": 67140, "loss": 0.6074, "lr": 4.199639825576979e-06, "epoch": 8.315460232350313, "percentage": 83.15, "elapsed_time": "3:52:03", "remaining_time": "0:47:00", "throughput": 2313.44, "total_tokens": 32212232} {"current_steps": 55835, "total_steps": 67140, "loss": 0.5477, "lr": 4.196035269166921e-06, "epoch": 8.316204944891272, "percentage": 83.16, "elapsed_time": "3:52:05", "remaining_time": "0:46:59", "throughput": 2313.46, "total_tokens": 32215080} {"current_steps": 55840, "total_steps": 67140, "loss": 0.6154, "lr": 4.192432118604209e-06, "epoch": 8.31694965743223, "percentage": 83.17, "elapsed_time": "3:52:06", "remaining_time": "0:46:58", "throughput": 2313.48, "total_tokens": 32218120} {"current_steps": 55845, "total_steps": 67140, "loss": 0.6253, "lr": 4.188830374132341e-06, "epoch": 8.317694369973191, "percentage": 83.18, "elapsed_time": "3:52:07", "remaining_time": "0:46:56", "throughput": 2313.5, "total_tokens": 32220968} {"current_steps": 55850, "total_steps": 67140, "loss": 0.5523, "lr": 4.1852300359946996e-06, "epoch": 8.31843908251415, "percentage": 83.18, "elapsed_time": "3:52:08", "remaining_time": "0:46:55", "throughput": 2313.51, "total_tokens": 32223720} {"current_steps": 55855, "total_steps": 67140, "loss": 0.5498, "lr": 4.181631104434588e-06, "epoch": 8.319183795055109, "percentage": 83.19, "elapsed_time": "3:52:09", "remaining_time": "0:46:54", "throughput": 2313.53, "total_tokens": 32226696} {"current_steps": 55860, "total_steps": 67140, "loss": 0.7335, "lr": 4.178033579695212e-06, "epoch": 8.319928507596067, "percentage": 83.2, "elapsed_time": "3:52:10", "remaining_time": "0:46:53", "throughput": 2313.55, "total_tokens": 32229608} {"current_steps": 55865, "total_steps": 67140, "loss": 0.3609, "lr": 4.174437462019665e-06, "epoch": 8.320673220137028, "percentage": 83.21, "elapsed_time": "3:52:11", "remaining_time": "0:46:51", "throughput": 2313.59, "total_tokens": 32232808} {"current_steps": 55870, "total_steps": 67140, "loss": 0.5852, "lr": 4.170842751650969e-06, "epoch": 8.321417932677987, "percentage": 83.21, "elapsed_time": "3:52:13", "remaining_time": "0:46:50", "throughput": 2313.6, "total_tokens": 32235560} {"current_steps": 55875, "total_steps": 67140, "loss": 0.5109, "lr": 4.167249448832028e-06, "epoch": 8.322162645218945, "percentage": 83.22, "elapsed_time": "3:52:14", "remaining_time": "0:46:49", "throughput": 2313.62, "total_tokens": 32238504} {"current_steps": 55880, "total_steps": 67140, "loss": 0.4527, "lr": 4.163657553805669e-06, "epoch": 8.322907357759904, "percentage": 83.23, "elapsed_time": "3:52:15", "remaining_time": "0:46:48", "throughput": 2313.62, "total_tokens": 32241064} {"current_steps": 55885, "total_steps": 67140, "loss": 0.6417, "lr": 4.160067066814619e-06, "epoch": 8.323652070300863, "percentage": 83.24, "elapsed_time": "3:52:16", "remaining_time": "0:46:46", "throughput": 2313.63, "total_tokens": 32243816} {"current_steps": 55890, "total_steps": 67140, "loss": 0.5793, "lr": 4.156477988101507e-06, "epoch": 8.324396782841823, "percentage": 83.24, "elapsed_time": "3:52:17", "remaining_time": "0:46:45", "throughput": 2313.65, "total_tokens": 32246696} {"current_steps": 55895, "total_steps": 67140, "loss": 0.4778, "lr": 4.152890317908875e-06, "epoch": 8.325141495382782, "percentage": 83.25, "elapsed_time": "3:52:18", "remaining_time": "0:46:44", "throughput": 2313.67, "total_tokens": 32249544} {"current_steps": 55900, "total_steps": 67140, "loss": 0.4398, "lr": 4.149304056479153e-06, "epoch": 8.325886207923741, "percentage": 83.26, "elapsed_time": "3:52:19", "remaining_time": "0:46:42", "throughput": 2313.68, "total_tokens": 32252360} {"current_steps": 55905, "total_steps": 67140, "loss": 0.4232, "lr": 4.145719204054688e-06, "epoch": 8.3266309204647, "percentage": 83.27, "elapsed_time": "3:52:20", "remaining_time": "0:46:41", "throughput": 2313.69, "total_tokens": 32254888} {"current_steps": 55910, "total_steps": 67140, "loss": 0.5547, "lr": 4.1421357608777386e-06, "epoch": 8.32737563300566, "percentage": 83.27, "elapsed_time": "3:52:22", "remaining_time": "0:46:40", "throughput": 2313.7, "total_tokens": 32257768} {"current_steps": 55915, "total_steps": 67140, "loss": 0.6682, "lr": 4.138553727190447e-06, "epoch": 8.328120345546619, "percentage": 83.28, "elapsed_time": "3:52:23", "remaining_time": "0:46:39", "throughput": 2313.73, "total_tokens": 32260840} {"current_steps": 55920, "total_steps": 67140, "loss": 0.7031, "lr": 4.134973103234877e-06, "epoch": 8.328865058087578, "percentage": 83.29, "elapsed_time": "3:52:24", "remaining_time": "0:46:37", "throughput": 2313.76, "total_tokens": 32263976} {"current_steps": 55925, "total_steps": 67140, "loss": 0.4126, "lr": 4.131393889252996e-06, "epoch": 8.329609770628537, "percentage": 83.3, "elapsed_time": "3:52:25", "remaining_time": "0:46:36", "throughput": 2313.79, "total_tokens": 32267048} {"current_steps": 55930, "total_steps": 67140, "loss": 0.7403, "lr": 4.127816085486674e-06, "epoch": 8.330354483169497, "percentage": 83.3, "elapsed_time": "3:52:26", "remaining_time": "0:46:35", "throughput": 2313.8, "total_tokens": 32269832} {"current_steps": 55935, "total_steps": 67140, "loss": 0.6819, "lr": 4.124239692177675e-06, "epoch": 8.331099195710456, "percentage": 83.31, "elapsed_time": "3:52:27", "remaining_time": "0:46:34", "throughput": 2313.81, "total_tokens": 32272488} {"current_steps": 55940, "total_steps": 67140, "loss": 0.8253, "lr": 4.120664709567684e-06, "epoch": 8.331843908251415, "percentage": 83.32, "elapsed_time": "3:52:28", "remaining_time": "0:46:32", "throughput": 2313.83, "total_tokens": 32275400} {"current_steps": 55945, "total_steps": 67140, "loss": 0.4605, "lr": 4.117091137898282e-06, "epoch": 8.332588620792373, "percentage": 83.33, "elapsed_time": "3:52:30", "remaining_time": "0:46:31", "throughput": 2313.85, "total_tokens": 32278536} {"current_steps": 55950, "total_steps": 67140, "loss": 0.5346, "lr": 4.113518977410963e-06, "epoch": 8.333333333333334, "percentage": 83.33, "elapsed_time": "3:52:31", "remaining_time": "0:46:30", "throughput": 2313.88, "total_tokens": 32281544} {"current_steps": 55955, "total_steps": 67140, "loss": 0.5882, "lr": 4.109948228347108e-06, "epoch": 8.334078045874293, "percentage": 83.34, "elapsed_time": "3:52:32", "remaining_time": "0:46:28", "throughput": 2313.9, "total_tokens": 32284488} {"current_steps": 55960, "total_steps": 67140, "loss": 0.6, "lr": 4.1063788909480175e-06, "epoch": 8.334822758415251, "percentage": 83.35, "elapsed_time": "3:52:33", "remaining_time": "0:46:27", "throughput": 2313.91, "total_tokens": 32287080} {"current_steps": 55965, "total_steps": 67140, "loss": 0.6325, "lr": 4.102810965454904e-06, "epoch": 8.33556747095621, "percentage": 83.36, "elapsed_time": "3:52:34", "remaining_time": "0:46:26", "throughput": 2313.93, "total_tokens": 32289960} {"current_steps": 55970, "total_steps": 67140, "loss": 0.5845, "lr": 4.099244452108855e-06, "epoch": 8.33631218349717, "percentage": 83.36, "elapsed_time": "3:52:35", "remaining_time": "0:46:25", "throughput": 2313.94, "total_tokens": 32292776} {"current_steps": 55975, "total_steps": 67140, "loss": 0.4304, "lr": 4.0956793511508885e-06, "epoch": 8.33705689603813, "percentage": 83.37, "elapsed_time": "3:52:36", "remaining_time": "0:46:23", "throughput": 2313.97, "total_tokens": 32295784} {"current_steps": 55980, "total_steps": 67140, "loss": 0.5536, "lr": 4.092115662821921e-06, "epoch": 8.337801608579088, "percentage": 83.38, "elapsed_time": "3:52:37", "remaining_time": "0:46:22", "throughput": 2313.97, "total_tokens": 32298440} {"current_steps": 55985, "total_steps": 67140, "loss": 0.494, "lr": 4.088553387362773e-06, "epoch": 8.338546321120047, "percentage": 83.39, "elapsed_time": "3:52:39", "remaining_time": "0:46:21", "throughput": 2313.98, "total_tokens": 32301128} {"current_steps": 55990, "total_steps": 67140, "loss": 0.4743, "lr": 4.084992525014172e-06, "epoch": 8.339291033661008, "percentage": 83.39, "elapsed_time": "3:52:40", "remaining_time": "0:46:20", "throughput": 2314.01, "total_tokens": 32304136} {"current_steps": 55995, "total_steps": 67140, "loss": 0.7372, "lr": 4.081433076016739e-06, "epoch": 8.340035746201966, "percentage": 83.4, "elapsed_time": "3:52:41", "remaining_time": "0:46:18", "throughput": 2314.03, "total_tokens": 32307048} {"current_steps": 56000, "total_steps": 67140, "loss": 0.647, "lr": 4.077875040611015e-06, "epoch": 8.340780458742925, "percentage": 83.41, "elapsed_time": "3:52:42", "remaining_time": "0:46:17", "throughput": 2314.05, "total_tokens": 32310024} {"current_steps": 56005, "total_steps": 67140, "loss": 0.4921, "lr": 4.074318419037424e-06, "epoch": 8.341525171283884, "percentage": 83.42, "elapsed_time": "3:52:43", "remaining_time": "0:46:16", "throughput": 2314.06, "total_tokens": 32312840} {"current_steps": 56010, "total_steps": 67140, "loss": 0.4988, "lr": 4.070763211536319e-06, "epoch": 8.342269883824844, "percentage": 83.42, "elapsed_time": "3:52:44", "remaining_time": "0:46:15", "throughput": 2314.09, "total_tokens": 32315816} {"current_steps": 56015, "total_steps": 67140, "loss": 0.5593, "lr": 4.067209418347942e-06, "epoch": 8.343014596365803, "percentage": 83.43, "elapsed_time": "3:52:45", "remaining_time": "0:46:13", "throughput": 2314.09, "total_tokens": 32318472} {"current_steps": 56020, "total_steps": 67140, "loss": 0.4601, "lr": 4.063657039712448e-06, "epoch": 8.343759308906762, "percentage": 83.44, "elapsed_time": "3:52:47", "remaining_time": "0:46:12", "throughput": 2314.12, "total_tokens": 32321544} {"current_steps": 56025, "total_steps": 67140, "loss": 0.5229, "lr": 4.0601060758698965e-06, "epoch": 8.34450402144772, "percentage": 83.45, "elapsed_time": "3:52:48", "remaining_time": "0:46:11", "throughput": 2314.14, "total_tokens": 32324424} {"current_steps": 56030, "total_steps": 67140, "loss": 0.6278, "lr": 4.05655652706024e-06, "epoch": 8.345248733988681, "percentage": 83.45, "elapsed_time": "3:52:49", "remaining_time": "0:46:09", "throughput": 2314.16, "total_tokens": 32327304} {"current_steps": 56035, "total_steps": 67140, "loss": 0.4617, "lr": 4.053008393523336e-06, "epoch": 8.34599344652964, "percentage": 83.46, "elapsed_time": "3:52:50", "remaining_time": "0:46:08", "throughput": 2314.17, "total_tokens": 32330024} {"current_steps": 56040, "total_steps": 67140, "loss": 0.5321, "lr": 4.049461675498961e-06, "epoch": 8.346738159070599, "percentage": 83.47, "elapsed_time": "3:52:51", "remaining_time": "0:46:07", "throughput": 2314.18, "total_tokens": 32332680} {"current_steps": 56045, "total_steps": 67140, "loss": 0.5462, "lr": 4.045916373226791e-06, "epoch": 8.347482871611557, "percentage": 83.47, "elapsed_time": "3:52:52", "remaining_time": "0:46:06", "throughput": 2314.21, "total_tokens": 32335784} {"current_steps": 56050, "total_steps": 67140, "loss": 0.5363, "lr": 4.042372486946394e-06, "epoch": 8.348227584152518, "percentage": 83.48, "elapsed_time": "3:52:53", "remaining_time": "0:46:04", "throughput": 2314.23, "total_tokens": 32338888} {"current_steps": 56055, "total_steps": 67140, "loss": 0.7467, "lr": 4.03883001689726e-06, "epoch": 8.348972296693477, "percentage": 83.49, "elapsed_time": "3:52:55", "remaining_time": "0:46:03", "throughput": 2314.26, "total_tokens": 32341928} {"current_steps": 56060, "total_steps": 67140, "loss": 0.3423, "lr": 4.035288963318778e-06, "epoch": 8.349717009234435, "percentage": 83.5, "elapsed_time": "3:52:56", "remaining_time": "0:46:02", "throughput": 2314.27, "total_tokens": 32344552} {"current_steps": 56065, "total_steps": 67140, "loss": 0.6251, "lr": 4.031749326450224e-06, "epoch": 8.350461721775394, "percentage": 83.5, "elapsed_time": "3:52:57", "remaining_time": "0:46:01", "throughput": 2314.28, "total_tokens": 32347208} {"current_steps": 56070, "total_steps": 67140, "loss": 0.5176, "lr": 4.028211106530808e-06, "epoch": 8.351206434316353, "percentage": 83.51, "elapsed_time": "3:52:58", "remaining_time": "0:45:59", "throughput": 2314.31, "total_tokens": 32350376} {"current_steps": 56075, "total_steps": 67140, "loss": 0.5546, "lr": 4.024674303799611e-06, "epoch": 8.351951146857314, "percentage": 83.52, "elapsed_time": "3:52:59", "remaining_time": "0:45:58", "throughput": 2314.31, "total_tokens": 32353000} {"current_steps": 56080, "total_steps": 67140, "loss": 0.7842, "lr": 4.021138918495648e-06, "epoch": 8.352695859398272, "percentage": 83.53, "elapsed_time": "3:53:00", "remaining_time": "0:45:57", "throughput": 2314.33, "total_tokens": 32355816} {"current_steps": 56085, "total_steps": 67140, "loss": 0.4799, "lr": 4.017604950857823e-06, "epoch": 8.353440571939231, "percentage": 83.53, "elapsed_time": "3:53:01", "remaining_time": "0:45:55", "throughput": 2314.34, "total_tokens": 32358440} {"current_steps": 56090, "total_steps": 67140, "loss": 0.6221, "lr": 4.014072401124946e-06, "epoch": 8.35418528448019, "percentage": 83.54, "elapsed_time": "3:53:02", "remaining_time": "0:45:54", "throughput": 2314.35, "total_tokens": 32361128} {"current_steps": 56095, "total_steps": 67140, "loss": 0.6689, "lr": 4.0105412695357395e-06, "epoch": 8.35492999702115, "percentage": 83.55, "elapsed_time": "3:53:03", "remaining_time": "0:45:53", "throughput": 2314.37, "total_tokens": 32363944} {"current_steps": 56100, "total_steps": 67140, "loss": 0.694, "lr": 4.0070115563288105e-06, "epoch": 8.35567470956211, "percentage": 83.56, "elapsed_time": "3:53:05", "remaining_time": "0:45:52", "throughput": 2314.37, "total_tokens": 32366568} {"current_steps": 56105, "total_steps": 67140, "loss": 0.4159, "lr": 4.003483261742691e-06, "epoch": 8.356419422103068, "percentage": 83.56, "elapsed_time": "3:53:06", "remaining_time": "0:45:50", "throughput": 2314.39, "total_tokens": 32369352} {"current_steps": 56110, "total_steps": 67140, "loss": 0.6096, "lr": 3.999956386015813e-06, "epoch": 8.357164134644027, "percentage": 83.57, "elapsed_time": "3:53:07", "remaining_time": "0:45:49", "throughput": 2314.41, "total_tokens": 32372296} {"current_steps": 56115, "total_steps": 67140, "loss": 0.5621, "lr": 3.996430929386494e-06, "epoch": 8.357908847184987, "percentage": 83.58, "elapsed_time": "3:53:08", "remaining_time": "0:45:48", "throughput": 2314.43, "total_tokens": 32375176} {"current_steps": 56120, "total_steps": 67140, "loss": 0.6513, "lr": 3.992906892092979e-06, "epoch": 8.358653559725946, "percentage": 83.59, "elapsed_time": "3:53:09", "remaining_time": "0:45:47", "throughput": 2314.44, "total_tokens": 32377928} {"current_steps": 56125, "total_steps": 67140, "loss": 0.4744, "lr": 3.989384274373409e-06, "epoch": 8.359398272266905, "percentage": 83.59, "elapsed_time": "3:53:10", "remaining_time": "0:45:45", "throughput": 2314.46, "total_tokens": 32380776} {"current_steps": 56130, "total_steps": 67140, "loss": 0.5078, "lr": 3.985863076465835e-06, "epoch": 8.360142984807863, "percentage": 83.6, "elapsed_time": "3:53:11", "remaining_time": "0:45:44", "throughput": 2314.47, "total_tokens": 32383592} {"current_steps": 56135, "total_steps": 67140, "loss": 0.6889, "lr": 3.9823432986081876e-06, "epoch": 8.360887697348824, "percentage": 83.61, "elapsed_time": "3:53:12", "remaining_time": "0:45:43", "throughput": 2314.51, "total_tokens": 32386856} {"current_steps": 56140, "total_steps": 67140, "loss": 0.6394, "lr": 3.978824941038328e-06, "epoch": 8.361632409889783, "percentage": 83.62, "elapsed_time": "3:53:14", "remaining_time": "0:45:41", "throughput": 2314.52, "total_tokens": 32389608} {"current_steps": 56145, "total_steps": 67140, "loss": 0.7026, "lr": 3.975308003994016e-06, "epoch": 8.362377122430741, "percentage": 83.62, "elapsed_time": "3:53:15", "remaining_time": "0:45:40", "throughput": 2314.54, "total_tokens": 32392488} {"current_steps": 56150, "total_steps": 67140, "loss": 0.6118, "lr": 3.971792487712914e-06, "epoch": 8.3631218349717, "percentage": 83.63, "elapsed_time": "3:53:16", "remaining_time": "0:45:39", "throughput": 2314.58, "total_tokens": 32395784} {"current_steps": 56155, "total_steps": 67140, "loss": 0.5181, "lr": 3.968278392432573e-06, "epoch": 8.36386654751266, "percentage": 83.64, "elapsed_time": "3:53:17", "remaining_time": "0:45:38", "throughput": 2314.59, "total_tokens": 32398536} {"current_steps": 56160, "total_steps": 67140, "loss": 0.5225, "lr": 3.964765718390473e-06, "epoch": 8.36461126005362, "percentage": 83.65, "elapsed_time": "3:53:18", "remaining_time": "0:45:36", "throughput": 2314.6, "total_tokens": 32401224} {"current_steps": 56165, "total_steps": 67140, "loss": 0.5474, "lr": 3.961254465823985e-06, "epoch": 8.365355972594578, "percentage": 83.65, "elapsed_time": "3:53:19", "remaining_time": "0:45:35", "throughput": 2314.62, "total_tokens": 32404104} {"current_steps": 56170, "total_steps": 67140, "loss": 0.5302, "lr": 3.957744634970378e-06, "epoch": 8.366100685135537, "percentage": 83.66, "elapsed_time": "3:53:20", "remaining_time": "0:45:34", "throughput": 2314.64, "total_tokens": 32407016} {"current_steps": 56175, "total_steps": 67140, "loss": 0.3325, "lr": 3.954236226066838e-06, "epoch": 8.366845397676498, "percentage": 83.67, "elapsed_time": "3:53:22", "remaining_time": "0:45:33", "throughput": 2314.66, "total_tokens": 32410024} {"current_steps": 56180, "total_steps": 67140, "loss": 0.6058, "lr": 3.950729239350448e-06, "epoch": 8.367590110217456, "percentage": 83.68, "elapsed_time": "3:53:23", "remaining_time": "0:45:31", "throughput": 2314.68, "total_tokens": 32412872} {"current_steps": 56185, "total_steps": 67140, "loss": 0.6008, "lr": 3.947223675058195e-06, "epoch": 8.368334822758415, "percentage": 83.68, "elapsed_time": "3:53:24", "remaining_time": "0:45:30", "throughput": 2314.68, "total_tokens": 32415464} {"current_steps": 56190, "total_steps": 67140, "loss": 0.5479, "lr": 3.943719533426979e-06, "epoch": 8.369079535299374, "percentage": 83.69, "elapsed_time": "3:53:25", "remaining_time": "0:45:29", "throughput": 2314.71, "total_tokens": 32418600} {"current_steps": 56195, "total_steps": 67140, "loss": 0.6433, "lr": 3.940216814693587e-06, "epoch": 8.369824247840334, "percentage": 83.7, "elapsed_time": "3:53:26", "remaining_time": "0:45:28", "throughput": 2314.72, "total_tokens": 32421320} {"current_steps": 56200, "total_steps": 67140, "loss": 0.677, "lr": 3.936715519094716e-06, "epoch": 8.370568960381293, "percentage": 83.71, "elapsed_time": "3:53:27", "remaining_time": "0:45:26", "throughput": 2314.73, "total_tokens": 32424136} {"current_steps": 56205, "total_steps": 67140, "loss": 0.6591, "lr": 3.933215646866972e-06, "epoch": 8.371313672922252, "percentage": 83.71, "elapsed_time": "3:53:28", "remaining_time": "0:45:25", "throughput": 2314.75, "total_tokens": 32426952} {"current_steps": 56210, "total_steps": 67140, "loss": 0.4896, "lr": 3.929717198246862e-06, "epoch": 8.37205838546321, "percentage": 83.72, "elapsed_time": "3:53:29", "remaining_time": "0:45:24", "throughput": 2314.76, "total_tokens": 32429736} {"current_steps": 56215, "total_steps": 67140, "loss": 0.5683, "lr": 3.926220173470799e-06, "epoch": 8.372803098004171, "percentage": 83.73, "elapsed_time": "3:53:31", "remaining_time": "0:45:22", "throughput": 2314.79, "total_tokens": 32432904} {"current_steps": 56220, "total_steps": 67140, "loss": 0.5592, "lr": 3.9227245727750965e-06, "epoch": 8.37354781054513, "percentage": 83.74, "elapsed_time": "3:53:32", "remaining_time": "0:45:21", "throughput": 2314.8, "total_tokens": 32435528} {"current_steps": 56225, "total_steps": 67140, "loss": 0.5132, "lr": 3.919230396395981e-06, "epoch": 8.374292523086089, "percentage": 83.74, "elapsed_time": "3:53:33", "remaining_time": "0:45:20", "throughput": 2314.82, "total_tokens": 32438504} {"current_steps": 56230, "total_steps": 67140, "loss": 0.4314, "lr": 3.915737644569567e-06, "epoch": 8.375037235627047, "percentage": 83.75, "elapsed_time": "3:53:34", "remaining_time": "0:45:19", "throughput": 2314.84, "total_tokens": 32441480} {"current_steps": 56235, "total_steps": 67140, "loss": 0.5205, "lr": 3.912246317531873e-06, "epoch": 8.375781948168008, "percentage": 83.76, "elapsed_time": "3:53:35", "remaining_time": "0:45:17", "throughput": 2314.86, "total_tokens": 32444360} {"current_steps": 56240, "total_steps": 67140, "loss": 0.7459, "lr": 3.908756415518835e-06, "epoch": 8.376526660708967, "percentage": 83.77, "elapsed_time": "3:53:36", "remaining_time": "0:45:16", "throughput": 2314.9, "total_tokens": 32447528} {"current_steps": 56245, "total_steps": 67140, "loss": 0.5408, "lr": 3.905267938766291e-06, "epoch": 8.377271373249926, "percentage": 83.77, "elapsed_time": "3:53:37", "remaining_time": "0:45:15", "throughput": 2314.91, "total_tokens": 32450280} {"current_steps": 56250, "total_steps": 67140, "loss": 0.552, "lr": 3.901780887509973e-06, "epoch": 8.378016085790884, "percentage": 83.78, "elapsed_time": "3:53:39", "remaining_time": "0:45:14", "throughput": 2314.92, "total_tokens": 32453192} {"current_steps": 56255, "total_steps": 67140, "loss": 0.611, "lr": 3.898295261985524e-06, "epoch": 8.378760798331843, "percentage": 83.79, "elapsed_time": "3:53:40", "remaining_time": "0:45:12", "throughput": 2314.93, "total_tokens": 32455784} {"current_steps": 56260, "total_steps": 67140, "loss": 0.6484, "lr": 3.894811062428494e-06, "epoch": 8.379505510872804, "percentage": 83.8, "elapsed_time": "3:53:41", "remaining_time": "0:45:11", "throughput": 2314.96, "total_tokens": 32458888} {"current_steps": 56265, "total_steps": 67140, "loss": 0.6492, "lr": 3.8913282890743195e-06, "epoch": 8.380250223413762, "percentage": 83.8, "elapsed_time": "3:53:42", "remaining_time": "0:45:10", "throughput": 2314.97, "total_tokens": 32461608} {"current_steps": 56270, "total_steps": 67140, "loss": 0.7548, "lr": 3.887846942158363e-06, "epoch": 8.380994935954721, "percentage": 83.81, "elapsed_time": "3:53:43", "remaining_time": "0:45:09", "throughput": 2314.98, "total_tokens": 32464360} {"current_steps": 56275, "total_steps": 67140, "loss": 0.4719, "lr": 3.884367021915869e-06, "epoch": 8.38173964849568, "percentage": 83.82, "elapsed_time": "3:53:44", "remaining_time": "0:45:07", "throughput": 2315.0, "total_tokens": 32467304} {"current_steps": 56280, "total_steps": 67140, "loss": 0.4598, "lr": 3.880888528581999e-06, "epoch": 8.38248436103664, "percentage": 83.82, "elapsed_time": "3:53:45", "remaining_time": "0:45:06", "throughput": 2315.01, "total_tokens": 32469864} {"current_steps": 56285, "total_steps": 67140, "loss": 0.5279, "lr": 3.877411462391822e-06, "epoch": 8.3832290735776, "percentage": 83.83, "elapsed_time": "3:53:46", "remaining_time": "0:45:05", "throughput": 2315.02, "total_tokens": 32472648} {"current_steps": 56290, "total_steps": 67140, "loss": 0.6509, "lr": 3.873935823580299e-06, "epoch": 8.383973786118558, "percentage": 83.84, "elapsed_time": "3:53:48", "remaining_time": "0:45:03", "throughput": 2315.04, "total_tokens": 32475560} {"current_steps": 56295, "total_steps": 67140, "loss": 0.3503, "lr": 3.870461612382306e-06, "epoch": 8.384718498659517, "percentage": 83.85, "elapsed_time": "3:53:49", "remaining_time": "0:45:02", "throughput": 2315.06, "total_tokens": 32478440} {"current_steps": 56300, "total_steps": 67140, "loss": 0.2933, "lr": 3.866988829032603e-06, "epoch": 8.385463211200477, "percentage": 83.85, "elapsed_time": "3:53:50", "remaining_time": "0:45:01", "throughput": 2315.07, "total_tokens": 32481224} {"current_steps": 56305, "total_steps": 67140, "loss": 0.5047, "lr": 3.863517473765877e-06, "epoch": 8.386207923741436, "percentage": 83.86, "elapsed_time": "3:53:51", "remaining_time": "0:45:00", "throughput": 2315.09, "total_tokens": 32484232} {"current_steps": 56310, "total_steps": 67140, "loss": 0.566, "lr": 3.8600475468167056e-06, "epoch": 8.386952636282395, "percentage": 83.87, "elapsed_time": "3:53:52", "remaining_time": "0:44:58", "throughput": 2315.11, "total_tokens": 32487176} {"current_steps": 56315, "total_steps": 67140, "loss": 0.7423, "lr": 3.8565790484195785e-06, "epoch": 8.387697348823353, "percentage": 83.88, "elapsed_time": "3:53:53", "remaining_time": "0:44:57", "throughput": 2315.16, "total_tokens": 32490664} {"current_steps": 56320, "total_steps": 67140, "loss": 0.6553, "lr": 3.853111978808868e-06, "epoch": 8.388442061364314, "percentage": 83.88, "elapsed_time": "3:53:55", "remaining_time": "0:44:56", "throughput": 2315.18, "total_tokens": 32493640} {"current_steps": 56325, "total_steps": 67140, "loss": 0.4609, "lr": 3.849646338218874e-06, "epoch": 8.389186773905273, "percentage": 83.89, "elapsed_time": "3:53:56", "remaining_time": "0:44:55", "throughput": 2315.2, "total_tokens": 32496552} {"current_steps": 56330, "total_steps": 67140, "loss": 0.3959, "lr": 3.846182126883796e-06, "epoch": 8.389931486446232, "percentage": 83.9, "elapsed_time": "3:53:57", "remaining_time": "0:44:53", "throughput": 2315.21, "total_tokens": 32499400} {"current_steps": 56335, "total_steps": 67140, "loss": 0.704, "lr": 3.842719345037718e-06, "epoch": 8.39067619898719, "percentage": 83.91, "elapsed_time": "3:53:58", "remaining_time": "0:44:52", "throughput": 2315.23, "total_tokens": 32502184} {"current_steps": 56340, "total_steps": 67140, "loss": 0.6193, "lr": 3.83925799291465e-06, "epoch": 8.39142091152815, "percentage": 83.91, "elapsed_time": "3:53:59", "remaining_time": "0:44:51", "throughput": 2315.24, "total_tokens": 32504968} {"current_steps": 56345, "total_steps": 67140, "loss": 0.658, "lr": 3.835798070748489e-06, "epoch": 8.39216562406911, "percentage": 83.92, "elapsed_time": "3:54:00", "remaining_time": "0:44:50", "throughput": 2315.25, "total_tokens": 32507688} {"current_steps": 56350, "total_steps": 67140, "loss": 0.6461, "lr": 3.8323395787730505e-06, "epoch": 8.392910336610068, "percentage": 83.93, "elapsed_time": "3:54:01", "remaining_time": "0:44:48", "throughput": 2315.26, "total_tokens": 32510472} {"current_steps": 56355, "total_steps": 67140, "loss": 0.5122, "lr": 3.828882517222046e-06, "epoch": 8.393655049151027, "percentage": 83.94, "elapsed_time": "3:54:02", "remaining_time": "0:44:47", "throughput": 2315.27, "total_tokens": 32513192} {"current_steps": 56360, "total_steps": 67140, "loss": 0.508, "lr": 3.825426886329087e-06, "epoch": 8.394399761691988, "percentage": 83.94, "elapsed_time": "3:54:04", "remaining_time": "0:44:46", "throughput": 2315.27, "total_tokens": 32515720} {"current_steps": 56365, "total_steps": 67140, "loss": 0.4821, "lr": 3.8219726863276826e-06, "epoch": 8.395144474232946, "percentage": 83.95, "elapsed_time": "3:54:05", "remaining_time": "0:44:44", "throughput": 2315.29, "total_tokens": 32518664} {"current_steps": 56370, "total_steps": 67140, "loss": 0.5672, "lr": 3.81851991745126e-06, "epoch": 8.395889186773905, "percentage": 83.96, "elapsed_time": "3:54:06", "remaining_time": "0:44:43", "throughput": 2315.32, "total_tokens": 32521800} {"current_steps": 56375, "total_steps": 67140, "loss": 0.5852, "lr": 3.8150685799331454e-06, "epoch": 8.396633899314864, "percentage": 83.97, "elapsed_time": "3:54:07", "remaining_time": "0:44:42", "throughput": 2315.33, "total_tokens": 32524552} {"current_steps": 56380, "total_steps": 67140, "loss": 0.636, "lr": 3.811618674006562e-06, "epoch": 8.397378611855824, "percentage": 83.97, "elapsed_time": "3:54:08", "remaining_time": "0:44:41", "throughput": 2315.35, "total_tokens": 32527464} {"current_steps": 56385, "total_steps": 67140, "loss": 0.5354, "lr": 3.8081701999046454e-06, "epoch": 8.398123324396783, "percentage": 83.98, "elapsed_time": "3:54:09", "remaining_time": "0:44:39", "throughput": 2315.37, "total_tokens": 32530472} {"current_steps": 56390, "total_steps": 67140, "loss": 0.4653, "lr": 3.804723157860432e-06, "epoch": 8.398868036937742, "percentage": 83.99, "elapsed_time": "3:54:10", "remaining_time": "0:44:38", "throughput": 2315.38, "total_tokens": 32533160} {"current_steps": 56395, "total_steps": 67140, "loss": 0.7742, "lr": 3.8012775481068517e-06, "epoch": 8.3996127494787, "percentage": 84.0, "elapsed_time": "3:54:11", "remaining_time": "0:44:37", "throughput": 2315.4, "total_tokens": 32535976} {"current_steps": 56400, "total_steps": 67140, "loss": 0.4629, "lr": 3.797833370876744e-06, "epoch": 8.400357462019661, "percentage": 84.0, "elapsed_time": "3:54:13", "remaining_time": "0:44:36", "throughput": 2315.42, "total_tokens": 32538952} {"current_steps": 56405, "total_steps": 67140, "loss": 0.5259, "lr": 3.794390626402855e-06, "epoch": 8.40110217456062, "percentage": 84.01, "elapsed_time": "3:54:14", "remaining_time": "0:44:34", "throughput": 2315.45, "total_tokens": 32542056} {"current_steps": 56410, "total_steps": 67140, "loss": 0.5611, "lr": 3.79094931491783e-06, "epoch": 8.401846887101579, "percentage": 84.02, "elapsed_time": "3:54:15", "remaining_time": "0:44:33", "throughput": 2315.49, "total_tokens": 32545320} {"current_steps": 56415, "total_steps": 67140, "loss": 0.7106, "lr": 3.7875094366542212e-06, "epoch": 8.402591599642538, "percentage": 84.03, "elapsed_time": "3:54:16", "remaining_time": "0:44:32", "throughput": 2315.52, "total_tokens": 32548584} {"current_steps": 56420, "total_steps": 67140, "loss": 0.6683, "lr": 3.7840709918444823e-06, "epoch": 8.403336312183498, "percentage": 84.03, "elapsed_time": "3:54:17", "remaining_time": "0:44:31", "throughput": 2315.54, "total_tokens": 32551496} {"current_steps": 56425, "total_steps": 67140, "loss": 0.6201, "lr": 3.780633980720974e-06, "epoch": 8.404081024724457, "percentage": 84.04, "elapsed_time": "3:54:18", "remaining_time": "0:44:29", "throughput": 2315.55, "total_tokens": 32554056} {"current_steps": 56430, "total_steps": 67140, "loss": 0.67, "lr": 3.777198403515944e-06, "epoch": 8.404825737265416, "percentage": 84.05, "elapsed_time": "3:54:20", "remaining_time": "0:44:28", "throughput": 2315.58, "total_tokens": 32557160} {"current_steps": 56435, "total_steps": 67140, "loss": 0.417, "lr": 3.7737642604615624e-06, "epoch": 8.405570449806374, "percentage": 84.06, "elapsed_time": "3:54:21", "remaining_time": "0:44:27", "throughput": 2315.59, "total_tokens": 32560040} {"current_steps": 56440, "total_steps": 67140, "loss": 0.4024, "lr": 3.7703315517898908e-06, "epoch": 8.406315162347333, "percentage": 84.06, "elapsed_time": "3:54:22", "remaining_time": "0:44:25", "throughput": 2315.61, "total_tokens": 32562824} {"current_steps": 56445, "total_steps": 67140, "loss": 0.4731, "lr": 3.7669002777328986e-06, "epoch": 8.407059874888294, "percentage": 84.07, "elapsed_time": "3:54:23", "remaining_time": "0:44:24", "throughput": 2315.62, "total_tokens": 32565608} {"current_steps": 56450, "total_steps": 67140, "loss": 0.4649, "lr": 3.763470438522457e-06, "epoch": 8.407804587429252, "percentage": 84.08, "elapsed_time": "3:54:24", "remaining_time": "0:44:23", "throughput": 2315.65, "total_tokens": 32568680} {"current_steps": 56455, "total_steps": 67140, "loss": 0.5307, "lr": 3.760042034390343e-06, "epoch": 8.408549299970211, "percentage": 84.09, "elapsed_time": "3:54:25", "remaining_time": "0:44:22", "throughput": 2315.67, "total_tokens": 32571720} {"current_steps": 56460, "total_steps": 67140, "loss": 0.7839, "lr": 3.7566150655682364e-06, "epoch": 8.40929401251117, "percentage": 84.09, "elapsed_time": "3:54:26", "remaining_time": "0:44:20", "throughput": 2315.69, "total_tokens": 32574568} {"current_steps": 56465, "total_steps": 67140, "loss": 0.6708, "lr": 3.7531895322877096e-06, "epoch": 8.41003872505213, "percentage": 84.1, "elapsed_time": "3:54:28", "remaining_time": "0:44:19", "throughput": 2315.7, "total_tokens": 32577352} {"current_steps": 56470, "total_steps": 67140, "loss": 0.4798, "lr": 3.749765434780253e-06, "epoch": 8.41078343759309, "percentage": 84.11, "elapsed_time": "3:54:29", "remaining_time": "0:44:18", "throughput": 2315.73, "total_tokens": 32580488} {"current_steps": 56475, "total_steps": 67140, "loss": 0.7597, "lr": 3.746342773277256e-06, "epoch": 8.411528150134048, "percentage": 84.12, "elapsed_time": "3:54:30", "remaining_time": "0:44:17", "throughput": 2315.75, "total_tokens": 32583496} {"current_steps": 56480, "total_steps": 67140, "loss": 0.5557, "lr": 3.742921548009995e-06, "epoch": 8.412272862675007, "percentage": 84.12, "elapsed_time": "3:54:31", "remaining_time": "0:44:15", "throughput": 2315.76, "total_tokens": 32586184} {"current_steps": 56485, "total_steps": 67140, "loss": 0.538, "lr": 3.7395017592096738e-06, "epoch": 8.413017575215967, "percentage": 84.13, "elapsed_time": "3:54:32", "remaining_time": "0:44:14", "throughput": 2315.78, "total_tokens": 32589160} {"current_steps": 56490, "total_steps": 67140, "loss": 0.5343, "lr": 3.7360834071073823e-06, "epoch": 8.413762287756926, "percentage": 84.14, "elapsed_time": "3:54:33", "remaining_time": "0:44:13", "throughput": 2315.8, "total_tokens": 32592008} {"current_steps": 56495, "total_steps": 67140, "loss": 0.8012, "lr": 3.7326664919341308e-06, "epoch": 8.414507000297885, "percentage": 84.15, "elapsed_time": "3:54:34", "remaining_time": "0:44:12", "throughput": 2315.82, "total_tokens": 32594984} {"current_steps": 56500, "total_steps": 67140, "loss": 0.6138, "lr": 3.7292510139208007e-06, "epoch": 8.415251712838844, "percentage": 84.15, "elapsed_time": "3:54:36", "remaining_time": "0:44:10", "throughput": 2315.83, "total_tokens": 32597640} {"current_steps": 56505, "total_steps": 67140, "loss": 0.8348, "lr": 3.725836973298211e-06, "epoch": 8.415996425379804, "percentage": 84.16, "elapsed_time": "3:54:37", "remaining_time": "0:44:09", "throughput": 2315.85, "total_tokens": 32600552} {"current_steps": 56510, "total_steps": 67140, "loss": 0.7154, "lr": 3.722424370297062e-06, "epoch": 8.416741137920763, "percentage": 84.17, "elapsed_time": "3:54:38", "remaining_time": "0:44:08", "throughput": 2315.86, "total_tokens": 32603368} {"current_steps": 56515, "total_steps": 67140, "loss": 0.4089, "lr": 3.7190132051479697e-06, "epoch": 8.417485850461722, "percentage": 84.17, "elapsed_time": "3:54:39", "remaining_time": "0:44:06", "throughput": 2315.88, "total_tokens": 32606120} {"current_steps": 56520, "total_steps": 67140, "loss": 0.7287, "lr": 3.715603478081439e-06, "epoch": 8.41823056300268, "percentage": 84.18, "elapsed_time": "3:54:40", "remaining_time": "0:44:05", "throughput": 2315.9, "total_tokens": 32609192} {"current_steps": 56525, "total_steps": 67140, "loss": 0.6283, "lr": 3.7121951893278966e-06, "epoch": 8.418975275543641, "percentage": 84.19, "elapsed_time": "3:54:41", "remaining_time": "0:44:04", "throughput": 2315.93, "total_tokens": 32612168} {"current_steps": 56530, "total_steps": 67140, "loss": 0.5993, "lr": 3.708788339117644e-06, "epoch": 8.4197199880846, "percentage": 84.2, "elapsed_time": "3:54:42", "remaining_time": "0:44:03", "throughput": 2315.94, "total_tokens": 32615048} {"current_steps": 56535, "total_steps": 67140, "loss": 0.5858, "lr": 3.7053829276809143e-06, "epoch": 8.420464700625558, "percentage": 84.2, "elapsed_time": "3:54:43", "remaining_time": "0:44:01", "throughput": 2315.96, "total_tokens": 32617928} {"current_steps": 56540, "total_steps": 67140, "loss": 0.6129, "lr": 3.7019789552478286e-06, "epoch": 8.421209413166517, "percentage": 84.21, "elapsed_time": "3:54:45", "remaining_time": "0:44:00", "throughput": 2315.98, "total_tokens": 32620840} {"current_steps": 56545, "total_steps": 67140, "loss": 0.6686, "lr": 3.6985764220484137e-06, "epoch": 8.421954125707478, "percentage": 84.22, "elapsed_time": "3:54:46", "remaining_time": "0:43:59", "throughput": 2315.99, "total_tokens": 32623656} {"current_steps": 56550, "total_steps": 67140, "loss": 0.4607, "lr": 3.695175328312597e-06, "epoch": 8.422698838248436, "percentage": 84.23, "elapsed_time": "3:54:47", "remaining_time": "0:43:58", "throughput": 2316.01, "total_tokens": 32626472} {"current_steps": 56555, "total_steps": 67140, "loss": 0.5481, "lr": 3.6917756742702205e-06, "epoch": 8.423443550789395, "percentage": 84.23, "elapsed_time": "3:54:48", "remaining_time": "0:43:56", "throughput": 2316.05, "total_tokens": 32629736} {"current_steps": 56560, "total_steps": 67140, "loss": 0.4564, "lr": 3.68837746015101e-06, "epoch": 8.424188263330354, "percentage": 84.24, "elapsed_time": "3:54:49", "remaining_time": "0:43:55", "throughput": 2316.07, "total_tokens": 32632680} {"current_steps": 56565, "total_steps": 67140, "loss": 0.9333, "lr": 3.6849806861845997e-06, "epoch": 8.424932975871315, "percentage": 84.25, "elapsed_time": "3:54:50", "remaining_time": "0:43:54", "throughput": 2316.08, "total_tokens": 32635464} {"current_steps": 56570, "total_steps": 67140, "loss": 0.4389, "lr": 3.6815853526005305e-06, "epoch": 8.425677688412273, "percentage": 84.26, "elapsed_time": "3:54:51", "remaining_time": "0:43:53", "throughput": 2316.1, "total_tokens": 32638376} {"current_steps": 56575, "total_steps": 67140, "loss": 0.5356, "lr": 3.678191459628252e-06, "epoch": 8.426422400953232, "percentage": 84.26, "elapsed_time": "3:54:53", "remaining_time": "0:43:51", "throughput": 2316.11, "total_tokens": 32641000} {"current_steps": 56580, "total_steps": 67140, "loss": 0.627, "lr": 3.6747990074971065e-06, "epoch": 8.42716711349419, "percentage": 84.27, "elapsed_time": "3:54:54", "remaining_time": "0:43:50", "throughput": 2316.13, "total_tokens": 32643848} {"current_steps": 56585, "total_steps": 67140, "loss": 0.6438, "lr": 3.671407996436341e-06, "epoch": 8.42791182603515, "percentage": 84.28, "elapsed_time": "3:54:55", "remaining_time": "0:43:49", "throughput": 2316.15, "total_tokens": 32646952} {"current_steps": 56590, "total_steps": 67140, "loss": 0.4918, "lr": 3.6680184266751128e-06, "epoch": 8.42865653857611, "percentage": 84.29, "elapsed_time": "3:54:56", "remaining_time": "0:43:48", "throughput": 2316.19, "total_tokens": 32650344} {"current_steps": 56595, "total_steps": 67140, "loss": 0.5124, "lr": 3.66463029844247e-06, "epoch": 8.429401251117069, "percentage": 84.29, "elapsed_time": "3:54:57", "remaining_time": "0:43:46", "throughput": 2316.21, "total_tokens": 32653128} {"current_steps": 56600, "total_steps": 67140, "loss": 0.7755, "lr": 3.6612436119673634e-06, "epoch": 8.430145963658028, "percentage": 84.3, "elapsed_time": "3:54:58", "remaining_time": "0:43:45", "throughput": 2316.21, "total_tokens": 32655720} {"current_steps": 56605, "total_steps": 67140, "loss": 0.564, "lr": 3.657858367478656e-06, "epoch": 8.430890676198986, "percentage": 84.31, "elapsed_time": "3:54:59", "remaining_time": "0:43:44", "throughput": 2316.23, "total_tokens": 32658696} {"current_steps": 56610, "total_steps": 67140, "loss": 0.461, "lr": 3.6544745652051097e-06, "epoch": 8.431635388739947, "percentage": 84.32, "elapsed_time": "3:55:01", "remaining_time": "0:43:42", "throughput": 2316.25, "total_tokens": 32661512} {"current_steps": 56615, "total_steps": 67140, "loss": 0.4567, "lr": 3.6510922053753864e-06, "epoch": 8.432380101280906, "percentage": 84.32, "elapsed_time": "3:55:02", "remaining_time": "0:43:41", "throughput": 2316.27, "total_tokens": 32664456} {"current_steps": 56620, "total_steps": 67140, "loss": 0.5369, "lr": 3.647711288218053e-06, "epoch": 8.433124813821864, "percentage": 84.33, "elapsed_time": "3:55:03", "remaining_time": "0:43:40", "throughput": 2316.29, "total_tokens": 32667368} {"current_steps": 56625, "total_steps": 67140, "loss": 0.6417, "lr": 3.644331813961588e-06, "epoch": 8.433869526362823, "percentage": 84.34, "elapsed_time": "3:55:04", "remaining_time": "0:43:39", "throughput": 2316.29, "total_tokens": 32669992} {"current_steps": 56630, "total_steps": 67140, "loss": 0.569, "lr": 3.640953782834344e-06, "epoch": 8.434614238903784, "percentage": 84.35, "elapsed_time": "3:55:05", "remaining_time": "0:43:37", "throughput": 2316.31, "total_tokens": 32672840} {"current_steps": 56635, "total_steps": 67140, "loss": 0.6754, "lr": 3.637577195064612e-06, "epoch": 8.435358951444742, "percentage": 84.35, "elapsed_time": "3:55:06", "remaining_time": "0:43:36", "throughput": 2316.32, "total_tokens": 32675624} {"current_steps": 56640, "total_steps": 67140, "loss": 0.6989, "lr": 3.634202050880553e-06, "epoch": 8.436103663985701, "percentage": 84.36, "elapsed_time": "3:55:07", "remaining_time": "0:43:35", "throughput": 2316.34, "total_tokens": 32678440} {"current_steps": 56645, "total_steps": 67140, "loss": 0.5054, "lr": 3.6308283505102515e-06, "epoch": 8.43684837652666, "percentage": 84.37, "elapsed_time": "3:55:08", "remaining_time": "0:43:34", "throughput": 2316.36, "total_tokens": 32681320} {"current_steps": 56650, "total_steps": 67140, "loss": 0.4865, "lr": 3.6274560941816887e-06, "epoch": 8.43759308906762, "percentage": 84.38, "elapsed_time": "3:55:10", "remaining_time": "0:43:32", "throughput": 2316.37, "total_tokens": 32684072} {"current_steps": 56655, "total_steps": 67140, "loss": 0.5722, "lr": 3.6240852821227524e-06, "epoch": 8.43833780160858, "percentage": 84.38, "elapsed_time": "3:55:11", "remaining_time": "0:43:31", "throughput": 2316.39, "total_tokens": 32687016} {"current_steps": 56660, "total_steps": 67140, "loss": 0.4862, "lr": 3.620715914561226e-06, "epoch": 8.439082514149538, "percentage": 84.39, "elapsed_time": "3:55:12", "remaining_time": "0:43:30", "throughput": 2316.41, "total_tokens": 32689992} {"current_steps": 56665, "total_steps": 67140, "loss": 0.4003, "lr": 3.6173479917247927e-06, "epoch": 8.439827226690497, "percentage": 84.4, "elapsed_time": "3:55:13", "remaining_time": "0:43:28", "throughput": 2316.42, "total_tokens": 32692712} {"current_steps": 56670, "total_steps": 67140, "loss": 0.4273, "lr": 3.613981513841047e-06, "epoch": 8.440571939231457, "percentage": 84.41, "elapsed_time": "3:55:14", "remaining_time": "0:43:27", "throughput": 2316.43, "total_tokens": 32695528} {"current_steps": 56675, "total_steps": 67140, "loss": 0.7789, "lr": 3.6106164811374855e-06, "epoch": 8.441316651772416, "percentage": 84.41, "elapsed_time": "3:55:15", "remaining_time": "0:43:26", "throughput": 2316.46, "total_tokens": 32698536} {"current_steps": 56680, "total_steps": 67140, "loss": 0.5147, "lr": 3.607252893841495e-06, "epoch": 8.442061364313375, "percentage": 84.42, "elapsed_time": "3:55:16", "remaining_time": "0:43:25", "throughput": 2316.48, "total_tokens": 32701480} {"current_steps": 56685, "total_steps": 67140, "loss": 0.4904, "lr": 3.6038907521803776e-06, "epoch": 8.442806076854334, "percentage": 84.43, "elapsed_time": "3:55:18", "remaining_time": "0:43:23", "throughput": 2316.5, "total_tokens": 32704488} {"current_steps": 56690, "total_steps": 67140, "loss": 0.6552, "lr": 3.6005300563813375e-06, "epoch": 8.443550789395294, "percentage": 84.44, "elapsed_time": "3:55:19", "remaining_time": "0:43:22", "throughput": 2316.53, "total_tokens": 32707464} {"current_steps": 56695, "total_steps": 67140, "loss": 0.5267, "lr": 3.5971708066714682e-06, "epoch": 8.444295501936253, "percentage": 84.44, "elapsed_time": "3:55:20", "remaining_time": "0:43:21", "throughput": 2316.54, "total_tokens": 32710216} {"current_steps": 56700, "total_steps": 67140, "loss": 0.5842, "lr": 3.593813003277777e-06, "epoch": 8.445040214477212, "percentage": 84.45, "elapsed_time": "3:55:21", "remaining_time": "0:43:20", "throughput": 2316.56, "total_tokens": 32713288} {"current_steps": 56705, "total_steps": 67140, "loss": 0.6513, "lr": 3.5904566464271704e-06, "epoch": 8.44578492701817, "percentage": 84.46, "elapsed_time": "3:55:22", "remaining_time": "0:43:18", "throughput": 2316.56, "total_tokens": 32715816} {"current_steps": 56710, "total_steps": 67140, "loss": 0.6325, "lr": 3.5871017363464596e-06, "epoch": 8.446529639559131, "percentage": 84.47, "elapsed_time": "3:55:23", "remaining_time": "0:43:17", "throughput": 2316.58, "total_tokens": 32718664} {"current_steps": 56715, "total_steps": 67140, "loss": 0.571, "lr": 3.5837482732623636e-06, "epoch": 8.44727435210009, "percentage": 84.47, "elapsed_time": "3:55:24", "remaining_time": "0:43:16", "throughput": 2316.61, "total_tokens": 32721704} {"current_steps": 56720, "total_steps": 67140, "loss": 0.6116, "lr": 3.5803962574014775e-06, "epoch": 8.448019064641048, "percentage": 84.48, "elapsed_time": "3:55:25", "remaining_time": "0:43:15", "throughput": 2316.62, "total_tokens": 32724584} {"current_steps": 56725, "total_steps": 67140, "loss": 0.5891, "lr": 3.577045688990335e-06, "epoch": 8.448763777182007, "percentage": 84.49, "elapsed_time": "3:55:27", "remaining_time": "0:43:13", "throughput": 2316.66, "total_tokens": 32727912} {"current_steps": 56730, "total_steps": 67140, "loss": 0.7926, "lr": 3.5736965682553385e-06, "epoch": 8.449508489722968, "percentage": 84.5, "elapsed_time": "3:55:28", "remaining_time": "0:43:12", "throughput": 2316.67, "total_tokens": 32730472} {"current_steps": 56735, "total_steps": 67140, "loss": 0.7092, "lr": 3.5703488954228147e-06, "epoch": 8.450253202263927, "percentage": 84.5, "elapsed_time": "3:55:29", "remaining_time": "0:43:11", "throughput": 2316.68, "total_tokens": 32733256} {"current_steps": 56740, "total_steps": 67140, "loss": 0.5677, "lr": 3.5670026707189858e-06, "epoch": 8.450997914804885, "percentage": 84.51, "elapsed_time": "3:55:30", "remaining_time": "0:43:10", "throughput": 2316.71, "total_tokens": 32736296} {"current_steps": 56745, "total_steps": 67140, "loss": 0.5529, "lr": 3.5636578943699787e-06, "epoch": 8.451742627345844, "percentage": 84.52, "elapsed_time": "3:55:31", "remaining_time": "0:43:08", "throughput": 2316.72, "total_tokens": 32739144} {"current_steps": 56750, "total_steps": 67140, "loss": 0.7076, "lr": 3.5603145666018132e-06, "epoch": 8.452487339886805, "percentage": 84.52, "elapsed_time": "3:55:32", "remaining_time": "0:43:07", "throughput": 2316.75, "total_tokens": 32742248} {"current_steps": 56755, "total_steps": 67140, "loss": 0.5922, "lr": 3.5569726876404307e-06, "epoch": 8.453232052427763, "percentage": 84.53, "elapsed_time": "3:55:33", "remaining_time": "0:43:06", "throughput": 2316.77, "total_tokens": 32745192} {"current_steps": 56760, "total_steps": 67140, "loss": 0.4787, "lr": 3.553632257711653e-06, "epoch": 8.453976764968722, "percentage": 84.54, "elapsed_time": "3:55:35", "remaining_time": "0:43:04", "throughput": 2316.8, "total_tokens": 32748136} {"current_steps": 56765, "total_steps": 67140, "loss": 0.5695, "lr": 3.550293277041206e-06, "epoch": 8.45472147750968, "percentage": 84.55, "elapsed_time": "3:55:36", "remaining_time": "0:43:03", "throughput": 2316.81, "total_tokens": 32751016} {"current_steps": 56770, "total_steps": 67140, "loss": 0.6349, "lr": 3.54695574585473e-06, "epoch": 8.45546619005064, "percentage": 84.55, "elapsed_time": "3:55:37", "remaining_time": "0:43:02", "throughput": 2316.84, "total_tokens": 32754120} {"current_steps": 56775, "total_steps": 67140, "loss": 0.5379, "lr": 3.543619664377765e-06, "epoch": 8.4562109025916, "percentage": 84.56, "elapsed_time": "3:55:38", "remaining_time": "0:43:01", "throughput": 2316.86, "total_tokens": 32756968} {"current_steps": 56780, "total_steps": 67140, "loss": 0.3632, "lr": 3.540285032835747e-06, "epoch": 8.456955615132559, "percentage": 84.57, "elapsed_time": "3:55:39", "remaining_time": "0:42:59", "throughput": 2316.87, "total_tokens": 32759752} {"current_steps": 56785, "total_steps": 67140, "loss": 0.5401, "lr": 3.536951851454018e-06, "epoch": 8.457700327673518, "percentage": 84.58, "elapsed_time": "3:55:40", "remaining_time": "0:42:58", "throughput": 2316.9, "total_tokens": 32762888} {"current_steps": 56790, "total_steps": 67140, "loss": 0.5614, "lr": 3.5336201204578256e-06, "epoch": 8.458445040214476, "percentage": 84.58, "elapsed_time": "3:55:41", "remaining_time": "0:42:57", "throughput": 2316.91, "total_tokens": 32765544} {"current_steps": 56795, "total_steps": 67140, "loss": 0.814, "lr": 3.5302898400723094e-06, "epoch": 8.459189752755437, "percentage": 84.59, "elapsed_time": "3:55:43", "remaining_time": "0:42:56", "throughput": 2316.92, "total_tokens": 32768360} {"current_steps": 56800, "total_steps": 67140, "loss": 0.754, "lr": 3.5269610105225114e-06, "epoch": 8.459934465296396, "percentage": 84.6, "elapsed_time": "3:55:44", "remaining_time": "0:42:54", "throughput": 2316.94, "total_tokens": 32771144} {"current_steps": 56805, "total_steps": 67140, "loss": 0.5466, "lr": 3.523633632033385e-06, "epoch": 8.460679177837354, "percentage": 84.61, "elapsed_time": "3:55:45", "remaining_time": "0:42:53", "throughput": 2316.96, "total_tokens": 32773992} {"current_steps": 56810, "total_steps": 67140, "loss": 0.5344, "lr": 3.520307704829781e-06, "epoch": 8.461423890378313, "percentage": 84.61, "elapsed_time": "3:55:46", "remaining_time": "0:42:52", "throughput": 2316.96, "total_tokens": 32776680} {"current_steps": 56815, "total_steps": 67140, "loss": 0.6076, "lr": 3.5169832291364502e-06, "epoch": 8.462168602919274, "percentage": 84.62, "elapsed_time": "3:55:47", "remaining_time": "0:42:51", "throughput": 2316.98, "total_tokens": 32779656} {"current_steps": 56820, "total_steps": 67140, "loss": 0.5926, "lr": 3.5136602051780517e-06, "epoch": 8.462913315460233, "percentage": 84.63, "elapsed_time": "3:55:48", "remaining_time": "0:42:49", "throughput": 2316.99, "total_tokens": 32782248} {"current_steps": 56825, "total_steps": 67140, "loss": 0.6431, "lr": 3.5103386331791444e-06, "epoch": 8.463658028001191, "percentage": 84.64, "elapsed_time": "3:55:49", "remaining_time": "0:42:48", "throughput": 2317.01, "total_tokens": 32785288} {"current_steps": 56830, "total_steps": 67140, "loss": 0.4644, "lr": 3.507018513364177e-06, "epoch": 8.46440274054215, "percentage": 84.64, "elapsed_time": "3:55:50", "remaining_time": "0:42:47", "throughput": 2317.02, "total_tokens": 32787976} {"current_steps": 56835, "total_steps": 67140, "loss": 0.4777, "lr": 3.5036998459575197e-06, "epoch": 8.46514745308311, "percentage": 84.65, "elapsed_time": "3:55:52", "remaining_time": "0:42:45", "throughput": 2317.05, "total_tokens": 32791080} {"current_steps": 56840, "total_steps": 67140, "loss": 0.6507, "lr": 3.5003826311834214e-06, "epoch": 8.46589216562407, "percentage": 84.66, "elapsed_time": "3:55:53", "remaining_time": "0:42:44", "throughput": 2317.05, "total_tokens": 32793608} {"current_steps": 56845, "total_steps": 67140, "loss": 0.5891, "lr": 3.497066869266058e-06, "epoch": 8.466636878165028, "percentage": 84.67, "elapsed_time": "3:55:54", "remaining_time": "0:42:43", "throughput": 2317.06, "total_tokens": 32796328} {"current_steps": 56850, "total_steps": 67140, "loss": 0.5732, "lr": 3.493752560429486e-06, "epoch": 8.467381590705987, "percentage": 84.67, "elapsed_time": "3:55:55", "remaining_time": "0:42:42", "throughput": 2317.09, "total_tokens": 32799464} {"current_steps": 56855, "total_steps": 67140, "loss": 0.4728, "lr": 3.490439704897688e-06, "epoch": 8.468126303246947, "percentage": 84.68, "elapsed_time": "3:55:56", "remaining_time": "0:42:40", "throughput": 2317.09, "total_tokens": 32802088} {"current_steps": 56860, "total_steps": 67140, "loss": 0.6271, "lr": 3.4871283028945155e-06, "epoch": 8.468871015787906, "percentage": 84.69, "elapsed_time": "3:55:57", "remaining_time": "0:42:39", "throughput": 2317.1, "total_tokens": 32804776} {"current_steps": 56865, "total_steps": 67140, "loss": 0.7783, "lr": 3.4838183546437475e-06, "epoch": 8.469615728328865, "percentage": 84.7, "elapsed_time": "3:55:58", "remaining_time": "0:42:38", "throughput": 2317.11, "total_tokens": 32807464} {"current_steps": 56870, "total_steps": 67140, "loss": 0.6861, "lr": 3.480509860369058e-06, "epoch": 8.470360440869824, "percentage": 84.7, "elapsed_time": "3:55:59", "remaining_time": "0:42:37", "throughput": 2317.14, "total_tokens": 32810600} {"current_steps": 56875, "total_steps": 67140, "loss": 0.4719, "lr": 3.477202820294018e-06, "epoch": 8.471105153410784, "percentage": 84.71, "elapsed_time": "3:56:01", "remaining_time": "0:42:35", "throughput": 2317.15, "total_tokens": 32813160} {"current_steps": 56880, "total_steps": 67140, "loss": 0.5655, "lr": 3.473897234642112e-06, "epoch": 8.471849865951743, "percentage": 84.72, "elapsed_time": "3:56:02", "remaining_time": "0:42:34", "throughput": 2317.15, "total_tokens": 32815816} {"current_steps": 56885, "total_steps": 67140, "loss": 0.6156, "lr": 3.4705931036367074e-06, "epoch": 8.472594578492702, "percentage": 84.73, "elapsed_time": "3:56:03", "remaining_time": "0:42:33", "throughput": 2317.17, "total_tokens": 32818696} {"current_steps": 56890, "total_steps": 67140, "loss": 0.6625, "lr": 3.4672904275010936e-06, "epoch": 8.47333929103366, "percentage": 84.73, "elapsed_time": "3:56:04", "remaining_time": "0:42:32", "throughput": 2317.19, "total_tokens": 32821608} {"current_steps": 56895, "total_steps": 67140, "loss": 0.6745, "lr": 3.463989206458443e-06, "epoch": 8.474084003574621, "percentage": 84.74, "elapsed_time": "3:56:05", "remaining_time": "0:42:30", "throughput": 2317.22, "total_tokens": 32824776} {"current_steps": 56900, "total_steps": 67140, "loss": 0.6044, "lr": 3.460689440731843e-06, "epoch": 8.47482871611558, "percentage": 84.75, "elapsed_time": "3:56:06", "remaining_time": "0:42:29", "throughput": 2317.24, "total_tokens": 32827656} {"current_steps": 56905, "total_steps": 67140, "loss": 0.5306, "lr": 3.457391130544277e-06, "epoch": 8.475573428656539, "percentage": 84.76, "elapsed_time": "3:56:07", "remaining_time": "0:42:28", "throughput": 2317.25, "total_tokens": 32830440} {"current_steps": 56910, "total_steps": 67140, "loss": 0.7653, "lr": 3.45409427611863e-06, "epoch": 8.476318141197497, "percentage": 84.76, "elapsed_time": "3:56:08", "remaining_time": "0:42:26", "throughput": 2317.27, "total_tokens": 32833384} {"current_steps": 56915, "total_steps": 67140, "loss": 0.4014, "lr": 3.4507988776776968e-06, "epoch": 8.477062853738458, "percentage": 84.77, "elapsed_time": "3:56:10", "remaining_time": "0:42:25", "throughput": 2317.29, "total_tokens": 32836328} {"current_steps": 56920, "total_steps": 67140, "loss": 0.5562, "lr": 3.4475049354441653e-06, "epoch": 8.477807566279417, "percentage": 84.78, "elapsed_time": "3:56:11", "remaining_time": "0:42:24", "throughput": 2317.31, "total_tokens": 32839176} {"current_steps": 56925, "total_steps": 67140, "loss": 0.5788, "lr": 3.444212449640627e-06, "epoch": 8.478552278820375, "percentage": 84.79, "elapsed_time": "3:56:12", "remaining_time": "0:42:23", "throughput": 2317.33, "total_tokens": 32842024} {"current_steps": 56930, "total_steps": 67140, "loss": 0.5023, "lr": 3.4409214204895653e-06, "epoch": 8.479296991361334, "percentage": 84.79, "elapsed_time": "3:56:13", "remaining_time": "0:42:21", "throughput": 2317.35, "total_tokens": 32844904} {"current_steps": 56935, "total_steps": 67140, "loss": 0.5519, "lr": 3.4376318482133797e-06, "epoch": 8.480041703902295, "percentage": 84.8, "elapsed_time": "3:56:14", "remaining_time": "0:42:20", "throughput": 2317.35, "total_tokens": 32847560} {"current_steps": 56940, "total_steps": 67140, "loss": 0.5955, "lr": 3.4343437330343675e-06, "epoch": 8.480786416443253, "percentage": 84.81, "elapsed_time": "3:56:15", "remaining_time": "0:42:19", "throughput": 2317.37, "total_tokens": 32850408} {"current_steps": 56945, "total_steps": 67140, "loss": 0.7913, "lr": 3.431057075174729e-06, "epoch": 8.481531128984212, "percentage": 84.82, "elapsed_time": "3:56:16", "remaining_time": "0:42:18", "throughput": 2317.39, "total_tokens": 32853352} {"current_steps": 56950, "total_steps": 67140, "loss": 0.8076, "lr": 3.4277718748565585e-06, "epoch": 8.482275841525171, "percentage": 84.82, "elapsed_time": "3:56:18", "remaining_time": "0:42:16", "throughput": 2317.41, "total_tokens": 32856264} {"current_steps": 56955, "total_steps": 67140, "loss": 0.744, "lr": 3.4244881323018645e-06, "epoch": 8.48302055406613, "percentage": 84.83, "elapsed_time": "3:56:19", "remaining_time": "0:42:15", "throughput": 2317.43, "total_tokens": 32859112} {"current_steps": 56960, "total_steps": 67140, "loss": 0.5996, "lr": 3.421205847732542e-06, "epoch": 8.48376526660709, "percentage": 84.84, "elapsed_time": "3:56:20", "remaining_time": "0:42:14", "throughput": 2317.44, "total_tokens": 32861992} {"current_steps": 56965, "total_steps": 67140, "loss": 0.5255, "lr": 3.4179250213703914e-06, "epoch": 8.484509979148049, "percentage": 84.85, "elapsed_time": "3:56:21", "remaining_time": "0:42:13", "throughput": 2317.46, "total_tokens": 32864840} {"current_steps": 56970, "total_steps": 67140, "loss": 0.637, "lr": 3.414645653437118e-06, "epoch": 8.485254691689008, "percentage": 84.85, "elapsed_time": "3:56:22", "remaining_time": "0:42:11", "throughput": 2317.49, "total_tokens": 32867944} {"current_steps": 56975, "total_steps": 67140, "loss": 0.5826, "lr": 3.411367744154334e-06, "epoch": 8.485999404229966, "percentage": 84.86, "elapsed_time": "3:56:23", "remaining_time": "0:42:10", "throughput": 2317.52, "total_tokens": 32871112} {"current_steps": 56980, "total_steps": 67140, "loss": 0.4549, "lr": 3.4080912937435455e-06, "epoch": 8.486744116770927, "percentage": 84.87, "elapsed_time": "3:56:24", "remaining_time": "0:42:09", "throughput": 2317.54, "total_tokens": 32874088} {"current_steps": 56985, "total_steps": 67140, "loss": 0.5588, "lr": 3.4048163024261614e-06, "epoch": 8.487488829311886, "percentage": 84.87, "elapsed_time": "3:56:26", "remaining_time": "0:42:08", "throughput": 2317.55, "total_tokens": 32876808} {"current_steps": 56990, "total_steps": 67140, "loss": 0.4273, "lr": 3.4015427704234965e-06, "epoch": 8.488233541852845, "percentage": 84.88, "elapsed_time": "3:56:27", "remaining_time": "0:42:06", "throughput": 2317.57, "total_tokens": 32879752} {"current_steps": 56995, "total_steps": 67140, "loss": 0.602, "lr": 3.3982706979567542e-06, "epoch": 8.488978254393803, "percentage": 84.89, "elapsed_time": "3:56:28", "remaining_time": "0:42:05", "throughput": 2317.59, "total_tokens": 32882600} {"current_steps": 57000, "total_steps": 67140, "loss": 0.5025, "lr": 3.395000085247055e-06, "epoch": 8.489722966934764, "percentage": 84.9, "elapsed_time": "3:56:29", "remaining_time": "0:42:04", "throughput": 2317.61, "total_tokens": 32885640} {"current_steps": 57005, "total_steps": 67140, "loss": 0.5222, "lr": 3.391730932515405e-06, "epoch": 8.490467679475723, "percentage": 84.9, "elapsed_time": "3:56:30", "remaining_time": "0:42:02", "throughput": 2317.62, "total_tokens": 32888328} {"current_steps": 57010, "total_steps": 67140, "loss": 0.6372, "lr": 3.388463239982728e-06, "epoch": 8.491212392016681, "percentage": 84.91, "elapsed_time": "3:56:31", "remaining_time": "0:42:01", "throughput": 2317.63, "total_tokens": 32891016} {"current_steps": 57015, "total_steps": 67140, "loss": 0.6868, "lr": 3.3851970078698394e-06, "epoch": 8.49195710455764, "percentage": 84.92, "elapsed_time": "3:56:32", "remaining_time": "0:42:00", "throughput": 2317.64, "total_tokens": 32893640} {"current_steps": 57020, "total_steps": 67140, "loss": 0.6761, "lr": 3.3819322363974615e-06, "epoch": 8.4927018170986, "percentage": 84.93, "elapsed_time": "3:56:33", "remaining_time": "0:41:59", "throughput": 2317.66, "total_tokens": 32896584} {"current_steps": 57025, "total_steps": 67140, "loss": 0.5947, "lr": 3.3786689257862047e-06, "epoch": 8.49344652963956, "percentage": 84.93, "elapsed_time": "3:56:35", "remaining_time": "0:41:57", "throughput": 2317.68, "total_tokens": 32899432} {"current_steps": 57030, "total_steps": 67140, "loss": 0.6214, "lr": 3.3754070762565952e-06, "epoch": 8.494191242180518, "percentage": 84.94, "elapsed_time": "3:56:36", "remaining_time": "0:41:56", "throughput": 2317.7, "total_tokens": 32902440} {"current_steps": 57035, "total_steps": 67140, "loss": 0.5594, "lr": 3.372146688029057e-06, "epoch": 8.494935954721477, "percentage": 84.95, "elapsed_time": "3:56:37", "remaining_time": "0:41:55", "throughput": 2317.77, "total_tokens": 32906664} {"current_steps": 57040, "total_steps": 67140, "loss": 0.4308, "lr": 3.368887761323919e-06, "epoch": 8.495680667262437, "percentage": 84.96, "elapsed_time": "3:56:38", "remaining_time": "0:41:54", "throughput": 2317.79, "total_tokens": 32909576} {"current_steps": 57045, "total_steps": 67140, "loss": 0.5351, "lr": 3.3656302963613966e-06, "epoch": 8.496425379803396, "percentage": 84.96, "elapsed_time": "3:56:39", "remaining_time": "0:41:52", "throughput": 2317.79, "total_tokens": 32912072} {"current_steps": 57050, "total_steps": 67140, "loss": 0.6998, "lr": 3.362374293361617e-06, "epoch": 8.497170092344355, "percentage": 84.97, "elapsed_time": "3:56:40", "remaining_time": "0:41:51", "throughput": 2317.8, "total_tokens": 32914792} {"current_steps": 57055, "total_steps": 67140, "loss": 0.6417, "lr": 3.359119752544618e-06, "epoch": 8.497914804885314, "percentage": 84.98, "elapsed_time": "3:56:41", "remaining_time": "0:41:50", "throughput": 2317.8, "total_tokens": 32917416} {"current_steps": 57060, "total_steps": 67140, "loss": 0.6536, "lr": 3.3558666741303147e-06, "epoch": 8.498659517426274, "percentage": 84.99, "elapsed_time": "3:56:43", "remaining_time": "0:41:49", "throughput": 2317.82, "total_tokens": 32920200} {"current_steps": 57065, "total_steps": 67140, "loss": 0.5285, "lr": 3.352615058338543e-06, "epoch": 8.499404229967233, "percentage": 84.99, "elapsed_time": "3:56:44", "remaining_time": "0:41:47", "throughput": 2317.84, "total_tokens": 32923240} {"current_steps": 57069, "total_steps": 67140, "eval_loss": 0.6745066046714783, "epoch": 8.5, "percentage": 85.0, "elapsed_time": "3:57:59", "remaining_time": "0:41:59", "throughput": 2305.81, "total_tokens": 32925544} {"current_steps": 57070, "total_steps": 67140, "loss": 0.7458, "lr": 3.3493649053890326e-06, "epoch": 8.500148942508192, "percentage": 85.0, "elapsed_time": "3:58:01", "remaining_time": "0:41:59", "throughput": 2305.52, "total_tokens": 32926120} {"current_steps": 57075, "total_steps": 67140, "loss": 0.5025, "lr": 3.3461162155014186e-06, "epoch": 8.50089365504915, "percentage": 85.01, "elapsed_time": "3:58:02", "remaining_time": "0:41:58", "throughput": 2305.54, "total_tokens": 32929192} {"current_steps": 57080, "total_steps": 67140, "loss": 0.7147, "lr": 3.342868988895237e-06, "epoch": 8.501638367590111, "percentage": 85.02, "elapsed_time": "3:58:03", "remaining_time": "0:41:57", "throughput": 2305.56, "total_tokens": 32932168} {"current_steps": 57085, "total_steps": 67140, "loss": 0.559, "lr": 3.3396232257899116e-06, "epoch": 8.50238308013107, "percentage": 85.02, "elapsed_time": "3:58:04", "remaining_time": "0:41:56", "throughput": 2305.58, "total_tokens": 32935048} {"current_steps": 57090, "total_steps": 67140, "loss": 0.4758, "lr": 3.33637892640479e-06, "epoch": 8.503127792672029, "percentage": 85.03, "elapsed_time": "3:58:06", "remaining_time": "0:41:54", "throughput": 2305.6, "total_tokens": 32937864} {"current_steps": 57095, "total_steps": 67140, "loss": 0.529, "lr": 3.3331360909590994e-06, "epoch": 8.503872505212987, "percentage": 85.04, "elapsed_time": "3:58:07", "remaining_time": "0:41:53", "throughput": 2305.62, "total_tokens": 32940680} {"current_steps": 57100, "total_steps": 67140, "loss": 0.3876, "lr": 3.3298947196719776e-06, "epoch": 8.504617217753946, "percentage": 85.05, "elapsed_time": "3:58:08", "remaining_time": "0:41:52", "throughput": 2305.62, "total_tokens": 32943208} {"current_steps": 57105, "total_steps": 67140, "loss": 0.4671, "lr": 3.326654812762467e-06, "epoch": 8.505361930294907, "percentage": 85.05, "elapsed_time": "3:58:09", "remaining_time": "0:41:51", "throughput": 2305.63, "total_tokens": 32945896} {"current_steps": 57110, "total_steps": 67140, "loss": 0.4963, "lr": 3.3234163704495086e-06, "epoch": 8.506106642835865, "percentage": 85.06, "elapsed_time": "3:58:10", "remaining_time": "0:41:49", "throughput": 2305.65, "total_tokens": 32948776} {"current_steps": 57115, "total_steps": 67140, "loss": 0.5517, "lr": 3.3201793929519386e-06, "epoch": 8.506851355376824, "percentage": 85.07, "elapsed_time": "3:58:11", "remaining_time": "0:41:48", "throughput": 2305.66, "total_tokens": 32951496} {"current_steps": 57120, "total_steps": 67140, "loss": 0.5031, "lr": 3.316943880488507e-06, "epoch": 8.507596067917785, "percentage": 85.08, "elapsed_time": "3:58:12", "remaining_time": "0:41:47", "throughput": 2305.67, "total_tokens": 32954312} {"current_steps": 57125, "total_steps": 67140, "loss": 0.6929, "lr": 3.313709833277853e-06, "epoch": 8.508340780458743, "percentage": 85.08, "elapsed_time": "3:58:13", "remaining_time": "0:41:45", "throughput": 2305.7, "total_tokens": 32957224} {"current_steps": 57130, "total_steps": 67140, "loss": 0.5847, "lr": 3.310477251538513e-06, "epoch": 8.509085492999702, "percentage": 85.09, "elapsed_time": "3:58:15", "remaining_time": "0:41:44", "throughput": 2305.72, "total_tokens": 32960360} {"current_steps": 57135, "total_steps": 67140, "loss": 0.6642, "lr": 3.3072461354889367e-06, "epoch": 8.509830205540661, "percentage": 85.1, "elapsed_time": "3:58:16", "remaining_time": "0:41:43", "throughput": 2305.74, "total_tokens": 32963208} {"current_steps": 57140, "total_steps": 67140, "loss": 0.4668, "lr": 3.304016485347469e-06, "epoch": 8.51057491808162, "percentage": 85.11, "elapsed_time": "3:58:17", "remaining_time": "0:41:42", "throughput": 2305.76, "total_tokens": 32966088} {"current_steps": 57145, "total_steps": 67140, "loss": 0.864, "lr": 3.300788301332361e-06, "epoch": 8.51131963062258, "percentage": 85.11, "elapsed_time": "3:58:18", "remaining_time": "0:41:40", "throughput": 2305.78, "total_tokens": 32969032} {"current_steps": 57150, "total_steps": 67140, "loss": 0.4628, "lr": 3.297561583661754e-06, "epoch": 8.512064343163539, "percentage": 85.12, "elapsed_time": "3:58:19", "remaining_time": "0:41:39", "throughput": 2305.8, "total_tokens": 32971752} {"current_steps": 57155, "total_steps": 67140, "loss": 0.6712, "lr": 3.2943363325537046e-06, "epoch": 8.512809055704498, "percentage": 85.13, "elapsed_time": "3:58:20", "remaining_time": "0:41:38", "throughput": 2305.81, "total_tokens": 32974600} {"current_steps": 57160, "total_steps": 67140, "loss": 0.5809, "lr": 3.2911125482261577e-06, "epoch": 8.513553768245457, "percentage": 85.14, "elapsed_time": "3:58:21", "remaining_time": "0:41:37", "throughput": 2305.83, "total_tokens": 32977448} {"current_steps": 57165, "total_steps": 67140, "loss": 0.4528, "lr": 3.287890230896959e-06, "epoch": 8.514298480786417, "percentage": 85.14, "elapsed_time": "3:58:22", "remaining_time": "0:41:35", "throughput": 2305.84, "total_tokens": 32980072} {"current_steps": 57170, "total_steps": 67140, "loss": 0.5567, "lr": 3.284669380783864e-06, "epoch": 8.515043193327376, "percentage": 85.15, "elapsed_time": "3:58:23", "remaining_time": "0:41:34", "throughput": 2305.86, "total_tokens": 32982920} {"current_steps": 57175, "total_steps": 67140, "loss": 0.6264, "lr": 3.2814499981045217e-06, "epoch": 8.515787905868335, "percentage": 85.16, "elapsed_time": "3:58:25", "remaining_time": "0:41:33", "throughput": 2305.88, "total_tokens": 32985800} {"current_steps": 57180, "total_steps": 67140, "loss": 0.5381, "lr": 3.2782320830764877e-06, "epoch": 8.516532618409293, "percentage": 85.17, "elapsed_time": "3:58:26", "remaining_time": "0:41:31", "throughput": 2305.9, "total_tokens": 32988808} {"current_steps": 57185, "total_steps": 67140, "loss": 0.6359, "lr": 3.2750156359172224e-06, "epoch": 8.517277330950254, "percentage": 85.17, "elapsed_time": "3:58:27", "remaining_time": "0:41:30", "throughput": 2305.91, "total_tokens": 32991560} {"current_steps": 57190, "total_steps": 67140, "loss": 0.7791, "lr": 3.271800656844065e-06, "epoch": 8.518022043491213, "percentage": 85.18, "elapsed_time": "3:58:28", "remaining_time": "0:41:29", "throughput": 2305.93, "total_tokens": 32994440} {"current_steps": 57195, "total_steps": 67140, "loss": 0.5584, "lr": 3.268587146074281e-06, "epoch": 8.518766756032171, "percentage": 85.19, "elapsed_time": "3:58:29", "remaining_time": "0:41:28", "throughput": 2305.93, "total_tokens": 32997096} {"current_steps": 57200, "total_steps": 67140, "loss": 0.4243, "lr": 3.26537510382503e-06, "epoch": 8.51951146857313, "percentage": 85.2, "elapsed_time": "3:58:30", "remaining_time": "0:41:26", "throughput": 2305.96, "total_tokens": 33000232} {"current_steps": 57205, "total_steps": 67140, "loss": 0.5927, "lr": 3.2621645303133553e-06, "epoch": 8.52025618111409, "percentage": 85.2, "elapsed_time": "3:58:31", "remaining_time": "0:41:25", "throughput": 2305.99, "total_tokens": 33003368} {"current_steps": 57210, "total_steps": 67140, "loss": 0.5201, "lr": 3.2589554257562243e-06, "epoch": 8.52100089365505, "percentage": 85.21, "elapsed_time": "3:58:33", "remaining_time": "0:41:24", "throughput": 2306.03, "total_tokens": 33006536} {"current_steps": 57215, "total_steps": 67140, "loss": 0.4285, "lr": 3.255747790370489e-06, "epoch": 8.521745606196008, "percentage": 85.22, "elapsed_time": "3:58:34", "remaining_time": "0:41:23", "throughput": 2306.06, "total_tokens": 33009640} {"current_steps": 57220, "total_steps": 67140, "loss": 0.5894, "lr": 3.2525416243729236e-06, "epoch": 8.522490318736967, "percentage": 85.22, "elapsed_time": "3:58:35", "remaining_time": "0:41:21", "throughput": 2306.08, "total_tokens": 33012648} {"current_steps": 57225, "total_steps": 67140, "loss": 0.5728, "lr": 3.2493369279801677e-06, "epoch": 8.523235031277927, "percentage": 85.23, "elapsed_time": "3:58:36", "remaining_time": "0:41:20", "throughput": 2306.12, "total_tokens": 33015976} {"current_steps": 57230, "total_steps": 67140, "loss": 0.6802, "lr": 3.2461337014087907e-06, "epoch": 8.523979743818886, "percentage": 85.24, "elapsed_time": "3:58:37", "remaining_time": "0:41:19", "throughput": 2306.13, "total_tokens": 33018600} {"current_steps": 57235, "total_steps": 67140, "loss": 0.5906, "lr": 3.242931944875252e-06, "epoch": 8.524724456359845, "percentage": 85.25, "elapsed_time": "3:58:38", "remaining_time": "0:41:18", "throughput": 2306.16, "total_tokens": 33021736} {"current_steps": 57240, "total_steps": 67140, "loss": 0.6204, "lr": 3.239731658595921e-06, "epoch": 8.525469168900804, "percentage": 85.25, "elapsed_time": "3:58:40", "remaining_time": "0:41:16", "throughput": 2306.19, "total_tokens": 33024808} {"current_steps": 57245, "total_steps": 67140, "loss": 0.5906, "lr": 3.236532842787049e-06, "epoch": 8.526213881441764, "percentage": 85.26, "elapsed_time": "3:58:41", "remaining_time": "0:41:15", "throughput": 2306.21, "total_tokens": 33027784} {"current_steps": 57250, "total_steps": 67140, "loss": 0.6003, "lr": 3.233335497664805e-06, "epoch": 8.526958593982723, "percentage": 85.27, "elapsed_time": "3:58:42", "remaining_time": "0:41:14", "throughput": 2306.23, "total_tokens": 33030600} {"current_steps": 57255, "total_steps": 67140, "loss": 0.6445, "lr": 3.230139623445255e-06, "epoch": 8.527703306523682, "percentage": 85.28, "elapsed_time": "3:58:43", "remaining_time": "0:41:12", "throughput": 2306.23, "total_tokens": 33033160} {"current_steps": 57260, "total_steps": 67140, "loss": 0.5188, "lr": 3.2269452203443546e-06, "epoch": 8.52844801906464, "percentage": 85.28, "elapsed_time": "3:58:44", "remaining_time": "0:41:11", "throughput": 2306.24, "total_tokens": 33035912} {"current_steps": 57265, "total_steps": 67140, "loss": 0.4101, "lr": 3.2237522885779718e-06, "epoch": 8.529192731605601, "percentage": 85.29, "elapsed_time": "3:58:45", "remaining_time": "0:41:10", "throughput": 2306.27, "total_tokens": 33038920} {"current_steps": 57270, "total_steps": 67140, "loss": 0.655, "lr": 3.220560828361874e-06, "epoch": 8.52993744414656, "percentage": 85.3, "elapsed_time": "3:58:46", "remaining_time": "0:41:09", "throughput": 2306.28, "total_tokens": 33041608} {"current_steps": 57275, "total_steps": 67140, "loss": 0.519, "lr": 3.217370839911729e-06, "epoch": 8.530682156687519, "percentage": 85.31, "elapsed_time": "3:58:47", "remaining_time": "0:41:07", "throughput": 2306.28, "total_tokens": 33044168} {"current_steps": 57280, "total_steps": 67140, "loss": 0.6383, "lr": 3.2141823234431045e-06, "epoch": 8.531426869228477, "percentage": 85.31, "elapsed_time": "3:58:49", "remaining_time": "0:41:06", "throughput": 2306.29, "total_tokens": 33046856} {"current_steps": 57285, "total_steps": 67140, "loss": 0.6354, "lr": 3.2109952791714583e-06, "epoch": 8.532171581769436, "percentage": 85.32, "elapsed_time": "3:58:50", "remaining_time": "0:41:05", "throughput": 2306.31, "total_tokens": 33049736} {"current_steps": 57290, "total_steps": 67140, "loss": 0.3831, "lr": 3.2078097073121704e-06, "epoch": 8.532916294310397, "percentage": 85.33, "elapsed_time": "3:58:51", "remaining_time": "0:41:04", "throughput": 2306.31, "total_tokens": 33052232} {"current_steps": 57295, "total_steps": 67140, "loss": 0.4045, "lr": 3.2046256080804943e-06, "epoch": 8.533661006851355, "percentage": 85.34, "elapsed_time": "3:58:52", "remaining_time": "0:41:02", "throughput": 2306.33, "total_tokens": 33055080} {"current_steps": 57300, "total_steps": 67140, "loss": 0.4906, "lr": 3.2014429816916074e-06, "epoch": 8.534405719392314, "percentage": 85.34, "elapsed_time": "3:58:53", "remaining_time": "0:41:01", "throughput": 2306.32, "total_tokens": 33057576} {"current_steps": 57305, "total_steps": 67140, "loss": 0.631, "lr": 3.198261828360577e-06, "epoch": 8.535150431933273, "percentage": 85.35, "elapsed_time": "3:58:54", "remaining_time": "0:41:00", "throughput": 2306.33, "total_tokens": 33060328} {"current_steps": 57310, "total_steps": 67140, "loss": 0.4986, "lr": 3.1950821483023723e-06, "epoch": 8.535895144474233, "percentage": 85.36, "elapsed_time": "3:58:55", "remaining_time": "0:40:58", "throughput": 2306.35, "total_tokens": 33063016} {"current_steps": 57315, "total_steps": 67140, "loss": 0.5432, "lr": 3.191903941731866e-06, "epoch": 8.536639857015192, "percentage": 85.37, "elapsed_time": "3:58:56", "remaining_time": "0:40:57", "throughput": 2306.36, "total_tokens": 33065800} {"current_steps": 57320, "total_steps": 67140, "loss": 0.705, "lr": 3.188727208863829e-06, "epoch": 8.537384569556151, "percentage": 85.37, "elapsed_time": "3:58:57", "remaining_time": "0:40:56", "throughput": 2306.39, "total_tokens": 33069032} {"current_steps": 57325, "total_steps": 67140, "loss": 0.7024, "lr": 3.1855519499129293e-06, "epoch": 8.53812928209711, "percentage": 85.38, "elapsed_time": "3:58:59", "remaining_time": "0:40:55", "throughput": 2306.41, "total_tokens": 33071816} {"current_steps": 57330, "total_steps": 67140, "loss": 0.5094, "lr": 3.1823781650937328e-06, "epoch": 8.53887399463807, "percentage": 85.39, "elapsed_time": "3:59:00", "remaining_time": "0:40:53", "throughput": 2306.43, "total_tokens": 33074760} {"current_steps": 57335, "total_steps": 67140, "loss": 0.6375, "lr": 3.1792058546207174e-06, "epoch": 8.539618707179029, "percentage": 85.4, "elapsed_time": "3:59:01", "remaining_time": "0:40:52", "throughput": 2306.46, "total_tokens": 33077928} {"current_steps": 57340, "total_steps": 67140, "loss": 0.5286, "lr": 3.176035018708251e-06, "epoch": 8.540363419719988, "percentage": 85.4, "elapsed_time": "3:59:02", "remaining_time": "0:40:51", "throughput": 2306.47, "total_tokens": 33080680} {"current_steps": 57345, "total_steps": 67140, "loss": 0.6711, "lr": 3.1728656575706118e-06, "epoch": 8.541108132260947, "percentage": 85.41, "elapsed_time": "3:59:03", "remaining_time": "0:40:50", "throughput": 2306.49, "total_tokens": 33083400} {"current_steps": 57350, "total_steps": 67140, "loss": 0.5042, "lr": 3.16969777142197e-06, "epoch": 8.541852844801907, "percentage": 85.42, "elapsed_time": "3:59:04", "remaining_time": "0:40:48", "throughput": 2306.49, "total_tokens": 33085928} {"current_steps": 57355, "total_steps": 67140, "loss": 0.611, "lr": 3.1665313604763937e-06, "epoch": 8.542597557342866, "percentage": 85.43, "elapsed_time": "3:59:05", "remaining_time": "0:40:47", "throughput": 2306.5, "total_tokens": 33088712} {"current_steps": 57360, "total_steps": 67140, "loss": 0.4617, "lr": 3.163366424947864e-06, "epoch": 8.543342269883825, "percentage": 85.43, "elapsed_time": "3:59:06", "remaining_time": "0:40:46", "throughput": 2306.51, "total_tokens": 33091432} {"current_steps": 57365, "total_steps": 67140, "loss": 0.5401, "lr": 3.1602029650502463e-06, "epoch": 8.544086982424783, "percentage": 85.44, "elapsed_time": "3:59:08", "remaining_time": "0:40:44", "throughput": 2306.52, "total_tokens": 33094056} {"current_steps": 57370, "total_steps": 67140, "loss": 0.7085, "lr": 3.1570409809973165e-06, "epoch": 8.544831694965744, "percentage": 85.45, "elapsed_time": "3:59:09", "remaining_time": "0:40:43", "throughput": 2306.54, "total_tokens": 33096968} {"current_steps": 57375, "total_steps": 67140, "loss": 0.4998, "lr": 3.153880473002752e-06, "epoch": 8.545576407506703, "percentage": 85.46, "elapsed_time": "3:59:10", "remaining_time": "0:40:42", "throughput": 2306.56, "total_tokens": 33099976} {"current_steps": 57380, "total_steps": 67140, "loss": 0.5827, "lr": 3.1507214412801243e-06, "epoch": 8.546321120047661, "percentage": 85.46, "elapsed_time": "3:59:11", "remaining_time": "0:40:41", "throughput": 2306.58, "total_tokens": 33102920} {"current_steps": 57385, "total_steps": 67140, "loss": 0.6504, "lr": 3.1475638860429147e-06, "epoch": 8.54706583258862, "percentage": 85.47, "elapsed_time": "3:59:12", "remaining_time": "0:40:39", "throughput": 2306.61, "total_tokens": 33106088} {"current_steps": 57390, "total_steps": 67140, "loss": 0.4726, "lr": 3.1444078075044873e-06, "epoch": 8.54781054512958, "percentage": 85.48, "elapsed_time": "3:59:13", "remaining_time": "0:40:38", "throughput": 2306.63, "total_tokens": 33109000} {"current_steps": 57395, "total_steps": 67140, "loss": 0.6082, "lr": 3.1412532058781198e-06, "epoch": 8.54855525767054, "percentage": 85.49, "elapsed_time": "3:59:14", "remaining_time": "0:40:37", "throughput": 2306.65, "total_tokens": 33111848} {"current_steps": 57400, "total_steps": 67140, "loss": 0.7675, "lr": 3.138100081376996e-06, "epoch": 8.549299970211498, "percentage": 85.49, "elapsed_time": "3:59:16", "remaining_time": "0:40:36", "throughput": 2306.72, "total_tokens": 33115880} {"current_steps": 57405, "total_steps": 67140, "loss": 0.4943, "lr": 3.13494843421418e-06, "epoch": 8.550044682752457, "percentage": 85.5, "elapsed_time": "3:59:17", "remaining_time": "0:40:34", "throughput": 2306.71, "total_tokens": 33118280} {"current_steps": 57410, "total_steps": 67140, "loss": 0.6077, "lr": 3.1317982646026507e-06, "epoch": 8.550789395293418, "percentage": 85.51, "elapsed_time": "3:59:18", "remaining_time": "0:40:33", "throughput": 2306.72, "total_tokens": 33120840} {"current_steps": 57415, "total_steps": 67140, "loss": 0.4602, "lr": 3.128649572755285e-06, "epoch": 8.551534107834376, "percentage": 85.52, "elapsed_time": "3:59:19", "remaining_time": "0:40:32", "throughput": 2306.72, "total_tokens": 33123464} {"current_steps": 57420, "total_steps": 67140, "loss": 0.526, "lr": 3.125502358884866e-06, "epoch": 8.552278820375335, "percentage": 85.52, "elapsed_time": "3:59:20", "remaining_time": "0:40:30", "throughput": 2306.76, "total_tokens": 33126632} {"current_steps": 57425, "total_steps": 67140, "loss": 0.7866, "lr": 3.1223566232040564e-06, "epoch": 8.553023532916294, "percentage": 85.53, "elapsed_time": "3:59:21", "remaining_time": "0:40:29", "throughput": 2306.78, "total_tokens": 33129544} {"current_steps": 57430, "total_steps": 67140, "loss": 0.5051, "lr": 3.1192123659254364e-06, "epoch": 8.553768245457253, "percentage": 85.54, "elapsed_time": "3:59:22", "remaining_time": "0:40:28", "throughput": 2306.8, "total_tokens": 33132488} {"current_steps": 57435, "total_steps": 67140, "loss": 0.5657, "lr": 3.116069587261486e-06, "epoch": 8.554512957998213, "percentage": 85.55, "elapsed_time": "3:59:24", "remaining_time": "0:40:27", "throughput": 2306.82, "total_tokens": 33135368} {"current_steps": 57440, "total_steps": 67140, "loss": 0.6346, "lr": 3.1129282874245826e-06, "epoch": 8.555257670539172, "percentage": 85.55, "elapsed_time": "3:59:25", "remaining_time": "0:40:25", "throughput": 2306.83, "total_tokens": 33138184} {"current_steps": 57445, "total_steps": 67140, "loss": 0.5766, "lr": 3.109788466626995e-06, "epoch": 8.55600238308013, "percentage": 85.56, "elapsed_time": "3:59:26", "remaining_time": "0:40:24", "throughput": 2306.86, "total_tokens": 33141320} {"current_steps": 57450, "total_steps": 67140, "loss": 0.7699, "lr": 3.106650125080904e-06, "epoch": 8.556747095621091, "percentage": 85.57, "elapsed_time": "3:59:27", "remaining_time": "0:40:23", "throughput": 2306.87, "total_tokens": 33144040} {"current_steps": 57455, "total_steps": 67140, "loss": 0.5536, "lr": 3.103513262998392e-06, "epoch": 8.55749180816205, "percentage": 85.57, "elapsed_time": "3:59:28", "remaining_time": "0:40:22", "throughput": 2306.88, "total_tokens": 33146632} {"current_steps": 57460, "total_steps": 67140, "loss": 0.4219, "lr": 3.1003778805914207e-06, "epoch": 8.558236520703009, "percentage": 85.58, "elapsed_time": "3:59:29", "remaining_time": "0:40:20", "throughput": 2306.89, "total_tokens": 33149352} {"current_steps": 57465, "total_steps": 67140, "loss": 0.5636, "lr": 3.0972439780718786e-06, "epoch": 8.558981233243967, "percentage": 85.59, "elapsed_time": "3:59:30", "remaining_time": "0:40:19", "throughput": 2306.91, "total_tokens": 33152232} {"current_steps": 57470, "total_steps": 67140, "loss": 0.5357, "lr": 3.0941115556515355e-06, "epoch": 8.559725945784926, "percentage": 85.6, "elapsed_time": "3:59:31", "remaining_time": "0:40:18", "throughput": 2306.92, "total_tokens": 33154984} {"current_steps": 57475, "total_steps": 67140, "loss": 0.4958, "lr": 3.0909806135420714e-06, "epoch": 8.560470658325887, "percentage": 85.6, "elapsed_time": "3:59:33", "remaining_time": "0:40:16", "throughput": 2306.93, "total_tokens": 33157928} {"current_steps": 57480, "total_steps": 67140, "loss": 0.4661, "lr": 3.0878511519550623e-06, "epoch": 8.561215370866845, "percentage": 85.61, "elapsed_time": "3:59:34", "remaining_time": "0:40:15", "throughput": 2306.96, "total_tokens": 33160968} {"current_steps": 57485, "total_steps": 67140, "loss": 0.5498, "lr": 3.0847231711019884e-06, "epoch": 8.561960083407804, "percentage": 85.62, "elapsed_time": "3:59:35", "remaining_time": "0:40:14", "throughput": 2306.97, "total_tokens": 33163688} {"current_steps": 57490, "total_steps": 67140, "loss": 0.5424, "lr": 3.0815966711942227e-06, "epoch": 8.562704795948763, "percentage": 85.63, "elapsed_time": "3:59:36", "remaining_time": "0:40:13", "throughput": 2307.0, "total_tokens": 33166792} {"current_steps": 57495, "total_steps": 67140, "loss": 0.4926, "lr": 3.078471652443035e-06, "epoch": 8.563449508489724, "percentage": 85.63, "elapsed_time": "3:59:37", "remaining_time": "0:40:11", "throughput": 2307.01, "total_tokens": 33169576} {"current_steps": 57500, "total_steps": 67140, "loss": 0.5596, "lr": 3.0753481150596038e-06, "epoch": 8.564194221030682, "percentage": 85.64, "elapsed_time": "3:59:38", "remaining_time": "0:40:10", "throughput": 2307.04, "total_tokens": 33172584} {"current_steps": 57505, "total_steps": 67140, "loss": 0.4476, "lr": 3.072226059255012e-06, "epoch": 8.564938933571641, "percentage": 85.65, "elapsed_time": "3:59:40", "remaining_time": "0:40:09", "throughput": 2307.05, "total_tokens": 33175464} {"current_steps": 57510, "total_steps": 67140, "loss": 0.5508, "lr": 3.0691054852402286e-06, "epoch": 8.5656836461126, "percentage": 85.66, "elapsed_time": "3:59:41", "remaining_time": "0:40:08", "throughput": 2307.07, "total_tokens": 33178248} {"current_steps": 57515, "total_steps": 67140, "loss": 0.613, "lr": 3.065986393226139e-06, "epoch": 8.56642835865356, "percentage": 85.66, "elapsed_time": "3:59:42", "remaining_time": "0:40:06", "throughput": 2307.1, "total_tokens": 33181448} {"current_steps": 57520, "total_steps": 67140, "loss": 0.552, "lr": 3.0628687834235032e-06, "epoch": 8.567173071194519, "percentage": 85.67, "elapsed_time": "3:59:43", "remaining_time": "0:40:05", "throughput": 2307.1, "total_tokens": 33184040} {"current_steps": 57525, "total_steps": 67140, "loss": 0.5325, "lr": 3.0597526560430133e-06, "epoch": 8.567917783735478, "percentage": 85.68, "elapsed_time": "3:59:44", "remaining_time": "0:40:04", "throughput": 2307.12, "total_tokens": 33186984} {"current_steps": 57530, "total_steps": 67140, "loss": 0.6949, "lr": 3.056638011295229e-06, "epoch": 8.568662496276437, "percentage": 85.69, "elapsed_time": "3:59:45", "remaining_time": "0:40:03", "throughput": 2307.14, "total_tokens": 33189896} {"current_steps": 57535, "total_steps": 67140, "loss": 0.7075, "lr": 3.053524849390635e-06, "epoch": 8.569407208817397, "percentage": 85.69, "elapsed_time": "3:59:46", "remaining_time": "0:40:01", "throughput": 2307.16, "total_tokens": 33192680} {"current_steps": 57540, "total_steps": 67140, "loss": 0.6366, "lr": 3.050413170539604e-06, "epoch": 8.570151921358356, "percentage": 85.7, "elapsed_time": "3:59:47", "remaining_time": "0:40:00", "throughput": 2307.17, "total_tokens": 33195368} {"current_steps": 57545, "total_steps": 67140, "loss": 0.4962, "lr": 3.0473029749524094e-06, "epoch": 8.570896633899315, "percentage": 85.71, "elapsed_time": "3:59:49", "remaining_time": "0:39:59", "throughput": 2307.19, "total_tokens": 33198280} {"current_steps": 57550, "total_steps": 67140, "loss": 0.5384, "lr": 3.044194262839231e-06, "epoch": 8.571641346440273, "percentage": 85.72, "elapsed_time": "3:59:50", "remaining_time": "0:39:57", "throughput": 2307.21, "total_tokens": 33201352} {"current_steps": 57555, "total_steps": 67140, "loss": 0.6853, "lr": 3.041087034410134e-06, "epoch": 8.572386058981234, "percentage": 85.72, "elapsed_time": "3:59:51", "remaining_time": "0:39:56", "throughput": 2307.22, "total_tokens": 33204040} {"current_steps": 57560, "total_steps": 67140, "loss": 0.4663, "lr": 3.037981289875097e-06, "epoch": 8.573130771522193, "percentage": 85.73, "elapsed_time": "3:59:52", "remaining_time": "0:39:55", "throughput": 2307.25, "total_tokens": 33207016} {"current_steps": 57565, "total_steps": 67140, "loss": 0.7198, "lr": 3.0348770294439973e-06, "epoch": 8.573875484063151, "percentage": 85.74, "elapsed_time": "3:59:53", "remaining_time": "0:39:54", "throughput": 2307.26, "total_tokens": 33209832} {"current_steps": 57570, "total_steps": 67140, "loss": 0.7682, "lr": 3.0317742533266024e-06, "epoch": 8.57462019660411, "percentage": 85.75, "elapsed_time": "3:59:54", "remaining_time": "0:39:52", "throughput": 2307.26, "total_tokens": 33212328} {"current_steps": 57575, "total_steps": 67140, "loss": 0.5415, "lr": 3.0286729617325844e-06, "epoch": 8.57536490914507, "percentage": 85.75, "elapsed_time": "3:59:55", "remaining_time": "0:39:51", "throughput": 2307.29, "total_tokens": 33215240} {"current_steps": 57580, "total_steps": 67140, "loss": 0.831, "lr": 3.0255731548715195e-06, "epoch": 8.57610962168603, "percentage": 85.76, "elapsed_time": "3:59:56", "remaining_time": "0:39:50", "throughput": 2307.31, "total_tokens": 33218152} {"current_steps": 57585, "total_steps": 67140, "loss": 0.4309, "lr": 3.0224748329528846e-06, "epoch": 8.576854334226988, "percentage": 85.77, "elapsed_time": "3:59:58", "remaining_time": "0:39:49", "throughput": 2307.32, "total_tokens": 33220872} {"current_steps": 57590, "total_steps": 67140, "loss": 0.6425, "lr": 3.0193779961860403e-06, "epoch": 8.577599046767947, "percentage": 85.78, "elapsed_time": "3:59:59", "remaining_time": "0:39:47", "throughput": 2307.34, "total_tokens": 33224008} {"current_steps": 57595, "total_steps": 67140, "loss": 0.6233, "lr": 3.0162826447802634e-06, "epoch": 8.578343759308908, "percentage": 85.78, "elapsed_time": "4:00:00", "remaining_time": "0:39:46", "throughput": 2307.36, "total_tokens": 33226888} {"current_steps": 57600, "total_steps": 67140, "loss": 0.5934, "lr": 3.0131887789447284e-06, "epoch": 8.579088471849866, "percentage": 85.79, "elapsed_time": "4:00:01", "remaining_time": "0:39:45", "throughput": 2307.38, "total_tokens": 33229736} {"current_steps": 57605, "total_steps": 67140, "loss": 0.5136, "lr": 3.0100963988885067e-06, "epoch": 8.579833184390825, "percentage": 85.8, "elapsed_time": "4:00:02", "remaining_time": "0:39:43", "throughput": 2307.4, "total_tokens": 33232808} {"current_steps": 57610, "total_steps": 67140, "loss": 0.4329, "lr": 3.0070055048205647e-06, "epoch": 8.580577896931784, "percentage": 85.81, "elapsed_time": "4:00:03", "remaining_time": "0:39:42", "throughput": 2307.43, "total_tokens": 33235784} {"current_steps": 57615, "total_steps": 67140, "loss": 0.5747, "lr": 3.003916096949769e-06, "epoch": 8.581322609472743, "percentage": 85.81, "elapsed_time": "4:00:04", "remaining_time": "0:39:41", "throughput": 2307.45, "total_tokens": 33238696} {"current_steps": 57620, "total_steps": 67140, "loss": 0.4848, "lr": 3.0008281754849018e-06, "epoch": 8.582067322013703, "percentage": 85.82, "elapsed_time": "4:00:06", "remaining_time": "0:39:40", "throughput": 2307.46, "total_tokens": 33241448} {"current_steps": 57625, "total_steps": 67140, "loss": 0.4696, "lr": 2.9977417406346186e-06, "epoch": 8.582812034554662, "percentage": 85.83, "elapsed_time": "4:00:07", "remaining_time": "0:39:38", "throughput": 2307.48, "total_tokens": 33244296} {"current_steps": 57630, "total_steps": 67140, "loss": 0.4747, "lr": 2.994656792607495e-06, "epoch": 8.58355674709562, "percentage": 85.84, "elapsed_time": "4:00:08", "remaining_time": "0:39:37", "throughput": 2307.49, "total_tokens": 33247176} {"current_steps": 57635, "total_steps": 67140, "loss": 0.5396, "lr": 2.9915733316119963e-06, "epoch": 8.584301459636581, "percentage": 85.84, "elapsed_time": "4:00:09", "remaining_time": "0:39:36", "throughput": 2307.51, "total_tokens": 33250088} {"current_steps": 57640, "total_steps": 67140, "loss": 0.5781, "lr": 2.988491357856493e-06, "epoch": 8.58504617217754, "percentage": 85.85, "elapsed_time": "4:00:10", "remaining_time": "0:39:35", "throughput": 2307.54, "total_tokens": 33253192} {"current_steps": 57645, "total_steps": 67140, "loss": 0.3667, "lr": 2.9854108715492572e-06, "epoch": 8.585790884718499, "percentage": 85.86, "elapsed_time": "4:00:11", "remaining_time": "0:39:33", "throughput": 2307.55, "total_tokens": 33255880} {"current_steps": 57650, "total_steps": 67140, "loss": 0.7268, "lr": 2.9823318728984447e-06, "epoch": 8.586535597259457, "percentage": 85.87, "elapsed_time": "4:00:12", "remaining_time": "0:39:32", "throughput": 2307.57, "total_tokens": 33258824} {"current_steps": 57655, "total_steps": 67140, "loss": 0.4184, "lr": 2.97925436211213e-06, "epoch": 8.587280309800416, "percentage": 85.87, "elapsed_time": "4:00:14", "remaining_time": "0:39:31", "throughput": 2307.59, "total_tokens": 33261704} {"current_steps": 57660, "total_steps": 67140, "loss": 0.4249, "lr": 2.9761783393982722e-06, "epoch": 8.588025022341377, "percentage": 85.88, "elapsed_time": "4:00:15", "remaining_time": "0:39:30", "throughput": 2307.62, "total_tokens": 33264872} {"current_steps": 57665, "total_steps": 67140, "loss": 0.5969, "lr": 2.9731038049647385e-06, "epoch": 8.588769734882336, "percentage": 85.89, "elapsed_time": "4:00:16", "remaining_time": "0:39:28", "throughput": 2307.65, "total_tokens": 33267944} {"current_steps": 57670, "total_steps": 67140, "loss": 0.524, "lr": 2.970030759019296e-06, "epoch": 8.589514447423294, "percentage": 85.9, "elapsed_time": "4:00:17", "remaining_time": "0:39:27", "throughput": 2307.68, "total_tokens": 33271144} {"current_steps": 57675, "total_steps": 67140, "loss": 0.5452, "lr": 2.966959201769609e-06, "epoch": 8.590259159964253, "percentage": 85.9, "elapsed_time": "4:00:18", "remaining_time": "0:39:26", "throughput": 2307.69, "total_tokens": 33273672} {"current_steps": 57680, "total_steps": 67140, "loss": 0.4919, "lr": 2.963889133423242e-06, "epoch": 8.591003872505214, "percentage": 85.91, "elapsed_time": "4:00:19", "remaining_time": "0:39:24", "throughput": 2307.7, "total_tokens": 33276584} {"current_steps": 57685, "total_steps": 67140, "loss": 0.4128, "lr": 2.9608205541876516e-06, "epoch": 8.591748585046172, "percentage": 85.92, "elapsed_time": "4:00:20", "remaining_time": "0:39:23", "throughput": 2307.72, "total_tokens": 33279304} {"current_steps": 57690, "total_steps": 67140, "loss": 0.6988, "lr": 2.957753464270208e-06, "epoch": 8.592493297587131, "percentage": 85.92, "elapsed_time": "4:00:22", "remaining_time": "0:39:22", "throughput": 2307.73, "total_tokens": 33282088} {"current_steps": 57695, "total_steps": 67140, "loss": 0.454, "lr": 2.954687863878164e-06, "epoch": 8.59323801012809, "percentage": 85.93, "elapsed_time": "4:00:23", "remaining_time": "0:39:21", "throughput": 2307.75, "total_tokens": 33285128} {"current_steps": 57700, "total_steps": 67140, "loss": 0.4647, "lr": 2.9516237532186826e-06, "epoch": 8.59398272266905, "percentage": 85.94, "elapsed_time": "4:00:24", "remaining_time": "0:39:19", "throughput": 2307.77, "total_tokens": 33288040} {"current_steps": 57705, "total_steps": 67140, "loss": 0.5734, "lr": 2.9485611324988254e-06, "epoch": 8.59472743521001, "percentage": 85.95, "elapsed_time": "4:00:25", "remaining_time": "0:39:18", "throughput": 2307.79, "total_tokens": 33290824} {"current_steps": 57710, "total_steps": 67140, "loss": 0.7145, "lr": 2.9455000019255524e-06, "epoch": 8.595472147750968, "percentage": 85.95, "elapsed_time": "4:00:26", "remaining_time": "0:39:17", "throughput": 2307.82, "total_tokens": 33293960} {"current_steps": 57715, "total_steps": 67140, "loss": 0.5609, "lr": 2.9424403617057285e-06, "epoch": 8.596216860291927, "percentage": 85.96, "elapsed_time": "4:00:27", "remaining_time": "0:39:16", "throughput": 2307.83, "total_tokens": 33296712} {"current_steps": 57720, "total_steps": 67140, "loss": 0.7493, "lr": 2.939382212046099e-06, "epoch": 8.596961572832887, "percentage": 85.97, "elapsed_time": "4:00:28", "remaining_time": "0:39:14", "throughput": 2307.84, "total_tokens": 33299560} {"current_steps": 57725, "total_steps": 67140, "loss": 0.6339, "lr": 2.936325553153335e-06, "epoch": 8.597706285373846, "percentage": 85.98, "elapsed_time": "4:00:30", "remaining_time": "0:39:13", "throughput": 2307.87, "total_tokens": 33302600} {"current_steps": 57730, "total_steps": 67140, "loss": 0.567, "lr": 2.9332703852339797e-06, "epoch": 8.598450997914805, "percentage": 85.98, "elapsed_time": "4:00:31", "remaining_time": "0:39:12", "throughput": 2307.89, "total_tokens": 33305480} {"current_steps": 57735, "total_steps": 67140, "loss": 0.5646, "lr": 2.930216708494493e-06, "epoch": 8.599195710455763, "percentage": 85.99, "elapsed_time": "4:00:32", "remaining_time": "0:39:11", "throughput": 2307.91, "total_tokens": 33308552} {"current_steps": 57740, "total_steps": 67140, "loss": 0.4831, "lr": 2.927164523141235e-06, "epoch": 8.599940422996724, "percentage": 86.0, "elapsed_time": "4:00:33", "remaining_time": "0:39:09", "throughput": 2307.92, "total_tokens": 33311208} {"current_steps": 57745, "total_steps": 67140, "loss": 0.6666, "lr": 2.9241138293804565e-06, "epoch": 8.600685135537683, "percentage": 86.01, "elapsed_time": "4:00:34", "remaining_time": "0:39:08", "throughput": 2307.92, "total_tokens": 33313832} {"current_steps": 57750, "total_steps": 67140, "loss": 0.4806, "lr": 2.9210646274183157e-06, "epoch": 8.601429848078642, "percentage": 86.01, "elapsed_time": "4:00:35", "remaining_time": "0:39:07", "throughput": 2307.95, "total_tokens": 33316840} {"current_steps": 57755, "total_steps": 67140, "loss": 0.6287, "lr": 2.9180169174608555e-06, "epoch": 8.6021745606196, "percentage": 86.02, "elapsed_time": "4:00:36", "remaining_time": "0:39:05", "throughput": 2307.97, "total_tokens": 33319784} {"current_steps": 57760, "total_steps": 67140, "loss": 0.5423, "lr": 2.9149706997140316e-06, "epoch": 8.60291927316056, "percentage": 86.03, "elapsed_time": "4:00:37", "remaining_time": "0:39:04", "throughput": 2307.99, "total_tokens": 33322632} {"current_steps": 57765, "total_steps": 67140, "loss": 0.4092, "lr": 2.911925974383703e-06, "epoch": 8.60366398570152, "percentage": 86.04, "elapsed_time": "4:00:39", "remaining_time": "0:39:03", "throughput": 2308.0, "total_tokens": 33325480} {"current_steps": 57770, "total_steps": 67140, "loss": 0.5366, "lr": 2.908882741675609e-06, "epoch": 8.604408698242478, "percentage": 86.04, "elapsed_time": "4:00:40", "remaining_time": "0:39:02", "throughput": 2308.02, "total_tokens": 33328392} {"current_steps": 57775, "total_steps": 67140, "loss": 0.6161, "lr": 2.9058410017954035e-06, "epoch": 8.605153410783437, "percentage": 86.05, "elapsed_time": "4:00:41", "remaining_time": "0:39:00", "throughput": 2308.04, "total_tokens": 33331144} {"current_steps": 57780, "total_steps": 67140, "loss": 0.5416, "lr": 2.902800754948634e-06, "epoch": 8.605898123324398, "percentage": 86.06, "elapsed_time": "4:00:42", "remaining_time": "0:38:59", "throughput": 2308.07, "total_tokens": 33334344} {"current_steps": 57785, "total_steps": 67140, "loss": 0.5045, "lr": 2.8997620013407557e-06, "epoch": 8.606642835865356, "percentage": 86.07, "elapsed_time": "4:00:43", "remaining_time": "0:38:58", "throughput": 2308.09, "total_tokens": 33337192} {"current_steps": 57790, "total_steps": 67140, "loss": 0.4827, "lr": 2.896724741177101e-06, "epoch": 8.607387548406315, "percentage": 86.07, "elapsed_time": "4:00:44", "remaining_time": "0:38:57", "throughput": 2308.1, "total_tokens": 33339912} {"current_steps": 57795, "total_steps": 67140, "loss": 0.5274, "lr": 2.893688974662925e-06, "epoch": 8.608132260947274, "percentage": 86.08, "elapsed_time": "4:00:45", "remaining_time": "0:38:55", "throughput": 2308.1, "total_tokens": 33342600} {"current_steps": 57800, "total_steps": 67140, "loss": 0.5217, "lr": 2.8906547020033703e-06, "epoch": 8.608876973488233, "percentage": 86.09, "elapsed_time": "4:00:46", "remaining_time": "0:38:54", "throughput": 2308.12, "total_tokens": 33345448} {"current_steps": 57805, "total_steps": 67140, "loss": 0.5912, "lr": 2.887621923403483e-06, "epoch": 8.609621686029193, "percentage": 86.1, "elapsed_time": "4:00:48", "remaining_time": "0:38:53", "throughput": 2308.14, "total_tokens": 33348360} {"current_steps": 57810, "total_steps": 67140, "loss": 0.6344, "lr": 2.884590639068202e-06, "epoch": 8.610366398570152, "percentage": 86.1, "elapsed_time": "4:00:49", "remaining_time": "0:38:51", "throughput": 2308.17, "total_tokens": 33351400} {"current_steps": 57815, "total_steps": 67140, "loss": 0.6486, "lr": 2.8815608492023696e-06, "epoch": 8.61111111111111, "percentage": 86.11, "elapsed_time": "4:00:50", "remaining_time": "0:38:50", "throughput": 2308.18, "total_tokens": 33354152} {"current_steps": 57820, "total_steps": 67140, "loss": 0.6242, "lr": 2.878532554010732e-06, "epoch": 8.61185582365207, "percentage": 86.12, "elapsed_time": "4:00:51", "remaining_time": "0:38:49", "throughput": 2308.21, "total_tokens": 33357256} {"current_steps": 57825, "total_steps": 67140, "loss": 0.3968, "lr": 2.875505753697921e-06, "epoch": 8.61260053619303, "percentage": 86.13, "elapsed_time": "4:00:52", "remaining_time": "0:38:48", "throughput": 2308.22, "total_tokens": 33360072} {"current_steps": 57830, "total_steps": 67140, "loss": 0.6206, "lr": 2.8724804484684785e-06, "epoch": 8.613345248733989, "percentage": 86.13, "elapsed_time": "4:00:53", "remaining_time": "0:38:46", "throughput": 2308.24, "total_tokens": 33362888} {"current_steps": 57835, "total_steps": 67140, "loss": 0.6522, "lr": 2.8694566385268463e-06, "epoch": 8.614089961274948, "percentage": 86.14, "elapsed_time": "4:00:54", "remaining_time": "0:38:45", "throughput": 2308.25, "total_tokens": 33365640} {"current_steps": 57840, "total_steps": 67140, "loss": 0.4698, "lr": 2.866434324077355e-06, "epoch": 8.614834673815906, "percentage": 86.15, "elapsed_time": "4:00:56", "remaining_time": "0:38:44", "throughput": 2308.27, "total_tokens": 33368648} {"current_steps": 57845, "total_steps": 67140, "loss": 0.8099, "lr": 2.86341350532425e-06, "epoch": 8.615579386356867, "percentage": 86.16, "elapsed_time": "4:00:57", "remaining_time": "0:38:43", "throughput": 2308.29, "total_tokens": 33371464} {"current_steps": 57850, "total_steps": 67140, "loss": 0.6473, "lr": 2.8603941824716542e-06, "epoch": 8.616324098897826, "percentage": 86.16, "elapsed_time": "4:00:58", "remaining_time": "0:38:41", "throughput": 2308.3, "total_tokens": 33374280} {"current_steps": 57855, "total_steps": 67140, "loss": 0.5464, "lr": 2.857376355723612e-06, "epoch": 8.617068811438784, "percentage": 86.17, "elapsed_time": "4:00:59", "remaining_time": "0:38:40", "throughput": 2308.32, "total_tokens": 33377096} {"current_steps": 57860, "total_steps": 67140, "loss": 0.4931, "lr": 2.8543600252840448e-06, "epoch": 8.617813523979743, "percentage": 86.18, "elapsed_time": "4:01:00", "remaining_time": "0:38:39", "throughput": 2308.34, "total_tokens": 33380008} {"current_steps": 57865, "total_steps": 67140, "loss": 0.6516, "lr": 2.8513451913567883e-06, "epoch": 8.618558236520704, "percentage": 86.19, "elapsed_time": "4:01:01", "remaining_time": "0:38:38", "throughput": 2308.35, "total_tokens": 33382888} {"current_steps": 57870, "total_steps": 67140, "loss": 0.5269, "lr": 2.848331854145575e-06, "epoch": 8.619302949061662, "percentage": 86.19, "elapsed_time": "4:01:02", "remaining_time": "0:38:36", "throughput": 2308.38, "total_tokens": 33385896} {"current_steps": 57875, "total_steps": 67140, "loss": 0.6146, "lr": 2.845320013854033e-06, "epoch": 8.620047661602621, "percentage": 86.2, "elapsed_time": "4:01:04", "remaining_time": "0:38:35", "throughput": 2308.4, "total_tokens": 33388744} {"current_steps": 57880, "total_steps": 67140, "loss": 0.6217, "lr": 2.8423096706856973e-06, "epoch": 8.62079237414358, "percentage": 86.21, "elapsed_time": "4:01:05", "remaining_time": "0:38:34", "throughput": 2308.41, "total_tokens": 33391592} {"current_steps": 57885, "total_steps": 67140, "loss": 0.442, "lr": 2.839300824843985e-06, "epoch": 8.62153708668454, "percentage": 86.22, "elapsed_time": "4:01:06", "remaining_time": "0:38:32", "throughput": 2308.44, "total_tokens": 33394600} {"current_steps": 57890, "total_steps": 67140, "loss": 0.74, "lr": 2.8362934765322174e-06, "epoch": 8.6222817992255, "percentage": 86.22, "elapsed_time": "4:01:07", "remaining_time": "0:38:31", "throughput": 2308.45, "total_tokens": 33397448} {"current_steps": 57895, "total_steps": 67140, "loss": 0.8691, "lr": 2.833287625953629e-06, "epoch": 8.623026511766458, "percentage": 86.23, "elapsed_time": "4:01:08", "remaining_time": "0:38:30", "throughput": 2308.47, "total_tokens": 33400392} {"current_steps": 57900, "total_steps": 67140, "loss": 0.5966, "lr": 2.8302832733113376e-06, "epoch": 8.623771224307417, "percentage": 86.24, "elapsed_time": "4:01:09", "remaining_time": "0:38:29", "throughput": 2308.5, "total_tokens": 33403432} {"current_steps": 57905, "total_steps": 67140, "loss": 0.5463, "lr": 2.8272804188083675e-06, "epoch": 8.624515936848377, "percentage": 86.25, "elapsed_time": "4:01:10", "remaining_time": "0:38:27", "throughput": 2308.52, "total_tokens": 33406312} {"current_steps": 57910, "total_steps": 67140, "loss": 0.7213, "lr": 2.824279062647639e-06, "epoch": 8.625260649389336, "percentage": 86.25, "elapsed_time": "4:01:12", "remaining_time": "0:38:26", "throughput": 2308.54, "total_tokens": 33409256} {"current_steps": 57915, "total_steps": 67140, "loss": 0.546, "lr": 2.8212792050319766e-06, "epoch": 8.626005361930295, "percentage": 86.26, "elapsed_time": "4:01:13", "remaining_time": "0:38:25", "throughput": 2308.56, "total_tokens": 33412296} {"current_steps": 57920, "total_steps": 67140, "loss": 0.7283, "lr": 2.8182808461640897e-06, "epoch": 8.626750074471254, "percentage": 86.27, "elapsed_time": "4:01:14", "remaining_time": "0:38:24", "throughput": 2308.58, "total_tokens": 33415112} {"current_steps": 57925, "total_steps": 67140, "loss": 0.5314, "lr": 2.8152839862466027e-06, "epoch": 8.627494787012214, "percentage": 86.27, "elapsed_time": "4:01:15", "remaining_time": "0:38:22", "throughput": 2308.58, "total_tokens": 33417704} {"current_steps": 57930, "total_steps": 67140, "loss": 0.625, "lr": 2.812288625482021e-06, "epoch": 8.628239499553173, "percentage": 86.28, "elapsed_time": "4:01:16", "remaining_time": "0:38:21", "throughput": 2308.6, "total_tokens": 33420648} {"current_steps": 57935, "total_steps": 67140, "loss": 0.463, "lr": 2.8092947640727673e-06, "epoch": 8.628984212094132, "percentage": 86.29, "elapsed_time": "4:01:17", "remaining_time": "0:38:20", "throughput": 2308.62, "total_tokens": 33423592} {"current_steps": 57940, "total_steps": 67140, "loss": 0.5458, "lr": 2.8063024022211533e-06, "epoch": 8.62972892463509, "percentage": 86.3, "elapsed_time": "4:01:18", "remaining_time": "0:38:19", "throughput": 2308.64, "total_tokens": 33426376} {"current_steps": 57945, "total_steps": 67140, "loss": 0.4925, "lr": 2.8033115401293884e-06, "epoch": 8.63047363717605, "percentage": 86.3, "elapsed_time": "4:01:20", "remaining_time": "0:38:17", "throughput": 2308.68, "total_tokens": 33429864} {"current_steps": 57950, "total_steps": 67140, "loss": 0.5855, "lr": 2.80032217799959e-06, "epoch": 8.63121834971701, "percentage": 86.31, "elapsed_time": "4:01:21", "remaining_time": "0:38:16", "throughput": 2308.71, "total_tokens": 33433000} {"current_steps": 57955, "total_steps": 67140, "loss": 0.5094, "lr": 2.7973343160337562e-06, "epoch": 8.631963062257968, "percentage": 86.32, "elapsed_time": "4:01:22", "remaining_time": "0:38:15", "throughput": 2308.72, "total_tokens": 33435752} {"current_steps": 57960, "total_steps": 67140, "loss": 0.5309, "lr": 2.7943479544337988e-06, "epoch": 8.632707774798927, "percentage": 86.33, "elapsed_time": "4:01:23", "remaining_time": "0:38:13", "throughput": 2308.72, "total_tokens": 33438216} {"current_steps": 57965, "total_steps": 67140, "loss": 0.6175, "lr": 2.7913630934015304e-06, "epoch": 8.633452487339888, "percentage": 86.33, "elapsed_time": "4:01:24", "remaining_time": "0:38:12", "throughput": 2308.74, "total_tokens": 33441128} {"current_steps": 57970, "total_steps": 67140, "loss": 0.6701, "lr": 2.7883797331386465e-06, "epoch": 8.634197199880846, "percentage": 86.34, "elapsed_time": "4:01:25", "remaining_time": "0:38:11", "throughput": 2308.76, "total_tokens": 33444008} {"current_steps": 57975, "total_steps": 67140, "loss": 0.4347, "lr": 2.785397873846754e-06, "epoch": 8.634941912421805, "percentage": 86.35, "elapsed_time": "4:01:26", "remaining_time": "0:38:10", "throughput": 2308.77, "total_tokens": 33446696} {"current_steps": 57980, "total_steps": 67140, "loss": 0.4007, "lr": 2.7824175157273564e-06, "epoch": 8.635686624962764, "percentage": 86.36, "elapsed_time": "4:01:27", "remaining_time": "0:38:08", "throughput": 2308.79, "total_tokens": 33449640} {"current_steps": 57985, "total_steps": 67140, "loss": 0.6477, "lr": 2.779438658981856e-06, "epoch": 8.636431337503723, "percentage": 86.36, "elapsed_time": "4:01:29", "remaining_time": "0:38:07", "throughput": 2308.8, "total_tokens": 33452456} {"current_steps": 57990, "total_steps": 67140, "loss": 0.7168, "lr": 2.776461303811545e-06, "epoch": 8.637176050044683, "percentage": 86.37, "elapsed_time": "4:01:30", "remaining_time": "0:38:06", "throughput": 2308.81, "total_tokens": 33455144} {"current_steps": 57995, "total_steps": 67140, "loss": 0.4443, "lr": 2.7734854504176234e-06, "epoch": 8.637920762585642, "percentage": 86.38, "elapsed_time": "4:01:31", "remaining_time": "0:38:05", "throughput": 2308.82, "total_tokens": 33457832} {"current_steps": 58000, "total_steps": 67140, "loss": 0.5302, "lr": 2.770511099001191e-06, "epoch": 8.6386654751266, "percentage": 86.39, "elapsed_time": "4:01:32", "remaining_time": "0:38:03", "throughput": 2308.83, "total_tokens": 33460456} {"current_steps": 58005, "total_steps": 67140, "loss": 0.6602, "lr": 2.7675382497632435e-06, "epoch": 8.63941018766756, "percentage": 86.39, "elapsed_time": "4:01:33", "remaining_time": "0:38:02", "throughput": 2308.84, "total_tokens": 33463336} {"current_steps": 58010, "total_steps": 67140, "loss": 0.7604, "lr": 2.764566902904664e-06, "epoch": 8.64015490020852, "percentage": 86.4, "elapsed_time": "4:01:34", "remaining_time": "0:38:01", "throughput": 2308.86, "total_tokens": 33466248} {"current_steps": 58015, "total_steps": 67140, "loss": 0.5805, "lr": 2.761597058626253e-06, "epoch": 8.640899612749479, "percentage": 86.41, "elapsed_time": "4:01:35", "remaining_time": "0:38:00", "throughput": 2308.88, "total_tokens": 33469224} {"current_steps": 58020, "total_steps": 67140, "loss": 0.7127, "lr": 2.758628717128703e-06, "epoch": 8.641644325290438, "percentage": 86.42, "elapsed_time": "4:01:37", "remaining_time": "0:37:58", "throughput": 2308.92, "total_tokens": 33472488} {"current_steps": 58025, "total_steps": 67140, "loss": 0.5744, "lr": 2.755661878612592e-06, "epoch": 8.642389037831396, "percentage": 86.42, "elapsed_time": "4:01:38", "remaining_time": "0:37:57", "throughput": 2308.94, "total_tokens": 33475304} {"current_steps": 58030, "total_steps": 67140, "loss": 0.4375, "lr": 2.75269654327841e-06, "epoch": 8.643133750372357, "percentage": 86.43, "elapsed_time": "4:01:39", "remaining_time": "0:37:56", "throughput": 2308.95, "total_tokens": 33478152} {"current_steps": 58035, "total_steps": 67140, "loss": 0.5747, "lr": 2.749732711326547e-06, "epoch": 8.643878462913316, "percentage": 86.44, "elapsed_time": "4:01:40", "remaining_time": "0:37:54", "throughput": 2308.98, "total_tokens": 33481384} {"current_steps": 58040, "total_steps": 67140, "loss": 0.4799, "lr": 2.7467703829572836e-06, "epoch": 8.644623175454274, "percentage": 86.45, "elapsed_time": "4:01:41", "remaining_time": "0:37:53", "throughput": 2309.0, "total_tokens": 33484200} {"current_steps": 58045, "total_steps": 67140, "loss": 0.7116, "lr": 2.7438095583708078e-06, "epoch": 8.645367887995233, "percentage": 86.45, "elapsed_time": "4:01:42", "remaining_time": "0:37:52", "throughput": 2309.02, "total_tokens": 33487144} {"current_steps": 58050, "total_steps": 67140, "loss": 0.5643, "lr": 2.740850237767195e-06, "epoch": 8.646112600536194, "percentage": 86.46, "elapsed_time": "4:01:43", "remaining_time": "0:37:51", "throughput": 2309.05, "total_tokens": 33490152} {"current_steps": 58055, "total_steps": 67140, "loss": 0.6686, "lr": 2.737892421346419e-06, "epoch": 8.646857313077152, "percentage": 86.47, "elapsed_time": "4:01:44", "remaining_time": "0:37:49", "throughput": 2309.05, "total_tokens": 33492776} {"current_steps": 58060, "total_steps": 67140, "loss": 0.3075, "lr": 2.7349361093083643e-06, "epoch": 8.647602025618111, "percentage": 86.48, "elapsed_time": "4:01:46", "remaining_time": "0:37:48", "throughput": 2309.07, "total_tokens": 33495592} {"current_steps": 58065, "total_steps": 67140, "loss": 0.5095, "lr": 2.7319813018528013e-06, "epoch": 8.64834673815907, "percentage": 86.48, "elapsed_time": "4:01:47", "remaining_time": "0:37:47", "throughput": 2309.09, "total_tokens": 33498440} {"current_steps": 58070, "total_steps": 67140, "loss": 0.6415, "lr": 2.7290279991794067e-06, "epoch": 8.64909145070003, "percentage": 86.49, "elapsed_time": "4:01:48", "remaining_time": "0:37:46", "throughput": 2309.12, "total_tokens": 33501576} {"current_steps": 58075, "total_steps": 67140, "loss": 0.5876, "lr": 2.7260762014877538e-06, "epoch": 8.64983616324099, "percentage": 86.5, "elapsed_time": "4:01:49", "remaining_time": "0:37:44", "throughput": 2309.13, "total_tokens": 33504328} {"current_steps": 58080, "total_steps": 67140, "loss": 0.7629, "lr": 2.723125908977317e-06, "epoch": 8.650580875781948, "percentage": 86.51, "elapsed_time": "4:01:50", "remaining_time": "0:37:43", "throughput": 2309.16, "total_tokens": 33507496} {"current_steps": 58085, "total_steps": 67140, "loss": 0.7148, "lr": 2.7201771218474558e-06, "epoch": 8.651325588322907, "percentage": 86.51, "elapsed_time": "4:01:51", "remaining_time": "0:37:42", "throughput": 2309.18, "total_tokens": 33510312} {"current_steps": 58090, "total_steps": 67140, "loss": 0.5492, "lr": 2.7172298402974443e-06, "epoch": 8.652070300863867, "percentage": 86.52, "elapsed_time": "4:01:52", "remaining_time": "0:37:41", "throughput": 2309.18, "total_tokens": 33512968} {"current_steps": 58095, "total_steps": 67140, "loss": 0.513, "lr": 2.7142840645264426e-06, "epoch": 8.652815013404826, "percentage": 86.53, "elapsed_time": "4:01:54", "remaining_time": "0:37:39", "throughput": 2309.2, "total_tokens": 33515912} {"current_steps": 58100, "total_steps": 67140, "loss": 0.5717, "lr": 2.711339794733517e-06, "epoch": 8.653559725945785, "percentage": 86.54, "elapsed_time": "4:01:55", "remaining_time": "0:37:38", "throughput": 2309.21, "total_tokens": 33518504} {"current_steps": 58105, "total_steps": 67140, "loss": 0.6038, "lr": 2.7083970311176267e-06, "epoch": 8.654304438486744, "percentage": 86.54, "elapsed_time": "4:01:56", "remaining_time": "0:37:37", "throughput": 2309.22, "total_tokens": 33521256} {"current_steps": 58110, "total_steps": 67140, "loss": 0.4729, "lr": 2.7054557738776356e-06, "epoch": 8.655049151027704, "percentage": 86.55, "elapsed_time": "4:01:57", "remaining_time": "0:37:35", "throughput": 2309.24, "total_tokens": 33524136} {"current_steps": 58115, "total_steps": 67140, "loss": 0.6369, "lr": 2.702516023212304e-06, "epoch": 8.655793863568663, "percentage": 86.56, "elapsed_time": "4:01:58", "remaining_time": "0:37:34", "throughput": 2309.24, "total_tokens": 33526792} {"current_steps": 58120, "total_steps": 67140, "loss": 0.6828, "lr": 2.699577779320278e-06, "epoch": 8.656538576109622, "percentage": 86.57, "elapsed_time": "4:01:59", "remaining_time": "0:37:33", "throughput": 2309.25, "total_tokens": 33529416} {"current_steps": 58125, "total_steps": 67140, "loss": 0.631, "lr": 2.696641042400122e-06, "epoch": 8.65728328865058, "percentage": 86.57, "elapsed_time": "4:02:00", "remaining_time": "0:37:32", "throughput": 2309.27, "total_tokens": 33532296} {"current_steps": 58130, "total_steps": 67140, "loss": 0.5981, "lr": 2.6937058126502905e-06, "epoch": 8.65802800119154, "percentage": 86.58, "elapsed_time": "4:02:01", "remaining_time": "0:37:30", "throughput": 2309.28, "total_tokens": 33535016} {"current_steps": 58135, "total_steps": 67140, "loss": 0.7053, "lr": 2.6907720902691226e-06, "epoch": 8.6587727137325, "percentage": 86.59, "elapsed_time": "4:02:02", "remaining_time": "0:37:29", "throughput": 2309.3, "total_tokens": 33537960} {"current_steps": 58140, "total_steps": 67140, "loss": 0.616, "lr": 2.6878398754548756e-06, "epoch": 8.659517426273458, "percentage": 86.6, "elapsed_time": "4:02:04", "remaining_time": "0:37:28", "throughput": 2309.32, "total_tokens": 33540968} {"current_steps": 58145, "total_steps": 67140, "loss": 0.5923, "lr": 2.684909168405694e-06, "epoch": 8.660262138814417, "percentage": 86.6, "elapsed_time": "4:02:05", "remaining_time": "0:37:27", "throughput": 2309.34, "total_tokens": 33543912} {"current_steps": 58150, "total_steps": 67140, "loss": 0.7845, "lr": 2.6819799693196283e-06, "epoch": 8.661006851355378, "percentage": 86.61, "elapsed_time": "4:02:06", "remaining_time": "0:37:25", "throughput": 2309.37, "total_tokens": 33546856} {"current_steps": 58155, "total_steps": 67140, "loss": 0.5353, "lr": 2.6790522783946142e-06, "epoch": 8.661751563896336, "percentage": 86.62, "elapsed_time": "4:02:07", "remaining_time": "0:37:24", "throughput": 2309.37, "total_tokens": 33549512} {"current_steps": 58160, "total_steps": 67140, "loss": 0.4589, "lr": 2.676126095828496e-06, "epoch": 8.662496276437295, "percentage": 86.62, "elapsed_time": "4:02:08", "remaining_time": "0:37:23", "throughput": 2309.39, "total_tokens": 33552392} {"current_steps": 58165, "total_steps": 67140, "loss": 0.6448, "lr": 2.673201421819016e-06, "epoch": 8.663240988978254, "percentage": 86.63, "elapsed_time": "4:02:09", "remaining_time": "0:37:21", "throughput": 2309.41, "total_tokens": 33555304} {"current_steps": 58170, "total_steps": 67140, "loss": 0.6742, "lr": 2.670278256563813e-06, "epoch": 8.663985701519213, "percentage": 86.64, "elapsed_time": "4:02:10", "remaining_time": "0:37:20", "throughput": 2309.43, "total_tokens": 33558312} {"current_steps": 58175, "total_steps": 67140, "loss": 0.4919, "lr": 2.667356600260415e-06, "epoch": 8.664730414060173, "percentage": 86.65, "elapsed_time": "4:02:12", "remaining_time": "0:37:19", "throughput": 2309.45, "total_tokens": 33561288} {"current_steps": 58180, "total_steps": 67140, "loss": 0.4181, "lr": 2.664436453106259e-06, "epoch": 8.665475126601132, "percentage": 86.65, "elapsed_time": "4:02:13", "remaining_time": "0:37:18", "throughput": 2309.47, "total_tokens": 33564200} {"current_steps": 58185, "total_steps": 67140, "loss": 0.5092, "lr": 2.6615178152986835e-06, "epoch": 8.66621983914209, "percentage": 86.66, "elapsed_time": "4:02:14", "remaining_time": "0:37:16", "throughput": 2309.49, "total_tokens": 33567112} {"current_steps": 58190, "total_steps": 67140, "loss": 0.5531, "lr": 2.6586006870349095e-06, "epoch": 8.66696455168305, "percentage": 86.67, "elapsed_time": "4:02:15", "remaining_time": "0:37:15", "throughput": 2309.52, "total_tokens": 33570184} {"current_steps": 58195, "total_steps": 67140, "loss": 0.5095, "lr": 2.6556850685120648e-06, "epoch": 8.66770926422401, "percentage": 86.68, "elapsed_time": "4:02:16", "remaining_time": "0:37:14", "throughput": 2309.53, "total_tokens": 33573096} {"current_steps": 58200, "total_steps": 67140, "loss": 0.4702, "lr": 2.6527709599271784e-06, "epoch": 8.668453976764969, "percentage": 86.68, "elapsed_time": "4:02:17", "remaining_time": "0:37:13", "throughput": 2309.55, "total_tokens": 33575912} {"current_steps": 58205, "total_steps": 67140, "loss": 0.5292, "lr": 2.649858361477173e-06, "epoch": 8.669198689305928, "percentage": 86.69, "elapsed_time": "4:02:19", "remaining_time": "0:37:11", "throughput": 2309.57, "total_tokens": 33578952} {"current_steps": 58210, "total_steps": 67140, "loss": 0.5859, "lr": 2.6469472733588767e-06, "epoch": 8.669943401846886, "percentage": 86.7, "elapsed_time": "4:02:20", "remaining_time": "0:37:10", "throughput": 2309.59, "total_tokens": 33581736} {"current_steps": 58215, "total_steps": 67140, "loss": 0.5332, "lr": 2.6440376957690026e-06, "epoch": 8.670688114387847, "percentage": 86.71, "elapsed_time": "4:02:21", "remaining_time": "0:37:09", "throughput": 2309.61, "total_tokens": 33584648} {"current_steps": 58220, "total_steps": 67140, "loss": 0.6165, "lr": 2.6411296289041627e-06, "epoch": 8.671432826928806, "percentage": 86.71, "elapsed_time": "4:02:22", "remaining_time": "0:37:08", "throughput": 2309.64, "total_tokens": 33587752} {"current_steps": 58225, "total_steps": 67140, "loss": 0.3511, "lr": 2.638223072960877e-06, "epoch": 8.672177539469764, "percentage": 86.72, "elapsed_time": "4:02:23", "remaining_time": "0:37:06", "throughput": 2309.67, "total_tokens": 33590888} {"current_steps": 58230, "total_steps": 67140, "loss": 0.413, "lr": 2.635318028135561e-06, "epoch": 8.672922252010723, "percentage": 86.73, "elapsed_time": "4:02:24", "remaining_time": "0:37:05", "throughput": 2309.69, "total_tokens": 33593864} {"current_steps": 58235, "total_steps": 67140, "loss": 0.4797, "lr": 2.6324144946245244e-06, "epoch": 8.673666964551684, "percentage": 86.74, "elapsed_time": "4:02:25", "remaining_time": "0:37:04", "throughput": 2309.72, "total_tokens": 33596968} {"current_steps": 58240, "total_steps": 67140, "loss": 0.4252, "lr": 2.629512472623974e-06, "epoch": 8.674411677092642, "percentage": 86.74, "elapsed_time": "4:02:27", "remaining_time": "0:37:03", "throughput": 2309.72, "total_tokens": 33599592} {"current_steps": 58245, "total_steps": 67140, "loss": 0.5287, "lr": 2.6266119623300277e-06, "epoch": 8.675156389633601, "percentage": 86.75, "elapsed_time": "4:02:28", "remaining_time": "0:37:01", "throughput": 2309.75, "total_tokens": 33602664} {"current_steps": 58250, "total_steps": 67140, "loss": 0.414, "lr": 2.6237129639386795e-06, "epoch": 8.67590110217456, "percentage": 86.76, "elapsed_time": "4:02:29", "remaining_time": "0:37:00", "throughput": 2309.76, "total_tokens": 33605416} {"current_steps": 58255, "total_steps": 67140, "loss": 0.6351, "lr": 2.620815477645827e-06, "epoch": 8.67664581471552, "percentage": 86.77, "elapsed_time": "4:02:30", "remaining_time": "0:36:59", "throughput": 2309.77, "total_tokens": 33608200} {"current_steps": 58260, "total_steps": 67140, "loss": 0.57, "lr": 2.6179195036472815e-06, "epoch": 8.67739052725648, "percentage": 86.77, "elapsed_time": "4:02:31", "remaining_time": "0:36:57", "throughput": 2309.79, "total_tokens": 33611112} {"current_steps": 58265, "total_steps": 67140, "loss": 0.6186, "lr": 2.615025042138733e-06, "epoch": 8.678135239797438, "percentage": 86.78, "elapsed_time": "4:02:32", "remaining_time": "0:36:56", "throughput": 2309.8, "total_tokens": 33613928} {"current_steps": 58270, "total_steps": 67140, "loss": 0.6053, "lr": 2.6121320933157834e-06, "epoch": 8.678879952338397, "percentage": 86.79, "elapsed_time": "4:02:33", "remaining_time": "0:36:55", "throughput": 2309.82, "total_tokens": 33616744} {"current_steps": 58275, "total_steps": 67140, "loss": 0.6248, "lr": 2.6092406573739264e-06, "epoch": 8.679624664879357, "percentage": 86.8, "elapsed_time": "4:02:34", "remaining_time": "0:36:54", "throughput": 2309.84, "total_tokens": 33619752} {"current_steps": 58280, "total_steps": 67140, "loss": 0.5935, "lr": 2.606350734508553e-06, "epoch": 8.680369377420316, "percentage": 86.8, "elapsed_time": "4:02:36", "remaining_time": "0:36:52", "throughput": 2309.86, "total_tokens": 33622632} {"current_steps": 58285, "total_steps": 67140, "loss": 0.4648, "lr": 2.6034623249149487e-06, "epoch": 8.681114089961275, "percentage": 86.81, "elapsed_time": "4:02:37", "remaining_time": "0:36:51", "throughput": 2309.89, "total_tokens": 33625832} {"current_steps": 58290, "total_steps": 67140, "loss": 0.4444, "lr": 2.6005754287883072e-06, "epoch": 8.681858802502234, "percentage": 86.82, "elapsed_time": "4:02:38", "remaining_time": "0:36:50", "throughput": 2309.91, "total_tokens": 33628744} {"current_steps": 58295, "total_steps": 67140, "loss": 0.6073, "lr": 2.597690046323703e-06, "epoch": 8.682603515043194, "percentage": 86.83, "elapsed_time": "4:02:39", "remaining_time": "0:36:49", "throughput": 2309.93, "total_tokens": 33631592} {"current_steps": 58300, "total_steps": 67140, "loss": 0.7114, "lr": 2.594806177716125e-06, "epoch": 8.683348227584153, "percentage": 86.83, "elapsed_time": "4:02:40", "remaining_time": "0:36:47", "throughput": 2309.94, "total_tokens": 33634248} {"current_steps": 58305, "total_steps": 67140, "loss": 0.4478, "lr": 2.5919238231604524e-06, "epoch": 8.684092940125112, "percentage": 86.84, "elapsed_time": "4:02:41", "remaining_time": "0:36:46", "throughput": 2309.96, "total_tokens": 33637288} {"current_steps": 58310, "total_steps": 67140, "loss": 0.5302, "lr": 2.589042982851461e-06, "epoch": 8.68483765266607, "percentage": 86.85, "elapsed_time": "4:02:42", "remaining_time": "0:36:45", "throughput": 2309.97, "total_tokens": 33640040} {"current_steps": 58315, "total_steps": 67140, "loss": 0.6035, "lr": 2.5861636569838366e-06, "epoch": 8.68558236520703, "percentage": 86.86, "elapsed_time": "4:02:44", "remaining_time": "0:36:44", "throughput": 2309.99, "total_tokens": 33642888} {"current_steps": 58320, "total_steps": 67140, "loss": 0.5336, "lr": 2.583285845752137e-06, "epoch": 8.68632707774799, "percentage": 86.86, "elapsed_time": "4:02:45", "remaining_time": "0:36:42", "throughput": 2310.01, "total_tokens": 33645736} {"current_steps": 58325, "total_steps": 67140, "loss": 0.523, "lr": 2.580409549350843e-06, "epoch": 8.687071790288948, "percentage": 86.87, "elapsed_time": "4:02:46", "remaining_time": "0:36:41", "throughput": 2310.01, "total_tokens": 33648360} {"current_steps": 58330, "total_steps": 67140, "loss": 0.5249, "lr": 2.577534767974324e-06, "epoch": 8.687816502829907, "percentage": 86.88, "elapsed_time": "4:02:47", "remaining_time": "0:36:40", "throughput": 2310.03, "total_tokens": 33651240} {"current_steps": 58335, "total_steps": 67140, "loss": 0.5059, "lr": 2.574661501816836e-06, "epoch": 8.688561215370868, "percentage": 86.89, "elapsed_time": "4:02:48", "remaining_time": "0:36:38", "throughput": 2310.06, "total_tokens": 33654408} {"current_steps": 58340, "total_steps": 67140, "loss": 0.4219, "lr": 2.5717897510725508e-06, "epoch": 8.689305927911827, "percentage": 86.89, "elapsed_time": "4:02:49", "remaining_time": "0:36:37", "throughput": 2310.09, "total_tokens": 33657448} {"current_steps": 58345, "total_steps": 67140, "loss": 0.5686, "lr": 2.568919515935525e-06, "epoch": 8.690050640452785, "percentage": 86.9, "elapsed_time": "4:02:51", "remaining_time": "0:36:36", "throughput": 2310.13, "total_tokens": 33660936} {"current_steps": 58350, "total_steps": 67140, "loss": 0.7209, "lr": 2.5660507965997282e-06, "epoch": 8.690795352993744, "percentage": 86.91, "elapsed_time": "4:02:52", "remaining_time": "0:36:35", "throughput": 2310.15, "total_tokens": 33663880} {"current_steps": 58355, "total_steps": 67140, "loss": 0.7021, "lr": 2.5631835932590027e-06, "epoch": 8.691540065534703, "percentage": 86.92, "elapsed_time": "4:02:53", "remaining_time": "0:36:33", "throughput": 2310.17, "total_tokens": 33666696} {"current_steps": 58360, "total_steps": 67140, "loss": 0.6604, "lr": 2.5603179061071097e-06, "epoch": 8.692284778075663, "percentage": 86.92, "elapsed_time": "4:02:54", "remaining_time": "0:36:32", "throughput": 2310.2, "total_tokens": 33669864} {"current_steps": 58365, "total_steps": 67140, "loss": 0.5142, "lr": 2.5574537353376977e-06, "epoch": 8.693029490616622, "percentage": 86.93, "elapsed_time": "4:02:55", "remaining_time": "0:36:31", "throughput": 2310.23, "total_tokens": 33672872} {"current_steps": 58370, "total_steps": 67140, "loss": 0.7004, "lr": 2.5545910811443224e-06, "epoch": 8.69377420315758, "percentage": 86.94, "elapsed_time": "4:02:56", "remaining_time": "0:36:30", "throughput": 2310.24, "total_tokens": 33675720} {"current_steps": 58375, "total_steps": 67140, "loss": 0.4729, "lr": 2.5517299437204214e-06, "epoch": 8.69451891569854, "percentage": 86.95, "elapsed_time": "4:02:57", "remaining_time": "0:36:28", "throughput": 2310.26, "total_tokens": 33678536} {"current_steps": 58380, "total_steps": 67140, "loss": 0.6988, "lr": 2.5488703232593474e-06, "epoch": 8.6952636282395, "percentage": 86.95, "elapsed_time": "4:02:58", "remaining_time": "0:36:27", "throughput": 2310.27, "total_tokens": 33681224} {"current_steps": 58385, "total_steps": 67140, "loss": 0.4727, "lr": 2.5460122199543328e-06, "epoch": 8.696008340780459, "percentage": 86.96, "elapsed_time": "4:03:00", "remaining_time": "0:36:26", "throughput": 2310.28, "total_tokens": 33683912} {"current_steps": 58390, "total_steps": 67140, "loss": 0.8465, "lr": 2.54315563399852e-06, "epoch": 8.696753053321418, "percentage": 86.97, "elapsed_time": "4:03:01", "remaining_time": "0:36:25", "throughput": 2310.31, "total_tokens": 33687048} {"current_steps": 58395, "total_steps": 67140, "loss": 0.5496, "lr": 2.5403005655849464e-06, "epoch": 8.697497765862376, "percentage": 86.97, "elapsed_time": "4:03:02", "remaining_time": "0:36:23", "throughput": 2310.34, "total_tokens": 33690216} {"current_steps": 58400, "total_steps": 67140, "loss": 0.4434, "lr": 2.5374470149065465e-06, "epoch": 8.698242478403337, "percentage": 86.98, "elapsed_time": "4:03:03", "remaining_time": "0:36:22", "throughput": 2310.36, "total_tokens": 33693160} {"current_steps": 58405, "total_steps": 67140, "loss": 0.6825, "lr": 2.5345949821561523e-06, "epoch": 8.698987190944296, "percentage": 86.99, "elapsed_time": "4:03:04", "remaining_time": "0:36:21", "throughput": 2310.38, "total_tokens": 33696008} {"current_steps": 58410, "total_steps": 67140, "loss": 0.5828, "lr": 2.5317444675264978e-06, "epoch": 8.699731903485254, "percentage": 87.0, "elapsed_time": "4:03:05", "remaining_time": "0:36:20", "throughput": 2310.4, "total_tokens": 33699048} {"current_steps": 58415, "total_steps": 67140, "loss": 0.6131, "lr": 2.528895471210199e-06, "epoch": 8.700476616026213, "percentage": 87.0, "elapsed_time": "4:03:06", "remaining_time": "0:36:18", "throughput": 2310.41, "total_tokens": 33701832} {"current_steps": 58420, "total_steps": 67140, "loss": 0.6635, "lr": 2.5260479933997826e-06, "epoch": 8.701221328567174, "percentage": 87.01, "elapsed_time": "4:03:08", "remaining_time": "0:36:17", "throughput": 2310.43, "total_tokens": 33704552} {"current_steps": 58425, "total_steps": 67140, "loss": 0.4603, "lr": 2.5232020342876666e-06, "epoch": 8.701966041108133, "percentage": 87.02, "elapsed_time": "4:03:09", "remaining_time": "0:36:16", "throughput": 2310.43, "total_tokens": 33707176} {"current_steps": 58430, "total_steps": 67140, "loss": 0.6857, "lr": 2.520357594066175e-06, "epoch": 8.702710753649091, "percentage": 87.03, "elapsed_time": "4:03:10", "remaining_time": "0:36:14", "throughput": 2310.45, "total_tokens": 33710184} {"current_steps": 58435, "total_steps": 67140, "loss": 0.4712, "lr": 2.5175146729275205e-06, "epoch": 8.70345546619005, "percentage": 87.03, "elapsed_time": "4:03:11", "remaining_time": "0:36:13", "throughput": 2310.48, "total_tokens": 33713128} {"current_steps": 58440, "total_steps": 67140, "loss": 0.7681, "lr": 2.5146732710638192e-06, "epoch": 8.70420017873101, "percentage": 87.04, "elapsed_time": "4:03:12", "remaining_time": "0:36:12", "throughput": 2310.48, "total_tokens": 33715720} {"current_steps": 58445, "total_steps": 67140, "loss": 0.4588, "lr": 2.511833388667084e-06, "epoch": 8.70494489127197, "percentage": 87.05, "elapsed_time": "4:03:13", "remaining_time": "0:36:11", "throughput": 2310.49, "total_tokens": 33718440} {"current_steps": 58450, "total_steps": 67140, "loss": 0.6816, "lr": 2.5089950259292173e-06, "epoch": 8.705689603812928, "percentage": 87.06, "elapsed_time": "4:03:14", "remaining_time": "0:36:09", "throughput": 2310.49, "total_tokens": 33720968} {"current_steps": 58455, "total_steps": 67140, "loss": 0.7356, "lr": 2.5061581830420207e-06, "epoch": 8.706434316353887, "percentage": 87.06, "elapsed_time": "4:03:15", "remaining_time": "0:36:08", "throughput": 2310.51, "total_tokens": 33723752} {"current_steps": 58460, "total_steps": 67140, "loss": 0.5097, "lr": 2.503322860197199e-06, "epoch": 8.707179028894847, "percentage": 87.07, "elapsed_time": "4:03:16", "remaining_time": "0:36:07", "throughput": 2310.52, "total_tokens": 33726600} {"current_steps": 58465, "total_steps": 67140, "loss": 0.7933, "lr": 2.5004890575863556e-06, "epoch": 8.707923741435806, "percentage": 87.08, "elapsed_time": "4:03:18", "remaining_time": "0:36:06", "throughput": 2310.53, "total_tokens": 33729320} {"current_steps": 58470, "total_steps": 67140, "loss": 0.5744, "lr": 2.497656775400986e-06, "epoch": 8.708668453976765, "percentage": 87.09, "elapsed_time": "4:03:19", "remaining_time": "0:36:04", "throughput": 2310.56, "total_tokens": 33732488} {"current_steps": 58475, "total_steps": 67140, "loss": 0.5966, "lr": 2.4948260138324827e-06, "epoch": 8.709413166517724, "percentage": 87.09, "elapsed_time": "4:03:20", "remaining_time": "0:36:03", "throughput": 2310.58, "total_tokens": 33735432} {"current_steps": 58480, "total_steps": 67140, "loss": 0.5294, "lr": 2.4919967730721414e-06, "epoch": 8.710157879058684, "percentage": 87.1, "elapsed_time": "4:03:21", "remaining_time": "0:36:02", "throughput": 2310.6, "total_tokens": 33738216} {"current_steps": 58485, "total_steps": 67140, "loss": 0.6411, "lr": 2.489169053311144e-06, "epoch": 8.710902591599643, "percentage": 87.11, "elapsed_time": "4:03:22", "remaining_time": "0:36:01", "throughput": 2310.62, "total_tokens": 33741192} {"current_steps": 58490, "total_steps": 67140, "loss": 0.4678, "lr": 2.486342854740584e-06, "epoch": 8.711647304140602, "percentage": 87.12, "elapsed_time": "4:03:23", "remaining_time": "0:35:59", "throughput": 2310.63, "total_tokens": 33744040} {"current_steps": 58495, "total_steps": 67140, "loss": 0.499, "lr": 2.483518177551436e-06, "epoch": 8.71239201668156, "percentage": 87.12, "elapsed_time": "4:03:24", "remaining_time": "0:35:58", "throughput": 2310.64, "total_tokens": 33746760} {"current_steps": 58500, "total_steps": 67140, "loss": 0.5631, "lr": 2.4806950219345842e-06, "epoch": 8.71313672922252, "percentage": 87.13, "elapsed_time": "4:03:26", "remaining_time": "0:35:57", "throughput": 2310.67, "total_tokens": 33749864} {"current_steps": 58505, "total_steps": 67140, "loss": 0.5984, "lr": 2.4778733880808036e-06, "epoch": 8.71388144176348, "percentage": 87.14, "elapsed_time": "4:03:27", "remaining_time": "0:35:55", "throughput": 2310.7, "total_tokens": 33753032} {"current_steps": 58510, "total_steps": 67140, "loss": 0.41, "lr": 2.4750532761807748e-06, "epoch": 8.714626154304439, "percentage": 87.15, "elapsed_time": "4:03:28", "remaining_time": "0:35:54", "throughput": 2310.75, "total_tokens": 33756616} {"current_steps": 58515, "total_steps": 67140, "loss": 0.4874, "lr": 2.472234686425068e-06, "epoch": 8.715370866845397, "percentage": 87.15, "elapsed_time": "4:03:29", "remaining_time": "0:35:53", "throughput": 2310.76, "total_tokens": 33759368} {"current_steps": 58520, "total_steps": 67140, "loss": 0.561, "lr": 2.469417619004144e-06, "epoch": 8.716115579386356, "percentage": 87.16, "elapsed_time": "4:03:30", "remaining_time": "0:35:52", "throughput": 2310.78, "total_tokens": 33762408} {"current_steps": 58525, "total_steps": 67140, "loss": 0.4893, "lr": 2.466602074108379e-06, "epoch": 8.716860291927317, "percentage": 87.17, "elapsed_time": "4:03:31", "remaining_time": "0:35:50", "throughput": 2310.81, "total_tokens": 33765384} {"current_steps": 58530, "total_steps": 67140, "loss": 0.6116, "lr": 2.4637880519280317e-06, "epoch": 8.717605004468275, "percentage": 87.18, "elapsed_time": "4:03:33", "remaining_time": "0:35:49", "throughput": 2310.83, "total_tokens": 33768392} {"current_steps": 58535, "total_steps": 67140, "loss": 0.3874, "lr": 2.4609755526532607e-06, "epoch": 8.718349717009234, "percentage": 87.18, "elapsed_time": "4:03:34", "remaining_time": "0:35:48", "throughput": 2310.85, "total_tokens": 33771368} {"current_steps": 58540, "total_steps": 67140, "loss": 0.5529, "lr": 2.4581645764741227e-06, "epoch": 8.719094429550193, "percentage": 87.19, "elapsed_time": "4:03:35", "remaining_time": "0:35:47", "throughput": 2310.86, "total_tokens": 33774024} {"current_steps": 58545, "total_steps": 67140, "loss": 0.4936, "lr": 2.455355123580583e-06, "epoch": 8.719839142091153, "percentage": 87.2, "elapsed_time": "4:03:36", "remaining_time": "0:35:45", "throughput": 2310.88, "total_tokens": 33776904} {"current_steps": 58550, "total_steps": 67140, "loss": 0.3942, "lr": 2.4525471941624746e-06, "epoch": 8.720583854632112, "percentage": 87.21, "elapsed_time": "4:03:37", "remaining_time": "0:35:44", "throughput": 2310.9, "total_tokens": 33779976} {"current_steps": 58555, "total_steps": 67140, "loss": 0.5962, "lr": 2.4497407884095575e-06, "epoch": 8.721328567173071, "percentage": 87.21, "elapsed_time": "4:03:38", "remaining_time": "0:35:43", "throughput": 2310.92, "total_tokens": 33782856} {"current_steps": 58560, "total_steps": 67140, "loss": 0.5696, "lr": 2.4469359065114743e-06, "epoch": 8.72207327971403, "percentage": 87.22, "elapsed_time": "4:03:39", "remaining_time": "0:35:42", "throughput": 2310.93, "total_tokens": 33785640} {"current_steps": 58565, "total_steps": 67140, "loss": 0.8132, "lr": 2.444132548657771e-06, "epoch": 8.72281799225499, "percentage": 87.23, "elapsed_time": "4:03:41", "remaining_time": "0:35:40", "throughput": 2310.95, "total_tokens": 33788648} {"current_steps": 58570, "total_steps": 67140, "loss": 0.6431, "lr": 2.4413307150378873e-06, "epoch": 8.723562704795949, "percentage": 87.24, "elapsed_time": "4:03:42", "remaining_time": "0:35:39", "throughput": 2310.98, "total_tokens": 33791848} {"current_steps": 58575, "total_steps": 67140, "loss": 0.436, "lr": 2.4385304058411525e-06, "epoch": 8.724307417336908, "percentage": 87.24, "elapsed_time": "4:03:43", "remaining_time": "0:35:38", "throughput": 2310.98, "total_tokens": 33794216} {"current_steps": 58580, "total_steps": 67140, "loss": 0.4864, "lr": 2.4357316212568094e-06, "epoch": 8.725052129877866, "percentage": 87.25, "elapsed_time": "4:03:44", "remaining_time": "0:35:37", "throughput": 2311.0, "total_tokens": 33797160} {"current_steps": 58585, "total_steps": 67140, "loss": 0.6117, "lr": 2.432934361473979e-06, "epoch": 8.725796842418827, "percentage": 87.26, "elapsed_time": "4:03:45", "remaining_time": "0:35:35", "throughput": 2311.02, "total_tokens": 33800168} {"current_steps": 58590, "total_steps": 67140, "loss": 0.596, "lr": 2.4301386266816938e-06, "epoch": 8.726541554959786, "percentage": 87.27, "elapsed_time": "4:03:46", "remaining_time": "0:35:34", "throughput": 2311.04, "total_tokens": 33803048} {"current_steps": 58595, "total_steps": 67140, "loss": 0.4536, "lr": 2.4273444170688774e-06, "epoch": 8.727286267500745, "percentage": 87.27, "elapsed_time": "4:03:47", "remaining_time": "0:35:33", "throughput": 2311.07, "total_tokens": 33806184} {"current_steps": 58600, "total_steps": 67140, "loss": 0.487, "lr": 2.424551732824354e-06, "epoch": 8.728030980041703, "percentage": 87.28, "elapsed_time": "4:03:49", "remaining_time": "0:35:31", "throughput": 2311.07, "total_tokens": 33808808} {"current_steps": 58605, "total_steps": 67140, "loss": 0.5746, "lr": 2.421760574136836e-06, "epoch": 8.728775692582664, "percentage": 87.29, "elapsed_time": "4:03:50", "remaining_time": "0:35:30", "throughput": 2311.09, "total_tokens": 33811752} {"current_steps": 58610, "total_steps": 67140, "loss": 0.5638, "lr": 2.418970941194948e-06, "epoch": 8.729520405123623, "percentage": 87.3, "elapsed_time": "4:03:51", "remaining_time": "0:35:29", "throughput": 2311.1, "total_tokens": 33814440} {"current_steps": 58615, "total_steps": 67140, "loss": 0.546, "lr": 2.4161828341871973e-06, "epoch": 8.730265117664581, "percentage": 87.3, "elapsed_time": "4:03:52", "remaining_time": "0:35:28", "throughput": 2311.11, "total_tokens": 33817224} {"current_steps": 58620, "total_steps": 67140, "loss": 0.5962, "lr": 2.4133962533019832e-06, "epoch": 8.73100983020554, "percentage": 87.31, "elapsed_time": "4:03:53", "remaining_time": "0:35:26", "throughput": 2311.14, "total_tokens": 33820232} {"current_steps": 58625, "total_steps": 67140, "loss": 0.5232, "lr": 2.410611198727622e-06, "epoch": 8.7317545427465, "percentage": 87.32, "elapsed_time": "4:03:54", "remaining_time": "0:35:25", "throughput": 2311.15, "total_tokens": 33822952} {"current_steps": 58630, "total_steps": 67140, "loss": 0.5482, "lr": 2.4078276706523156e-06, "epoch": 8.73249925528746, "percentage": 87.32, "elapsed_time": "4:03:55", "remaining_time": "0:35:24", "throughput": 2311.16, "total_tokens": 33825672} {"current_steps": 58635, "total_steps": 67140, "loss": 0.4577, "lr": 2.405045669264161e-06, "epoch": 8.733243967828418, "percentage": 87.33, "elapsed_time": "4:03:56", "remaining_time": "0:35:23", "throughput": 2311.16, "total_tokens": 33828296} {"current_steps": 58640, "total_steps": 67140, "loss": 0.6176, "lr": 2.4022651947511548e-06, "epoch": 8.733988680369377, "percentage": 87.34, "elapsed_time": "4:03:58", "remaining_time": "0:35:21", "throughput": 2311.17, "total_tokens": 33831080} {"current_steps": 58645, "total_steps": 67140, "loss": 0.4958, "lr": 2.399486247301197e-06, "epoch": 8.734733392910336, "percentage": 87.35, "elapsed_time": "4:03:59", "remaining_time": "0:35:20", "throughput": 2311.19, "total_tokens": 33833960} {"current_steps": 58650, "total_steps": 67140, "loss": 0.4002, "lr": 2.3967088271020707e-06, "epoch": 8.735478105451296, "percentage": 87.35, "elapsed_time": "4:04:00", "remaining_time": "0:35:19", "throughput": 2311.2, "total_tokens": 33836552} {"current_steps": 58655, "total_steps": 67140, "loss": 0.5796, "lr": 2.3939329343414584e-06, "epoch": 8.736222817992255, "percentage": 87.36, "elapsed_time": "4:04:01", "remaining_time": "0:35:18", "throughput": 2311.22, "total_tokens": 33839496} {"current_steps": 58660, "total_steps": 67140, "loss": 0.451, "lr": 2.39115856920695e-06, "epoch": 8.736967530533214, "percentage": 87.37, "elapsed_time": "4:04:02", "remaining_time": "0:35:16", "throughput": 2311.24, "total_tokens": 33842440} {"current_steps": 58665, "total_steps": 67140, "loss": 0.5128, "lr": 2.388385731886025e-06, "epoch": 8.737712243074174, "percentage": 87.38, "elapsed_time": "4:04:03", "remaining_time": "0:35:15", "throughput": 2311.26, "total_tokens": 33845384} {"current_steps": 58670, "total_steps": 67140, "loss": 0.6753, "lr": 2.38561442256606e-06, "epoch": 8.738456955615133, "percentage": 87.38, "elapsed_time": "4:04:04", "remaining_time": "0:35:14", "throughput": 2311.28, "total_tokens": 33848328} {"current_steps": 58675, "total_steps": 67140, "loss": 0.5166, "lr": 2.3828446414343288e-06, "epoch": 8.739201668156092, "percentage": 87.39, "elapsed_time": "4:04:05", "remaining_time": "0:35:12", "throughput": 2311.3, "total_tokens": 33851144} {"current_steps": 58680, "total_steps": 67140, "loss": 0.6179, "lr": 2.380076388678007e-06, "epoch": 8.73994638069705, "percentage": 87.4, "elapsed_time": "4:04:07", "remaining_time": "0:35:11", "throughput": 2311.3, "total_tokens": 33853672} {"current_steps": 58685, "total_steps": 67140, "loss": 0.5632, "lr": 2.377309664484151e-06, "epoch": 8.74069109323801, "percentage": 87.41, "elapsed_time": "4:04:08", "remaining_time": "0:35:10", "throughput": 2311.32, "total_tokens": 33856648} {"current_steps": 58690, "total_steps": 67140, "loss": 0.6093, "lr": 2.3745444690397302e-06, "epoch": 8.74143580577897, "percentage": 87.41, "elapsed_time": "4:04:09", "remaining_time": "0:35:09", "throughput": 2311.34, "total_tokens": 33859688} {"current_steps": 58695, "total_steps": 67140, "loss": 0.6885, "lr": 2.3717808025316118e-06, "epoch": 8.742180518319929, "percentage": 87.42, "elapsed_time": "4:04:10", "remaining_time": "0:35:07", "throughput": 2311.35, "total_tokens": 33862408} {"current_steps": 58700, "total_steps": 67140, "loss": 0.6086, "lr": 2.369018665146544e-06, "epoch": 8.742925230860887, "percentage": 87.43, "elapsed_time": "4:04:11", "remaining_time": "0:35:06", "throughput": 2311.36, "total_tokens": 33865000} {"current_steps": 58705, "total_steps": 67140, "loss": 0.59, "lr": 2.36625805707118e-06, "epoch": 8.743669943401846, "percentage": 87.44, "elapsed_time": "4:04:12", "remaining_time": "0:35:05", "throughput": 2311.38, "total_tokens": 33867848} {"current_steps": 58710, "total_steps": 67140, "loss": 0.7167, "lr": 2.363498978492082e-06, "epoch": 8.744414655942807, "percentage": 87.44, "elapsed_time": "4:04:13", "remaining_time": "0:35:04", "throughput": 2311.41, "total_tokens": 33871176} {"current_steps": 58715, "total_steps": 67140, "loss": 0.5614, "lr": 2.3607414295956835e-06, "epoch": 8.745159368483765, "percentage": 87.45, "elapsed_time": "4:04:14", "remaining_time": "0:35:02", "throughput": 2311.42, "total_tokens": 33873864} {"current_steps": 58720, "total_steps": 67140, "loss": 0.4851, "lr": 2.357985410568336e-06, "epoch": 8.745904081024724, "percentage": 87.46, "elapsed_time": "4:04:16", "remaining_time": "0:35:01", "throughput": 2311.45, "total_tokens": 33876936} {"current_steps": 58725, "total_steps": 67140, "loss": 0.4875, "lr": 2.3552309215962796e-06, "epoch": 8.746648793565683, "percentage": 87.47, "elapsed_time": "4:04:17", "remaining_time": "0:35:00", "throughput": 2311.45, "total_tokens": 33879560} {"current_steps": 58730, "total_steps": 67140, "loss": 0.5238, "lr": 2.3524779628656484e-06, "epoch": 8.747393506106643, "percentage": 87.47, "elapsed_time": "4:04:18", "remaining_time": "0:34:59", "throughput": 2311.47, "total_tokens": 33882472} {"current_steps": 58735, "total_steps": 67140, "loss": 0.4387, "lr": 2.3497265345624824e-06, "epoch": 8.748138218647602, "percentage": 87.48, "elapsed_time": "4:04:19", "remaining_time": "0:34:57", "throughput": 2311.49, "total_tokens": 33885256} {"current_steps": 58740, "total_steps": 67140, "loss": 0.5748, "lr": 2.3469766368727053e-06, "epoch": 8.748882931188561, "percentage": 87.49, "elapsed_time": "4:04:20", "remaining_time": "0:34:56", "throughput": 2311.51, "total_tokens": 33888136} {"current_steps": 58745, "total_steps": 67140, "loss": 0.3631, "lr": 2.3442282699821515e-06, "epoch": 8.74962764372952, "percentage": 87.5, "elapsed_time": "4:04:21", "remaining_time": "0:34:55", "throughput": 2311.53, "total_tokens": 33891048} {"current_steps": 58750, "total_steps": 67140, "loss": 0.6997, "lr": 2.341481434076534e-06, "epoch": 8.75037235627048, "percentage": 87.5, "elapsed_time": "4:04:22", "remaining_time": "0:34:53", "throughput": 2311.54, "total_tokens": 33893864} {"current_steps": 58755, "total_steps": 67140, "loss": 0.6247, "lr": 2.338736129341479e-06, "epoch": 8.751117068811439, "percentage": 87.51, "elapsed_time": "4:04:24", "remaining_time": "0:34:52", "throughput": 2311.57, "total_tokens": 33896904} {"current_steps": 58760, "total_steps": 67140, "loss": 0.6055, "lr": 2.335992355962502e-06, "epoch": 8.751861781352398, "percentage": 87.52, "elapsed_time": "4:04:25", "remaining_time": "0:34:51", "throughput": 2311.6, "total_tokens": 33900200} {"current_steps": 58765, "total_steps": 67140, "loss": 0.4903, "lr": 2.3332501141250156e-06, "epoch": 8.752606493893357, "percentage": 87.53, "elapsed_time": "4:04:26", "remaining_time": "0:34:50", "throughput": 2311.61, "total_tokens": 33902952} {"current_steps": 58770, "total_steps": 67140, "loss": 0.5503, "lr": 2.3305094040143303e-06, "epoch": 8.753351206434317, "percentage": 87.53, "elapsed_time": "4:04:27", "remaining_time": "0:34:48", "throughput": 2311.63, "total_tokens": 33905832} {"current_steps": 58775, "total_steps": 67140, "loss": 0.5016, "lr": 2.3277702258156566e-06, "epoch": 8.754095918975276, "percentage": 87.54, "elapsed_time": "4:04:28", "remaining_time": "0:34:47", "throughput": 2311.66, "total_tokens": 33908872} {"current_steps": 58780, "total_steps": 67140, "loss": 0.7213, "lr": 2.3250325797140952e-06, "epoch": 8.754840631516235, "percentage": 87.55, "elapsed_time": "4:04:29", "remaining_time": "0:34:46", "throughput": 2311.67, "total_tokens": 33911624} {"current_steps": 58785, "total_steps": 67140, "loss": 0.6839, "lr": 2.3222964658946357e-06, "epoch": 8.755585344057193, "percentage": 87.56, "elapsed_time": "4:04:30", "remaining_time": "0:34:45", "throughput": 2311.7, "total_tokens": 33914728} {"current_steps": 58790, "total_steps": 67140, "loss": 0.4397, "lr": 2.319561884542179e-06, "epoch": 8.756330056598154, "percentage": 87.56, "elapsed_time": "4:04:32", "remaining_time": "0:34:43", "throughput": 2311.71, "total_tokens": 33917544} {"current_steps": 58795, "total_steps": 67140, "loss": 0.443, "lr": 2.3168288358415197e-06, "epoch": 8.757074769139113, "percentage": 87.57, "elapsed_time": "4:04:33", "remaining_time": "0:34:42", "throughput": 2311.73, "total_tokens": 33920584} {"current_steps": 58800, "total_steps": 67140, "loss": 0.5372, "lr": 2.314097319977343e-06, "epoch": 8.757819481680071, "percentage": 87.58, "elapsed_time": "4:04:34", "remaining_time": "0:34:41", "throughput": 2311.75, "total_tokens": 33923336} {"current_steps": 58805, "total_steps": 67140, "loss": 0.7022, "lr": 2.3113673371342378e-06, "epoch": 8.75856419422103, "percentage": 87.59, "elapsed_time": "4:04:35", "remaining_time": "0:34:40", "throughput": 2311.79, "total_tokens": 33926824} {"current_steps": 58810, "total_steps": 67140, "loss": 0.6375, "lr": 2.3086388874966865e-06, "epoch": 8.75930890676199, "percentage": 87.59, "elapsed_time": "4:04:36", "remaining_time": "0:34:38", "throughput": 2311.82, "total_tokens": 33929896} {"current_steps": 58815, "total_steps": 67140, "loss": 0.4806, "lr": 2.3059119712490613e-06, "epoch": 8.76005361930295, "percentage": 87.6, "elapsed_time": "4:04:37", "remaining_time": "0:34:37", "throughput": 2311.84, "total_tokens": 33932968} {"current_steps": 58820, "total_steps": 67140, "loss": 0.5546, "lr": 2.303186588575634e-06, "epoch": 8.760798331843908, "percentage": 87.61, "elapsed_time": "4:04:38", "remaining_time": "0:34:36", "throughput": 2311.84, "total_tokens": 33935368} {"current_steps": 58825, "total_steps": 67140, "loss": 0.6496, "lr": 2.3004627396605776e-06, "epoch": 8.761543044384867, "percentage": 87.62, "elapsed_time": "4:04:40", "remaining_time": "0:34:35", "throughput": 2311.85, "total_tokens": 33938120} {"current_steps": 58830, "total_steps": 67140, "loss": 0.5098, "lr": 2.2977404246879607e-06, "epoch": 8.762287756925826, "percentage": 87.62, "elapsed_time": "4:04:41", "remaining_time": "0:34:33", "throughput": 2311.87, "total_tokens": 33940936} {"current_steps": 58835, "total_steps": 67140, "loss": 0.6959, "lr": 2.2950196438417448e-06, "epoch": 8.763032469466786, "percentage": 87.63, "elapsed_time": "4:04:42", "remaining_time": "0:34:32", "throughput": 2311.89, "total_tokens": 33944072} {"current_steps": 58840, "total_steps": 67140, "loss": 0.5862, "lr": 2.292300397305791e-06, "epoch": 8.763777182007745, "percentage": 87.64, "elapsed_time": "4:04:43", "remaining_time": "0:34:31", "throughput": 2311.9, "total_tokens": 33946824} {"current_steps": 58845, "total_steps": 67140, "loss": 0.5848, "lr": 2.289582685263858e-06, "epoch": 8.764521894548704, "percentage": 87.65, "elapsed_time": "4:04:44", "remaining_time": "0:34:30", "throughput": 2311.92, "total_tokens": 33949800} {"current_steps": 58850, "total_steps": 67140, "loss": 0.5749, "lr": 2.2868665078995878e-06, "epoch": 8.765266607089664, "percentage": 87.65, "elapsed_time": "4:04:45", "remaining_time": "0:34:28", "throughput": 2311.94, "total_tokens": 33952648} {"current_steps": 58855, "total_steps": 67140, "loss": 0.5108, "lr": 2.2841518653965388e-06, "epoch": 8.766011319630623, "percentage": 87.66, "elapsed_time": "4:04:46", "remaining_time": "0:34:27", "throughput": 2311.96, "total_tokens": 33955560} {"current_steps": 58860, "total_steps": 67140, "loss": 0.4758, "lr": 2.281438757938145e-06, "epoch": 8.766756032171582, "percentage": 87.67, "elapsed_time": "4:04:48", "remaining_time": "0:34:26", "throughput": 2311.97, "total_tokens": 33958280} {"current_steps": 58865, "total_steps": 67140, "loss": 0.4573, "lr": 2.2787271857077546e-06, "epoch": 8.76750074471254, "percentage": 87.68, "elapsed_time": "4:04:49", "remaining_time": "0:34:24", "throughput": 2311.98, "total_tokens": 33961064} {"current_steps": 58870, "total_steps": 67140, "loss": 0.5634, "lr": 2.276017148888604e-06, "epoch": 8.7682454572535, "percentage": 87.68, "elapsed_time": "4:04:50", "remaining_time": "0:34:23", "throughput": 2312.0, "total_tokens": 33963912} {"current_steps": 58875, "total_steps": 67140, "loss": 0.4859, "lr": 2.273308647663827e-06, "epoch": 8.76899016979446, "percentage": 87.69, "elapsed_time": "4:04:51", "remaining_time": "0:34:22", "throughput": 2312.01, "total_tokens": 33966632} {"current_steps": 58880, "total_steps": 67140, "loss": 0.5934, "lr": 2.27060168221645e-06, "epoch": 8.769734882335419, "percentage": 87.7, "elapsed_time": "4:04:52", "remaining_time": "0:34:21", "throughput": 2312.02, "total_tokens": 33969416} {"current_steps": 58885, "total_steps": 67140, "loss": 0.6166, "lr": 2.2678962527293986e-06, "epoch": 8.770479594876377, "percentage": 87.7, "elapsed_time": "4:04:53", "remaining_time": "0:34:19", "throughput": 2312.02, "total_tokens": 33971944} {"current_steps": 58890, "total_steps": 67140, "loss": 0.6523, "lr": 2.2651923593854985e-06, "epoch": 8.771224307417336, "percentage": 87.71, "elapsed_time": "4:04:54", "remaining_time": "0:34:18", "throughput": 2312.03, "total_tokens": 33974504} {"current_steps": 58895, "total_steps": 67140, "loss": 0.4793, "lr": 2.2624900023674678e-06, "epoch": 8.771969019958297, "percentage": 87.72, "elapsed_time": "4:04:55", "remaining_time": "0:34:17", "throughput": 2312.04, "total_tokens": 33977416} {"current_steps": 58900, "total_steps": 67140, "loss": 0.5865, "lr": 2.259789181857916e-06, "epoch": 8.772713732499255, "percentage": 87.73, "elapsed_time": "4:04:56", "remaining_time": "0:34:16", "throughput": 2312.06, "total_tokens": 33980200} {"current_steps": 58905, "total_steps": 67140, "loss": 0.5756, "lr": 2.2570898980393552e-06, "epoch": 8.773458445040214, "percentage": 87.73, "elapsed_time": "4:04:58", "remaining_time": "0:34:14", "throughput": 2312.07, "total_tokens": 33982920} {"current_steps": 58910, "total_steps": 67140, "loss": 0.7466, "lr": 2.254392151094198e-06, "epoch": 8.774203157581173, "percentage": 87.74, "elapsed_time": "4:04:59", "remaining_time": "0:34:13", "throughput": 2312.09, "total_tokens": 33985800} {"current_steps": 58915, "total_steps": 67140, "loss": 0.4356, "lr": 2.251695941204737e-06, "epoch": 8.774947870122134, "percentage": 87.75, "elapsed_time": "4:05:00", "remaining_time": "0:34:12", "throughput": 2312.12, "total_tokens": 33988968} {"current_steps": 58920, "total_steps": 67140, "loss": 0.6316, "lr": 2.2490012685531777e-06, "epoch": 8.775692582663092, "percentage": 87.76, "elapsed_time": "4:05:01", "remaining_time": "0:34:11", "throughput": 2312.14, "total_tokens": 33992008} {"current_steps": 58925, "total_steps": 67140, "loss": 0.5714, "lr": 2.246308133321612e-06, "epoch": 8.776437295204051, "percentage": 87.76, "elapsed_time": "4:05:02", "remaining_time": "0:34:09", "throughput": 2312.16, "total_tokens": 33994856} {"current_steps": 58930, "total_steps": 67140, "loss": 0.3736, "lr": 2.2436165356920335e-06, "epoch": 8.77718200774501, "percentage": 87.77, "elapsed_time": "4:05:03", "remaining_time": "0:34:08", "throughput": 2312.17, "total_tokens": 33997736} {"current_steps": 58935, "total_steps": 67140, "loss": 0.4143, "lr": 2.2409264758463363e-06, "epoch": 8.77792672028597, "percentage": 87.78, "elapsed_time": "4:05:04", "remaining_time": "0:34:07", "throughput": 2312.19, "total_tokens": 34000648} {"current_steps": 58940, "total_steps": 67140, "loss": 0.4789, "lr": 2.238237953966288e-06, "epoch": 8.778671432826929, "percentage": 87.79, "elapsed_time": "4:05:06", "remaining_time": "0:34:05", "throughput": 2312.22, "total_tokens": 34003656} {"current_steps": 58945, "total_steps": 67140, "loss": 0.4155, "lr": 2.2355509702335825e-06, "epoch": 8.779416145367888, "percentage": 87.79, "elapsed_time": "4:05:07", "remaining_time": "0:34:04", "throughput": 2312.22, "total_tokens": 34006344} {"current_steps": 58950, "total_steps": 67140, "loss": 0.4147, "lr": 2.2328655248297833e-06, "epoch": 8.780160857908847, "percentage": 87.8, "elapsed_time": "4:05:08", "remaining_time": "0:34:03", "throughput": 2312.23, "total_tokens": 34009096} {"current_steps": 58955, "total_steps": 67140, "loss": 0.4569, "lr": 2.2301816179363695e-06, "epoch": 8.780905570449807, "percentage": 87.81, "elapsed_time": "4:05:09", "remaining_time": "0:34:02", "throughput": 2312.26, "total_tokens": 34012232} {"current_steps": 58960, "total_steps": 67140, "loss": 0.4944, "lr": 2.2274992497347045e-06, "epoch": 8.781650282990766, "percentage": 87.82, "elapsed_time": "4:05:10", "remaining_time": "0:34:00", "throughput": 2312.29, "total_tokens": 34015304} {"current_steps": 58965, "total_steps": 67140, "loss": 0.5408, "lr": 2.224818420406055e-06, "epoch": 8.782394995531725, "percentage": 87.82, "elapsed_time": "4:05:11", "remaining_time": "0:33:59", "throughput": 2312.32, "total_tokens": 34018472} {"current_steps": 58970, "total_steps": 67140, "loss": 0.4348, "lr": 2.2221391301315787e-06, "epoch": 8.783139708072683, "percentage": 87.83, "elapsed_time": "4:05:12", "remaining_time": "0:33:58", "throughput": 2312.33, "total_tokens": 34021224} {"current_steps": 58975, "total_steps": 67140, "loss": 0.6087, "lr": 2.2194613790923387e-06, "epoch": 8.783884420613644, "percentage": 87.84, "elapsed_time": "4:05:14", "remaining_time": "0:33:57", "throughput": 2312.35, "total_tokens": 34024136} {"current_steps": 58980, "total_steps": 67140, "loss": 0.8593, "lr": 2.2167851674692763e-06, "epoch": 8.784629133154603, "percentage": 87.85, "elapsed_time": "4:05:15", "remaining_time": "0:33:55", "throughput": 2312.36, "total_tokens": 34026920} {"current_steps": 58985, "total_steps": 67140, "loss": 0.6339, "lr": 2.214110495443242e-06, "epoch": 8.785373845695561, "percentage": 87.85, "elapsed_time": "4:05:16", "remaining_time": "0:33:54", "throughput": 2312.38, "total_tokens": 34029896} {"current_steps": 58990, "total_steps": 67140, "loss": 0.5197, "lr": 2.211437363194976e-06, "epoch": 8.78611855823652, "percentage": 87.86, "elapsed_time": "4:05:17", "remaining_time": "0:33:53", "throughput": 2312.39, "total_tokens": 34032584} {"current_steps": 58995, "total_steps": 67140, "loss": 0.6462, "lr": 2.2087657709051246e-06, "epoch": 8.78686327077748, "percentage": 87.87, "elapsed_time": "4:05:18", "remaining_time": "0:33:52", "throughput": 2312.42, "total_tokens": 34035656} {"current_steps": 59000, "total_steps": 67140, "loss": 0.3636, "lr": 2.206095718754217e-06, "epoch": 8.78760798331844, "percentage": 87.88, "elapsed_time": "4:05:19", "remaining_time": "0:33:50", "throughput": 2312.44, "total_tokens": 34038536} {"current_steps": 59005, "total_steps": 67140, "loss": 0.6227, "lr": 2.2034272069226897e-06, "epoch": 8.788352695859398, "percentage": 87.88, "elapsed_time": "4:05:20", "remaining_time": "0:33:49", "throughput": 2312.46, "total_tokens": 34041640} {"current_steps": 59010, "total_steps": 67140, "loss": 0.5871, "lr": 2.2007602355908707e-06, "epoch": 8.789097408400357, "percentage": 87.89, "elapsed_time": "4:05:22", "remaining_time": "0:33:48", "throughput": 2312.48, "total_tokens": 34044488} {"current_steps": 59015, "total_steps": 67140, "loss": 0.7837, "lr": 2.19809480493898e-06, "epoch": 8.789842120941316, "percentage": 87.9, "elapsed_time": "4:05:23", "remaining_time": "0:33:47", "throughput": 2312.49, "total_tokens": 34047176} {"current_steps": 59020, "total_steps": 67140, "loss": 0.6515, "lr": 2.195430915147134e-06, "epoch": 8.790586833482276, "percentage": 87.91, "elapsed_time": "4:05:24", "remaining_time": "0:33:45", "throughput": 2312.51, "total_tokens": 34050152} {"current_steps": 59025, "total_steps": 67140, "loss": 0.5398, "lr": 2.192768566395348e-06, "epoch": 8.791331546023235, "percentage": 87.91, "elapsed_time": "4:05:25", "remaining_time": "0:33:44", "throughput": 2312.55, "total_tokens": 34053512} {"current_steps": 59030, "total_steps": 67140, "loss": 0.599, "lr": 2.1901077588635357e-06, "epoch": 8.792076258564194, "percentage": 87.92, "elapsed_time": "4:05:26", "remaining_time": "0:33:43", "throughput": 2312.57, "total_tokens": 34056488} {"current_steps": 59035, "total_steps": 67140, "loss": 0.7607, "lr": 2.187448492731503e-06, "epoch": 8.792820971105153, "percentage": 87.93, "elapsed_time": "4:05:27", "remaining_time": "0:33:42", "throughput": 2312.58, "total_tokens": 34059272} {"current_steps": 59040, "total_steps": 67140, "loss": 0.6927, "lr": 2.184790768178957e-06, "epoch": 8.793565683646113, "percentage": 87.94, "elapsed_time": "4:05:29", "remaining_time": "0:33:40", "throughput": 2312.63, "total_tokens": 34062760} {"current_steps": 59045, "total_steps": 67140, "loss": 0.4444, "lr": 2.182134585385487e-06, "epoch": 8.794310396187072, "percentage": 87.94, "elapsed_time": "4:05:30", "remaining_time": "0:33:39", "throughput": 2312.65, "total_tokens": 34065704} {"current_steps": 59050, "total_steps": 67140, "loss": 0.4232, "lr": 2.179479944530588e-06, "epoch": 8.79505510872803, "percentage": 87.95, "elapsed_time": "4:05:31", "remaining_time": "0:33:38", "throughput": 2312.67, "total_tokens": 34068648} {"current_steps": 59055, "total_steps": 67140, "loss": 0.3109, "lr": 2.1768268457936613e-06, "epoch": 8.79579982126899, "percentage": 87.96, "elapsed_time": "4:05:32", "remaining_time": "0:33:36", "throughput": 2312.69, "total_tokens": 34071624} {"current_steps": 59060, "total_steps": 67140, "loss": 0.6595, "lr": 2.1741752893539775e-06, "epoch": 8.79654453380995, "percentage": 87.97, "elapsed_time": "4:05:33", "remaining_time": "0:33:35", "throughput": 2312.71, "total_tokens": 34074600} {"current_steps": 59065, "total_steps": 67140, "loss": 0.5706, "lr": 2.1715252753907234e-06, "epoch": 8.797289246350909, "percentage": 87.97, "elapsed_time": "4:05:34", "remaining_time": "0:33:34", "throughput": 2312.74, "total_tokens": 34077832} {"current_steps": 59070, "total_steps": 67140, "loss": 0.6226, "lr": 2.168876804082978e-06, "epoch": 8.798033958891867, "percentage": 87.98, "elapsed_time": "4:05:35", "remaining_time": "0:33:33", "throughput": 2312.75, "total_tokens": 34080456} {"current_steps": 59075, "total_steps": 67140, "loss": 0.5975, "lr": 2.166229875609718e-06, "epoch": 8.798778671432826, "percentage": 87.99, "elapsed_time": "4:05:37", "remaining_time": "0:33:31", "throughput": 2312.76, "total_tokens": 34083336} {"current_steps": 59080, "total_steps": 67140, "loss": 0.8758, "lr": 2.163584490149806e-06, "epoch": 8.799523383973787, "percentage": 88.0, "elapsed_time": "4:05:38", "remaining_time": "0:33:30", "throughput": 2312.77, "total_tokens": 34086088} {"current_steps": 59085, "total_steps": 67140, "loss": 0.8353, "lr": 2.1609406478820066e-06, "epoch": 8.800268096514746, "percentage": 88.0, "elapsed_time": "4:05:39", "remaining_time": "0:33:29", "throughput": 2312.8, "total_tokens": 34089224} {"current_steps": 59090, "total_steps": 67140, "loss": 0.4851, "lr": 2.15829834898498e-06, "epoch": 8.801012809055704, "percentage": 88.01, "elapsed_time": "4:05:40", "remaining_time": "0:33:28", "throughput": 2312.82, "total_tokens": 34092168} {"current_steps": 59095, "total_steps": 67140, "loss": 0.5456, "lr": 2.155657593637289e-06, "epoch": 8.801757521596663, "percentage": 88.02, "elapsed_time": "4:05:41", "remaining_time": "0:33:26", "throughput": 2312.83, "total_tokens": 34094952} {"current_steps": 59100, "total_steps": 67140, "loss": 0.773, "lr": 2.1530183820173743e-06, "epoch": 8.802502234137624, "percentage": 88.03, "elapsed_time": "4:05:42", "remaining_time": "0:33:25", "throughput": 2312.84, "total_tokens": 34097736} {"current_steps": 59105, "total_steps": 67140, "loss": 0.6237, "lr": 2.1503807143035875e-06, "epoch": 8.803246946678582, "percentage": 88.03, "elapsed_time": "4:05:43", "remaining_time": "0:33:24", "throughput": 2312.86, "total_tokens": 34100712} {"current_steps": 59110, "total_steps": 67140, "loss": 0.6776, "lr": 2.1477445906741776e-06, "epoch": 8.803991659219541, "percentage": 88.04, "elapsed_time": "4:05:45", "remaining_time": "0:33:23", "throughput": 2312.87, "total_tokens": 34103432} {"current_steps": 59115, "total_steps": 67140, "loss": 0.744, "lr": 2.1451100113072748e-06, "epoch": 8.8047363717605, "percentage": 88.05, "elapsed_time": "4:05:46", "remaining_time": "0:33:21", "throughput": 2312.89, "total_tokens": 34106408} {"current_steps": 59120, "total_steps": 67140, "loss": 0.6807, "lr": 2.142476976380914e-06, "epoch": 8.80548108430146, "percentage": 88.05, "elapsed_time": "4:05:47", "remaining_time": "0:33:20", "throughput": 2312.9, "total_tokens": 34109032} {"current_steps": 59125, "total_steps": 67140, "loss": 0.5868, "lr": 2.1398454860730277e-06, "epoch": 8.80622579684242, "percentage": 88.06, "elapsed_time": "4:05:48", "remaining_time": "0:33:19", "throughput": 2312.92, "total_tokens": 34111944} {"current_steps": 59130, "total_steps": 67140, "loss": 0.521, "lr": 2.1372155405614436e-06, "epoch": 8.806970509383378, "percentage": 88.07, "elapsed_time": "4:05:49", "remaining_time": "0:33:18", "throughput": 2312.93, "total_tokens": 34114760} {"current_steps": 59135, "total_steps": 67140, "loss": 0.4519, "lr": 2.13458714002388e-06, "epoch": 8.807715221924337, "percentage": 88.08, "elapsed_time": "4:05:50", "remaining_time": "0:33:16", "throughput": 2312.94, "total_tokens": 34117448} {"current_steps": 59140, "total_steps": 67140, "loss": 0.3906, "lr": 2.1319602846379518e-06, "epoch": 8.808459934465297, "percentage": 88.08, "elapsed_time": "4:05:51", "remaining_time": "0:33:15", "throughput": 2312.96, "total_tokens": 34120456} {"current_steps": 59145, "total_steps": 67140, "loss": 0.5099, "lr": 2.1293349745811765e-06, "epoch": 8.809204647006256, "percentage": 88.09, "elapsed_time": "4:05:52", "remaining_time": "0:33:14", "throughput": 2312.98, "total_tokens": 34123336} {"current_steps": 59150, "total_steps": 67140, "loss": 0.6607, "lr": 2.1267112100309545e-06, "epoch": 8.809949359547215, "percentage": 88.1, "elapsed_time": "4:05:54", "remaining_time": "0:33:12", "throughput": 2312.99, "total_tokens": 34126152} {"current_steps": 59155, "total_steps": 67140, "loss": 0.4955, "lr": 2.1240889911645913e-06, "epoch": 8.810694072088173, "percentage": 88.11, "elapsed_time": "4:05:55", "remaining_time": "0:33:11", "throughput": 2313.01, "total_tokens": 34129000} {"current_steps": 59160, "total_steps": 67140, "loss": 0.3512, "lr": 2.121468318159289e-06, "epoch": 8.811438784629132, "percentage": 88.11, "elapsed_time": "4:05:56", "remaining_time": "0:33:10", "throughput": 2313.04, "total_tokens": 34132008} {"current_steps": 59165, "total_steps": 67140, "loss": 0.5448, "lr": 2.1188491911921403e-06, "epoch": 8.812183497170093, "percentage": 88.12, "elapsed_time": "4:05:57", "remaining_time": "0:33:09", "throughput": 2313.05, "total_tokens": 34134728} {"current_steps": 59170, "total_steps": 67140, "loss": 0.5744, "lr": 2.1162316104401364e-06, "epoch": 8.812928209711052, "percentage": 88.13, "elapsed_time": "4:05:58", "remaining_time": "0:33:07", "throughput": 2313.06, "total_tokens": 34137512} {"current_steps": 59175, "total_steps": 67140, "loss": 0.6764, "lr": 2.1136155760801633e-06, "epoch": 8.81367292225201, "percentage": 88.14, "elapsed_time": "4:05:59", "remaining_time": "0:33:06", "throughput": 2313.07, "total_tokens": 34140328} {"current_steps": 59180, "total_steps": 67140, "loss": 0.6269, "lr": 2.1110010882890025e-06, "epoch": 8.81441763479297, "percentage": 88.14, "elapsed_time": "4:06:00", "remaining_time": "0:33:05", "throughput": 2313.09, "total_tokens": 34143336} {"current_steps": 59185, "total_steps": 67140, "loss": 0.5424, "lr": 2.1083881472433232e-06, "epoch": 8.81516234733393, "percentage": 88.15, "elapsed_time": "4:06:02", "remaining_time": "0:33:04", "throughput": 2313.11, "total_tokens": 34146088} {"current_steps": 59190, "total_steps": 67140, "loss": 0.7988, "lr": 2.105776753119701e-06, "epoch": 8.815907059874888, "percentage": 88.16, "elapsed_time": "4:06:03", "remaining_time": "0:33:02", "throughput": 2313.12, "total_tokens": 34148840} {"current_steps": 59195, "total_steps": 67140, "loss": 0.7316, "lr": 2.1031669060946056e-06, "epoch": 8.816651772415847, "percentage": 88.17, "elapsed_time": "4:06:04", "remaining_time": "0:33:01", "throughput": 2313.15, "total_tokens": 34151944} {"current_steps": 59200, "total_steps": 67140, "loss": 0.5265, "lr": 2.100558606344399e-06, "epoch": 8.817396484956806, "percentage": 88.17, "elapsed_time": "4:06:05", "remaining_time": "0:33:00", "throughput": 2313.18, "total_tokens": 34155112} {"current_steps": 59205, "total_steps": 67140, "loss": 0.6753, "lr": 2.0979518540453435e-06, "epoch": 8.818141197497766, "percentage": 88.18, "elapsed_time": "4:06:06", "remaining_time": "0:32:59", "throughput": 2313.18, "total_tokens": 34157800} {"current_steps": 59210, "total_steps": 67140, "loss": 0.6269, "lr": 2.095346649373586e-06, "epoch": 8.818885910038725, "percentage": 88.19, "elapsed_time": "4:06:07", "remaining_time": "0:32:57", "throughput": 2313.2, "total_tokens": 34160680} {"current_steps": 59215, "total_steps": 67140, "loss": 0.5838, "lr": 2.092742992505181e-06, "epoch": 8.819630622579684, "percentage": 88.2, "elapsed_time": "4:06:08", "remaining_time": "0:32:56", "throughput": 2313.21, "total_tokens": 34163336} {"current_steps": 59220, "total_steps": 67140, "loss": 0.4099, "lr": 2.090140883616068e-06, "epoch": 8.820375335120643, "percentage": 88.2, "elapsed_time": "4:06:09", "remaining_time": "0:32:55", "throughput": 2313.22, "total_tokens": 34166120} {"current_steps": 59225, "total_steps": 67140, "loss": 0.5039, "lr": 2.087540322882087e-06, "epoch": 8.821120047661603, "percentage": 88.21, "elapsed_time": "4:06:11", "remaining_time": "0:32:54", "throughput": 2313.23, "total_tokens": 34169000} {"current_steps": 59230, "total_steps": 67140, "loss": 0.4443, "lr": 2.084941310478977e-06, "epoch": 8.821864760202562, "percentage": 88.22, "elapsed_time": "4:06:12", "remaining_time": "0:32:52", "throughput": 2313.26, "total_tokens": 34172008} {"current_steps": 59235, "total_steps": 67140, "loss": 0.5903, "lr": 2.0823438465823656e-06, "epoch": 8.82260947274352, "percentage": 88.23, "elapsed_time": "4:06:13", "remaining_time": "0:32:51", "throughput": 2313.27, "total_tokens": 34174792} {"current_steps": 59240, "total_steps": 67140, "loss": 0.4845, "lr": 2.079747931367787e-06, "epoch": 8.82335418528448, "percentage": 88.23, "elapsed_time": "4:06:14", "remaining_time": "0:32:50", "throughput": 2313.28, "total_tokens": 34177576} {"current_steps": 59245, "total_steps": 67140, "loss": 0.4522, "lr": 2.0771535650106533e-06, "epoch": 8.82409889782544, "percentage": 88.24, "elapsed_time": "4:06:15", "remaining_time": "0:32:49", "throughput": 2313.3, "total_tokens": 34180488} {"current_steps": 59250, "total_steps": 67140, "loss": 0.5184, "lr": 2.0745607476862826e-06, "epoch": 8.824843610366399, "percentage": 88.25, "elapsed_time": "4:06:16", "remaining_time": "0:32:47", "throughput": 2313.31, "total_tokens": 34183176} {"current_steps": 59255, "total_steps": 67140, "loss": 0.5843, "lr": 2.0719694795698907e-06, "epoch": 8.825588322907358, "percentage": 88.26, "elapsed_time": "4:06:17", "remaining_time": "0:32:46", "throughput": 2313.33, "total_tokens": 34186024} {"current_steps": 59260, "total_steps": 67140, "loss": 0.7007, "lr": 2.0693797608365817e-06, "epoch": 8.826333035448316, "percentage": 88.26, "elapsed_time": "4:06:18", "remaining_time": "0:32:45", "throughput": 2313.35, "total_tokens": 34188904} {"current_steps": 59265, "total_steps": 67140, "loss": 0.658, "lr": 2.0667915916613573e-06, "epoch": 8.827077747989277, "percentage": 88.27, "elapsed_time": "4:06:20", "remaining_time": "0:32:43", "throughput": 2313.35, "total_tokens": 34191464} {"current_steps": 59270, "total_steps": 67140, "loss": 0.6821, "lr": 2.0642049722191193e-06, "epoch": 8.827822460530236, "percentage": 88.28, "elapsed_time": "4:06:21", "remaining_time": "0:32:42", "throughput": 2313.36, "total_tokens": 34194184} {"current_steps": 59275, "total_steps": 67140, "loss": 0.7894, "lr": 2.0616199026846613e-06, "epoch": 8.828567173071194, "percentage": 88.29, "elapsed_time": "4:06:22", "remaining_time": "0:32:41", "throughput": 2313.38, "total_tokens": 34197160} {"current_steps": 59280, "total_steps": 67140, "loss": 0.5509, "lr": 2.059036383232668e-06, "epoch": 8.829311885612153, "percentage": 88.29, "elapsed_time": "4:06:23", "remaining_time": "0:32:40", "throughput": 2313.4, "total_tokens": 34200200} {"current_steps": 59285, "total_steps": 67140, "loss": 0.5625, "lr": 2.0564544140377228e-06, "epoch": 8.830056598153114, "percentage": 88.3, "elapsed_time": "4:06:24", "remaining_time": "0:32:38", "throughput": 2313.43, "total_tokens": 34203368} {"current_steps": 59290, "total_steps": 67140, "loss": 0.6458, "lr": 2.0538739952743054e-06, "epoch": 8.830801310694072, "percentage": 88.31, "elapsed_time": "4:06:25", "remaining_time": "0:32:37", "throughput": 2313.44, "total_tokens": 34206024} {"current_steps": 59295, "total_steps": 67140, "loss": 0.7524, "lr": 2.0512951271167922e-06, "epoch": 8.831546023235031, "percentage": 88.32, "elapsed_time": "4:06:26", "remaining_time": "0:32:36", "throughput": 2313.45, "total_tokens": 34208744} {"current_steps": 59300, "total_steps": 67140, "loss": 0.6208, "lr": 2.048717809739459e-06, "epoch": 8.83229073577599, "percentage": 88.32, "elapsed_time": "4:06:28", "remaining_time": "0:32:35", "throughput": 2313.46, "total_tokens": 34211560} {"current_steps": 59305, "total_steps": 67140, "loss": 0.5657, "lr": 2.046142043316457e-06, "epoch": 8.83303544831695, "percentage": 88.33, "elapsed_time": "4:06:29", "remaining_time": "0:32:33", "throughput": 2313.48, "total_tokens": 34214312} {"current_steps": 59310, "total_steps": 67140, "loss": 0.4125, "lr": 2.0435678280218556e-06, "epoch": 8.83378016085791, "percentage": 88.34, "elapsed_time": "4:06:30", "remaining_time": "0:32:32", "throughput": 2313.49, "total_tokens": 34217064} {"current_steps": 59315, "total_steps": 67140, "loss": 0.5828, "lr": 2.040995164029602e-06, "epoch": 8.834524873398868, "percentage": 88.35, "elapsed_time": "4:06:31", "remaining_time": "0:32:31", "throughput": 2313.5, "total_tokens": 34219912} {"current_steps": 59320, "total_steps": 67140, "loss": 0.5074, "lr": 2.038424051513549e-06, "epoch": 8.835269585939827, "percentage": 88.35, "elapsed_time": "4:06:32", "remaining_time": "0:32:30", "throughput": 2313.52, "total_tokens": 34222728} {"current_steps": 59325, "total_steps": 67140, "loss": 0.4438, "lr": 2.035854490647446e-06, "epoch": 8.836014298480787, "percentage": 88.36, "elapsed_time": "4:06:33", "remaining_time": "0:32:28", "throughput": 2313.54, "total_tokens": 34225640} {"current_steps": 59330, "total_steps": 67140, "loss": 0.4619, "lr": 2.033286481604932e-06, "epoch": 8.836759011021746, "percentage": 88.37, "elapsed_time": "4:06:34", "remaining_time": "0:32:27", "throughput": 2313.55, "total_tokens": 34228392} {"current_steps": 59335, "total_steps": 67140, "loss": 0.3675, "lr": 2.0307200245595403e-06, "epoch": 8.837503723562705, "percentage": 88.38, "elapsed_time": "4:06:35", "remaining_time": "0:32:26", "throughput": 2313.58, "total_tokens": 34231592} {"current_steps": 59340, "total_steps": 67140, "loss": 0.4746, "lr": 2.028155119684708e-06, "epoch": 8.838248436103664, "percentage": 88.38, "elapsed_time": "4:06:37", "remaining_time": "0:32:25", "throughput": 2313.6, "total_tokens": 34234568} {"current_steps": 59345, "total_steps": 67140, "loss": 0.7148, "lr": 2.0255917671537534e-06, "epoch": 8.838993148644622, "percentage": 88.39, "elapsed_time": "4:06:38", "remaining_time": "0:32:23", "throughput": 2313.63, "total_tokens": 34237640} {"current_steps": 59350, "total_steps": 67140, "loss": 0.605, "lr": 2.0230299671399e-06, "epoch": 8.839737861185583, "percentage": 88.4, "elapsed_time": "4:06:39", "remaining_time": "0:32:22", "throughput": 2313.65, "total_tokens": 34240456} {"current_steps": 59355, "total_steps": 67140, "loss": 0.403, "lr": 2.0204697198162593e-06, "epoch": 8.840482573726542, "percentage": 88.4, "elapsed_time": "4:06:40", "remaining_time": "0:32:21", "throughput": 2313.68, "total_tokens": 34243688} {"current_steps": 59360, "total_steps": 67140, "loss": 0.6256, "lr": 2.0179110253558507e-06, "epoch": 8.8412272862675, "percentage": 88.41, "elapsed_time": "4:06:41", "remaining_time": "0:32:19", "throughput": 2313.7, "total_tokens": 34246600} {"current_steps": 59365, "total_steps": 67140, "loss": 0.7512, "lr": 2.0153538839315756e-06, "epoch": 8.84197199880846, "percentage": 88.42, "elapsed_time": "4:06:42", "remaining_time": "0:32:18", "throughput": 2313.71, "total_tokens": 34249384} {"current_steps": 59370, "total_steps": 67140, "loss": 0.6883, "lr": 2.0127982957162395e-06, "epoch": 8.84271671134942, "percentage": 88.43, "elapsed_time": "4:06:43", "remaining_time": "0:32:17", "throughput": 2313.73, "total_tokens": 34252232} {"current_steps": 59375, "total_steps": 67140, "loss": 0.688, "lr": 2.0102442608825324e-06, "epoch": 8.843461423890378, "percentage": 88.43, "elapsed_time": "4:06:45", "remaining_time": "0:32:16", "throughput": 2313.74, "total_tokens": 34255080} {"current_steps": 59380, "total_steps": 67140, "loss": 0.7506, "lr": 2.007691779603052e-06, "epoch": 8.844206136431337, "percentage": 88.44, "elapsed_time": "4:06:46", "remaining_time": "0:32:14", "throughput": 2313.76, "total_tokens": 34257960} {"current_steps": 59385, "total_steps": 67140, "loss": 0.4918, "lr": 2.0051408520502774e-06, "epoch": 8.844950848972296, "percentage": 88.45, "elapsed_time": "4:06:47", "remaining_time": "0:32:13", "throughput": 2313.78, "total_tokens": 34260904} {"current_steps": 59390, "total_steps": 67140, "loss": 0.7923, "lr": 2.0025914783965926e-06, "epoch": 8.845695561513256, "percentage": 88.46, "elapsed_time": "4:06:48", "remaining_time": "0:32:12", "throughput": 2313.79, "total_tokens": 34263560} {"current_steps": 59395, "total_steps": 67140, "loss": 0.5316, "lr": 2.000043658814277e-06, "epoch": 8.846440274054215, "percentage": 88.46, "elapsed_time": "4:06:49", "remaining_time": "0:32:11", "throughput": 2313.81, "total_tokens": 34266536} {"current_steps": 59400, "total_steps": 67140, "loss": 0.4907, "lr": 1.9974973934755003e-06, "epoch": 8.847184986595174, "percentage": 88.47, "elapsed_time": "4:06:50", "remaining_time": "0:32:09", "throughput": 2313.81, "total_tokens": 34269160} {"current_steps": 59405, "total_steps": 67140, "loss": 0.6148, "lr": 1.994952682552331e-06, "epoch": 8.847929699136133, "percentage": 88.48, "elapsed_time": "4:06:51", "remaining_time": "0:32:08", "throughput": 2313.84, "total_tokens": 34272168} {"current_steps": 59410, "total_steps": 67140, "loss": 0.6751, "lr": 1.9924095262167238e-06, "epoch": 8.848674411677093, "percentage": 88.49, "elapsed_time": "4:06:52", "remaining_time": "0:32:07", "throughput": 2313.85, "total_tokens": 34274984} {"current_steps": 59415, "total_steps": 67140, "loss": 0.6387, "lr": 1.9898679246405372e-06, "epoch": 8.849419124218052, "percentage": 88.49, "elapsed_time": "4:06:54", "remaining_time": "0:32:06", "throughput": 2313.87, "total_tokens": 34277896} {"current_steps": 59420, "total_steps": 67140, "loss": 0.7364, "lr": 1.9873278779955316e-06, "epoch": 8.85016383675901, "percentage": 88.5, "elapsed_time": "4:06:55", "remaining_time": "0:32:04", "throughput": 2313.89, "total_tokens": 34280872} {"current_steps": 59425, "total_steps": 67140, "loss": 0.6077, "lr": 1.9847893864533395e-06, "epoch": 8.85090854929997, "percentage": 88.51, "elapsed_time": "4:06:56", "remaining_time": "0:32:03", "throughput": 2313.9, "total_tokens": 34283624} {"current_steps": 59430, "total_steps": 67140, "loss": 0.5783, "lr": 1.9822524501855067e-06, "epoch": 8.85165326184093, "percentage": 88.52, "elapsed_time": "4:06:57", "remaining_time": "0:32:02", "throughput": 2313.91, "total_tokens": 34286344} {"current_steps": 59435, "total_steps": 67140, "loss": 0.5339, "lr": 1.979717069363471e-06, "epoch": 8.852397974381889, "percentage": 88.52, "elapsed_time": "4:06:58", "remaining_time": "0:32:01", "throughput": 2313.93, "total_tokens": 34289160} {"current_steps": 59440, "total_steps": 67140, "loss": 0.4658, "lr": 1.9771832441585647e-06, "epoch": 8.853142686922848, "percentage": 88.53, "elapsed_time": "4:06:59", "remaining_time": "0:31:59", "throughput": 2313.95, "total_tokens": 34292104} {"current_steps": 59445, "total_steps": 67140, "loss": 0.6048, "lr": 1.9746509747420065e-06, "epoch": 8.853887399463806, "percentage": 88.54, "elapsed_time": "4:07:00", "remaining_time": "0:31:58", "throughput": 2313.96, "total_tokens": 34294760} {"current_steps": 59450, "total_steps": 67140, "loss": 0.5806, "lr": 1.972120261284924e-06, "epoch": 8.854632112004767, "percentage": 88.55, "elapsed_time": "4:07:01", "remaining_time": "0:31:57", "throughput": 2313.98, "total_tokens": 34297736} {"current_steps": 59455, "total_steps": 67140, "loss": 0.6049, "lr": 1.9695911039583265e-06, "epoch": 8.855376824545726, "percentage": 88.55, "elapsed_time": "4:07:03", "remaining_time": "0:31:55", "throughput": 2313.99, "total_tokens": 34300488} {"current_steps": 59460, "total_steps": 67140, "loss": 0.5125, "lr": 1.9670635029331336e-06, "epoch": 8.856121537086684, "percentage": 88.56, "elapsed_time": "4:07:04", "remaining_time": "0:31:54", "throughput": 2314.01, "total_tokens": 34303432} {"current_steps": 59465, "total_steps": 67140, "loss": 0.5969, "lr": 1.9645374583801417e-06, "epoch": 8.856866249627643, "percentage": 88.57, "elapsed_time": "4:07:05", "remaining_time": "0:31:53", "throughput": 2314.02, "total_tokens": 34306152} {"current_steps": 59470, "total_steps": 67140, "loss": 0.4699, "lr": 1.9620129704700506e-06, "epoch": 8.857610962168604, "percentage": 88.58, "elapsed_time": "4:07:06", "remaining_time": "0:31:52", "throughput": 2314.04, "total_tokens": 34309192} {"current_steps": 59475, "total_steps": 67140, "loss": 0.4701, "lr": 1.95949003937346e-06, "epoch": 8.858355674709562, "percentage": 88.58, "elapsed_time": "4:07:07", "remaining_time": "0:31:50", "throughput": 2314.05, "total_tokens": 34311944} {"current_steps": 59480, "total_steps": 67140, "loss": 0.6715, "lr": 1.9569686652608555e-06, "epoch": 8.859100387250521, "percentage": 88.59, "elapsed_time": "4:07:08", "remaining_time": "0:31:49", "throughput": 2314.08, "total_tokens": 34314920} {"current_steps": 59485, "total_steps": 67140, "loss": 0.5429, "lr": 1.9544488483026203e-06, "epoch": 8.85984509979148, "percentage": 88.6, "elapsed_time": "4:07:09", "remaining_time": "0:31:48", "throughput": 2314.08, "total_tokens": 34317608} {"current_steps": 59490, "total_steps": 67140, "loss": 0.5144, "lr": 1.9519305886690378e-06, "epoch": 8.86058981233244, "percentage": 88.61, "elapsed_time": "4:07:11", "remaining_time": "0:31:47", "throughput": 2314.11, "total_tokens": 34320680} {"current_steps": 59495, "total_steps": 67140, "loss": 0.6298, "lr": 1.949413886530277e-06, "epoch": 8.8613345248734, "percentage": 88.61, "elapsed_time": "4:07:12", "remaining_time": "0:31:45", "throughput": 2314.12, "total_tokens": 34323272} {"current_steps": 59500, "total_steps": 67140, "loss": 0.5289, "lr": 1.9468987420564135e-06, "epoch": 8.862079237414358, "percentage": 88.62, "elapsed_time": "4:07:13", "remaining_time": "0:31:44", "throughput": 2314.13, "total_tokens": 34326088} {"current_steps": 59505, "total_steps": 67140, "loss": 0.5217, "lr": 1.9443851554174026e-06, "epoch": 8.862823949955317, "percentage": 88.63, "elapsed_time": "4:07:14", "remaining_time": "0:31:43", "throughput": 2314.14, "total_tokens": 34328776} {"current_steps": 59510, "total_steps": 67140, "loss": 0.3794, "lr": 1.9418731267831088e-06, "epoch": 8.863568662496277, "percentage": 88.64, "elapsed_time": "4:07:15", "remaining_time": "0:31:42", "throughput": 2314.15, "total_tokens": 34331368} {"current_steps": 59515, "total_steps": 67140, "loss": 0.5127, "lr": 1.939362656323279e-06, "epoch": 8.864313375037236, "percentage": 88.64, "elapsed_time": "4:07:16", "remaining_time": "0:31:40", "throughput": 2314.16, "total_tokens": 34334120} {"current_steps": 59520, "total_steps": 67140, "loss": 0.5139, "lr": 1.936853744207562e-06, "epoch": 8.865058087578195, "percentage": 88.65, "elapsed_time": "4:07:17", "remaining_time": "0:31:39", "throughput": 2314.17, "total_tokens": 34336872} {"current_steps": 59525, "total_steps": 67140, "loss": 0.4411, "lr": 1.9343463906055017e-06, "epoch": 8.865802800119154, "percentage": 88.66, "elapsed_time": "4:07:18", "remaining_time": "0:31:38", "throughput": 2314.21, "total_tokens": 34340200} {"current_steps": 59530, "total_steps": 67140, "loss": 0.5908, "lr": 1.931840595686535e-06, "epoch": 8.866547512660112, "percentage": 88.67, "elapsed_time": "4:07:19", "remaining_time": "0:31:37", "throughput": 2314.22, "total_tokens": 34342920} {"current_steps": 59535, "total_steps": 67140, "loss": 0.6034, "lr": 1.929336359619996e-06, "epoch": 8.867292225201073, "percentage": 88.67, "elapsed_time": "4:07:21", "remaining_time": "0:31:35", "throughput": 2314.23, "total_tokens": 34345704} {"current_steps": 59540, "total_steps": 67140, "loss": 0.5064, "lr": 1.9268336825751022e-06, "epoch": 8.868036937742032, "percentage": 88.68, "elapsed_time": "4:07:22", "remaining_time": "0:31:34", "throughput": 2314.25, "total_tokens": 34348712} {"current_steps": 59545, "total_steps": 67140, "loss": 0.7294, "lr": 1.9243325647209846e-06, "epoch": 8.86878165028299, "percentage": 88.69, "elapsed_time": "4:07:23", "remaining_time": "0:31:33", "throughput": 2314.27, "total_tokens": 34351528} {"current_steps": 59550, "total_steps": 67140, "loss": 0.5179, "lr": 1.9218330062266474e-06, "epoch": 8.86952636282395, "percentage": 88.7, "elapsed_time": "4:07:24", "remaining_time": "0:31:32", "throughput": 2314.28, "total_tokens": 34354248} {"current_steps": 59555, "total_steps": 67140, "loss": 0.6044, "lr": 1.919335007261008e-06, "epoch": 8.87027107536491, "percentage": 88.7, "elapsed_time": "4:07:25", "remaining_time": "0:31:30", "throughput": 2314.28, "total_tokens": 34356872} {"current_steps": 59560, "total_steps": 67140, "loss": 0.5981, "lr": 1.9168385679928707e-06, "epoch": 8.871015787905868, "percentage": 88.71, "elapsed_time": "4:07:26", "remaining_time": "0:31:29", "throughput": 2314.29, "total_tokens": 34359496} {"current_steps": 59565, "total_steps": 67140, "loss": 0.597, "lr": 1.914343688590933e-06, "epoch": 8.871760500446827, "percentage": 88.72, "elapsed_time": "4:07:27", "remaining_time": "0:31:28", "throughput": 2314.31, "total_tokens": 34362408} {"current_steps": 59570, "total_steps": 67140, "loss": 0.5266, "lr": 1.9118503692237917e-06, "epoch": 8.872505212987786, "percentage": 88.73, "elapsed_time": "4:07:28", "remaining_time": "0:31:26", "throughput": 2314.31, "total_tokens": 34364968} {"current_steps": 59575, "total_steps": 67140, "loss": 0.5512, "lr": 1.9093586100599304e-06, "epoch": 8.873249925528746, "percentage": 88.73, "elapsed_time": "4:07:30", "remaining_time": "0:31:25", "throughput": 2314.33, "total_tokens": 34367752} {"current_steps": 59580, "total_steps": 67140, "loss": 0.5955, "lr": 1.90686841126774e-06, "epoch": 8.873994638069705, "percentage": 88.74, "elapsed_time": "4:07:31", "remaining_time": "0:31:24", "throughput": 2314.34, "total_tokens": 34370632} {"current_steps": 59585, "total_steps": 67140, "loss": 0.6677, "lr": 1.9043797730154856e-06, "epoch": 8.874739350610664, "percentage": 88.75, "elapsed_time": "4:07:32", "remaining_time": "0:31:23", "throughput": 2314.34, "total_tokens": 34373224} {"current_steps": 59590, "total_steps": 67140, "loss": 0.5606, "lr": 1.9018926954713495e-06, "epoch": 8.875484063151623, "percentage": 88.75, "elapsed_time": "4:07:33", "remaining_time": "0:31:21", "throughput": 2314.36, "total_tokens": 34376008} {"current_steps": 59595, "total_steps": 67140, "loss": 0.5511, "lr": 1.8994071788033919e-06, "epoch": 8.876228775692583, "percentage": 88.76, "elapsed_time": "4:07:34", "remaining_time": "0:31:20", "throughput": 2314.38, "total_tokens": 34379048} {"current_steps": 59600, "total_steps": 67140, "loss": 0.548, "lr": 1.896923223179578e-06, "epoch": 8.876973488233542, "percentage": 88.77, "elapsed_time": "4:07:35", "remaining_time": "0:31:19", "throughput": 2314.41, "total_tokens": 34382088} {"current_steps": 59605, "total_steps": 67140, "loss": 0.6859, "lr": 1.8944408287677683e-06, "epoch": 8.8777182007745, "percentage": 88.78, "elapsed_time": "4:07:36", "remaining_time": "0:31:18", "throughput": 2314.42, "total_tokens": 34384840} {"current_steps": 59610, "total_steps": 67140, "loss": 0.6631, "lr": 1.891959995735701e-06, "epoch": 8.87846291331546, "percentage": 88.78, "elapsed_time": "4:07:37", "remaining_time": "0:31:16", "throughput": 2314.44, "total_tokens": 34387848} {"current_steps": 59615, "total_steps": 67140, "loss": 0.373, "lr": 1.8894807242510248e-06, "epoch": 8.87920762585642, "percentage": 88.79, "elapsed_time": "4:07:39", "remaining_time": "0:31:15", "throughput": 2314.46, "total_tokens": 34390888} {"current_steps": 59620, "total_steps": 67140, "loss": 0.526, "lr": 1.8870030144812894e-06, "epoch": 8.879952338397379, "percentage": 88.8, "elapsed_time": "4:07:40", "remaining_time": "0:31:14", "throughput": 2314.49, "total_tokens": 34394120} {"current_steps": 59625, "total_steps": 67140, "loss": 0.6889, "lr": 1.8845268665939109e-06, "epoch": 8.880697050938338, "percentage": 88.81, "elapsed_time": "4:07:41", "remaining_time": "0:31:13", "throughput": 2314.51, "total_tokens": 34396936} {"current_steps": 59630, "total_steps": 67140, "loss": 0.6868, "lr": 1.8820522807562302e-06, "epoch": 8.881441763479296, "percentage": 88.81, "elapsed_time": "4:07:42", "remaining_time": "0:31:11", "throughput": 2314.51, "total_tokens": 34399560} {"current_steps": 59635, "total_steps": 67140, "loss": 0.4028, "lr": 1.8795792571354637e-06, "epoch": 8.882186476020257, "percentage": 88.82, "elapsed_time": "4:07:43", "remaining_time": "0:31:10", "throughput": 2314.53, "total_tokens": 34402472} {"current_steps": 59640, "total_steps": 67140, "loss": 0.7686, "lr": 1.8771077958987333e-06, "epoch": 8.882931188561216, "percentage": 88.83, "elapsed_time": "4:07:44", "remaining_time": "0:31:09", "throughput": 2314.55, "total_tokens": 34405352} {"current_steps": 59645, "total_steps": 67140, "loss": 0.5128, "lr": 1.874637897213044e-06, "epoch": 8.883675901102174, "percentage": 88.84, "elapsed_time": "4:07:45", "remaining_time": "0:31:08", "throughput": 2314.56, "total_tokens": 34408168} {"current_steps": 59650, "total_steps": 67140, "loss": 0.6455, "lr": 1.8721695612453072e-06, "epoch": 8.884420613643133, "percentage": 88.84, "elapsed_time": "4:07:47", "remaining_time": "0:31:06", "throughput": 2314.58, "total_tokens": 34411016} {"current_steps": 59655, "total_steps": 67140, "loss": 0.5938, "lr": 1.869702788162317e-06, "epoch": 8.885165326184094, "percentage": 88.85, "elapsed_time": "4:07:48", "remaining_time": "0:31:05", "throughput": 2314.59, "total_tokens": 34413704} {"current_steps": 59660, "total_steps": 67140, "loss": 0.5981, "lr": 1.8672375781307787e-06, "epoch": 8.885910038725052, "percentage": 88.86, "elapsed_time": "4:07:49", "remaining_time": "0:31:04", "throughput": 2314.6, "total_tokens": 34416616} {"current_steps": 59665, "total_steps": 67140, "loss": 0.69, "lr": 1.864773931317268e-06, "epoch": 8.886654751266011, "percentage": 88.87, "elapsed_time": "4:07:50", "remaining_time": "0:31:03", "throughput": 2314.62, "total_tokens": 34419432} {"current_steps": 59670, "total_steps": 67140, "loss": 0.5877, "lr": 1.8623118478882733e-06, "epoch": 8.88739946380697, "percentage": 88.87, "elapsed_time": "4:07:51", "remaining_time": "0:31:01", "throughput": 2314.63, "total_tokens": 34422088} {"current_steps": 59675, "total_steps": 67140, "loss": 0.519, "lr": 1.8598513280101786e-06, "epoch": 8.88814417634793, "percentage": 88.88, "elapsed_time": "4:07:52", "remaining_time": "0:31:00", "throughput": 2314.63, "total_tokens": 34424648} {"current_steps": 59680, "total_steps": 67140, "loss": 0.653, "lr": 1.8573923718492454e-06, "epoch": 8.88888888888889, "percentage": 88.89, "elapsed_time": "4:07:53", "remaining_time": "0:30:59", "throughput": 2314.64, "total_tokens": 34427432} {"current_steps": 59685, "total_steps": 67140, "loss": 0.7107, "lr": 1.854934979571643e-06, "epoch": 8.889633601429848, "percentage": 88.9, "elapsed_time": "4:07:54", "remaining_time": "0:30:57", "throughput": 2314.66, "total_tokens": 34430280} {"current_steps": 59690, "total_steps": 67140, "loss": 0.5201, "lr": 1.8524791513434364e-06, "epoch": 8.890378313970807, "percentage": 88.9, "elapsed_time": "4:07:55", "remaining_time": "0:30:56", "throughput": 2314.67, "total_tokens": 34433000} {"current_steps": 59695, "total_steps": 67140, "loss": 0.6516, "lr": 1.8500248873305758e-06, "epoch": 8.891123026511767, "percentage": 88.91, "elapsed_time": "4:07:57", "remaining_time": "0:30:55", "throughput": 2314.69, "total_tokens": 34435944} {"current_steps": 59700, "total_steps": 67140, "loss": 0.7677, "lr": 1.8475721876989177e-06, "epoch": 8.891867739052726, "percentage": 88.92, "elapsed_time": "4:07:58", "remaining_time": "0:30:54", "throughput": 2314.7, "total_tokens": 34438824} {"current_steps": 59705, "total_steps": 67140, "loss": 0.5564, "lr": 1.845121052614196e-06, "epoch": 8.892612451593685, "percentage": 88.93, "elapsed_time": "4:07:59", "remaining_time": "0:30:52", "throughput": 2314.72, "total_tokens": 34441640} {"current_steps": 59710, "total_steps": 67140, "loss": 0.5828, "lr": 1.842671482242056e-06, "epoch": 8.893357164134644, "percentage": 88.93, "elapsed_time": "4:08:00", "remaining_time": "0:30:51", "throughput": 2314.73, "total_tokens": 34444328} {"current_steps": 59715, "total_steps": 67140, "loss": 0.5536, "lr": 1.8402234767480237e-06, "epoch": 8.894101876675602, "percentage": 88.94, "elapsed_time": "4:08:01", "remaining_time": "0:30:50", "throughput": 2314.75, "total_tokens": 34447272} {"current_steps": 59720, "total_steps": 67140, "loss": 0.4981, "lr": 1.8377770362975277e-06, "epoch": 8.894846589216563, "percentage": 88.95, "elapsed_time": "4:08:02", "remaining_time": "0:30:49", "throughput": 2314.75, "total_tokens": 34449832} {"current_steps": 59725, "total_steps": 67140, "loss": 0.5919, "lr": 1.835332161055886e-06, "epoch": 8.895591301757522, "percentage": 88.96, "elapsed_time": "4:08:03", "remaining_time": "0:30:47", "throughput": 2314.77, "total_tokens": 34452872} {"current_steps": 59730, "total_steps": 67140, "loss": 0.5936, "lr": 1.832888851188319e-06, "epoch": 8.89633601429848, "percentage": 88.96, "elapsed_time": "4:08:05", "remaining_time": "0:30:46", "throughput": 2314.78, "total_tokens": 34455624} {"current_steps": 59735, "total_steps": 67140, "loss": 0.5594, "lr": 1.8304471068599365e-06, "epoch": 8.89708072683944, "percentage": 88.97, "elapsed_time": "4:08:06", "remaining_time": "0:30:45", "throughput": 2314.8, "total_tokens": 34458568} {"current_steps": 59740, "total_steps": 67140, "loss": 0.5553, "lr": 1.8280069282357342e-06, "epoch": 8.8978254393804, "percentage": 88.98, "elapsed_time": "4:08:07", "remaining_time": "0:30:44", "throughput": 2314.81, "total_tokens": 34461352} {"current_steps": 59745, "total_steps": 67140, "loss": 0.8773, "lr": 1.8255683154806163e-06, "epoch": 8.898570151921358, "percentage": 88.99, "elapsed_time": "4:08:08", "remaining_time": "0:30:42", "throughput": 2314.83, "total_tokens": 34464232} {"current_steps": 59750, "total_steps": 67140, "loss": 0.3897, "lr": 1.8231312687593677e-06, "epoch": 8.899314864462317, "percentage": 88.99, "elapsed_time": "4:08:09", "remaining_time": "0:30:41", "throughput": 2314.84, "total_tokens": 34467016} {"current_steps": 59755, "total_steps": 67140, "loss": 0.5744, "lr": 1.8206957882366788e-06, "epoch": 8.900059577003276, "percentage": 89.0, "elapsed_time": "4:08:10", "remaining_time": "0:30:40", "throughput": 2314.85, "total_tokens": 34469608} {"current_steps": 59760, "total_steps": 67140, "loss": 0.5031, "lr": 1.818261874077129e-06, "epoch": 8.900804289544237, "percentage": 89.01, "elapsed_time": "4:08:11", "remaining_time": "0:30:39", "throughput": 2314.87, "total_tokens": 34472648} {"current_steps": 59765, "total_steps": 67140, "loss": 0.4931, "lr": 1.8158295264451897e-06, "epoch": 8.901549002085195, "percentage": 89.02, "elapsed_time": "4:08:12", "remaining_time": "0:30:37", "throughput": 2314.9, "total_tokens": 34475752} {"current_steps": 59770, "total_steps": 67140, "loss": 0.4682, "lr": 1.813398745505235e-06, "epoch": 8.902293714626154, "percentage": 89.02, "elapsed_time": "4:08:14", "remaining_time": "0:30:36", "throughput": 2314.92, "total_tokens": 34478792} {"current_steps": 59775, "total_steps": 67140, "loss": 0.437, "lr": 1.8109695314215192e-06, "epoch": 8.903038427167113, "percentage": 89.03, "elapsed_time": "4:08:15", "remaining_time": "0:30:35", "throughput": 2314.94, "total_tokens": 34481800} {"current_steps": 59780, "total_steps": 67140, "loss": 0.7351, "lr": 1.8085418843582086e-06, "epoch": 8.903783139708073, "percentage": 89.04, "elapsed_time": "4:08:16", "remaining_time": "0:30:34", "throughput": 2314.97, "total_tokens": 34484840} {"current_steps": 59785, "total_steps": 67140, "loss": 0.7799, "lr": 1.8061158044793413e-06, "epoch": 8.904527852249032, "percentage": 89.05, "elapsed_time": "4:08:17", "remaining_time": "0:30:32", "throughput": 2314.99, "total_tokens": 34487720} {"current_steps": 59790, "total_steps": 67140, "loss": 0.4467, "lr": 1.8036912919488697e-06, "epoch": 8.90527256478999, "percentage": 89.05, "elapsed_time": "4:08:18", "remaining_time": "0:30:31", "throughput": 2315.01, "total_tokens": 34490760} {"current_steps": 59795, "total_steps": 67140, "loss": 0.6964, "lr": 1.8012683469306319e-06, "epoch": 8.90601727733095, "percentage": 89.06, "elapsed_time": "4:08:19", "remaining_time": "0:30:30", "throughput": 2315.03, "total_tokens": 34493608} {"current_steps": 59800, "total_steps": 67140, "loss": 0.617, "lr": 1.798846969588358e-06, "epoch": 8.90676198987191, "percentage": 89.07, "elapsed_time": "4:08:20", "remaining_time": "0:30:28", "throughput": 2315.03, "total_tokens": 34496232} {"current_steps": 59805, "total_steps": 67140, "loss": 0.5328, "lr": 1.7964271600856813e-06, "epoch": 8.907506702412869, "percentage": 89.08, "elapsed_time": "4:08:22", "remaining_time": "0:30:27", "throughput": 2315.05, "total_tokens": 34499080} {"current_steps": 59810, "total_steps": 67140, "loss": 0.7532, "lr": 1.7940089185861153e-06, "epoch": 8.908251414953828, "percentage": 89.08, "elapsed_time": "4:08:23", "remaining_time": "0:30:26", "throughput": 2315.07, "total_tokens": 34502088} {"current_steps": 59815, "total_steps": 67140, "loss": 0.5598, "lr": 1.7915922452530793e-06, "epoch": 8.908996127494786, "percentage": 89.09, "elapsed_time": "4:08:24", "remaining_time": "0:30:25", "throughput": 2315.1, "total_tokens": 34505320} {"current_steps": 59820, "total_steps": 67140, "loss": 0.4134, "lr": 1.7891771402498813e-06, "epoch": 8.909740840035747, "percentage": 89.1, "elapsed_time": "4:08:25", "remaining_time": "0:30:23", "throughput": 2315.12, "total_tokens": 34508328} {"current_steps": 59825, "total_steps": 67140, "loss": 0.6063, "lr": 1.7867636037397244e-06, "epoch": 8.910485552576706, "percentage": 89.1, "elapsed_time": "4:08:26", "remaining_time": "0:30:22", "throughput": 2315.14, "total_tokens": 34511080} {"current_steps": 59830, "total_steps": 67140, "loss": 0.4652, "lr": 1.7843516358857004e-06, "epoch": 8.911230265117664, "percentage": 89.11, "elapsed_time": "4:08:27", "remaining_time": "0:30:21", "throughput": 2315.15, "total_tokens": 34513800} {"current_steps": 59835, "total_steps": 67140, "loss": 0.547, "lr": 1.7819412368508064e-06, "epoch": 8.911974977658623, "percentage": 89.12, "elapsed_time": "4:08:28", "remaining_time": "0:30:20", "throughput": 2315.16, "total_tokens": 34516552} {"current_steps": 59840, "total_steps": 67140, "loss": 0.5962, "lr": 1.7795324067979318e-06, "epoch": 8.912719690199584, "percentage": 89.13, "elapsed_time": "4:08:30", "remaining_time": "0:30:18", "throughput": 2315.17, "total_tokens": 34519272} {"current_steps": 59845, "total_steps": 67140, "loss": 0.6878, "lr": 1.7771251458898436e-06, "epoch": 8.913464402740543, "percentage": 89.13, "elapsed_time": "4:08:31", "remaining_time": "0:30:17", "throughput": 2315.19, "total_tokens": 34522248} {"current_steps": 59850, "total_steps": 67140, "loss": 0.3585, "lr": 1.7747194542892226e-06, "epoch": 8.914209115281501, "percentage": 89.14, "elapsed_time": "4:08:32", "remaining_time": "0:30:16", "throughput": 2315.21, "total_tokens": 34525320} {"current_steps": 59855, "total_steps": 67140, "loss": 0.4957, "lr": 1.7723153321586305e-06, "epoch": 8.91495382782246, "percentage": 89.15, "elapsed_time": "4:08:33", "remaining_time": "0:30:15", "throughput": 2315.23, "total_tokens": 34528232} {"current_steps": 59860, "total_steps": 67140, "loss": 0.623, "lr": 1.7699127796605348e-06, "epoch": 8.915698540363419, "percentage": 89.16, "elapsed_time": "4:08:34", "remaining_time": "0:30:13", "throughput": 2315.26, "total_tokens": 34531368} {"current_steps": 59865, "total_steps": 67140, "loss": 0.4492, "lr": 1.7675117969572885e-06, "epoch": 8.91644325290438, "percentage": 89.16, "elapsed_time": "4:08:35", "remaining_time": "0:30:12", "throughput": 2315.28, "total_tokens": 34534280} {"current_steps": 59870, "total_steps": 67140, "loss": 0.8136, "lr": 1.7651123842111372e-06, "epoch": 8.917187965445338, "percentage": 89.17, "elapsed_time": "4:08:37", "remaining_time": "0:30:11", "throughput": 2315.31, "total_tokens": 34537480} {"current_steps": 59875, "total_steps": 67140, "loss": 0.5709, "lr": 1.7627145415842261e-06, "epoch": 8.917932677986297, "percentage": 89.18, "elapsed_time": "4:08:38", "remaining_time": "0:30:10", "throughput": 2315.32, "total_tokens": 34540296} {"current_steps": 59880, "total_steps": 67140, "loss": 0.6048, "lr": 1.7603182692385867e-06, "epoch": 8.918677390527257, "percentage": 89.19, "elapsed_time": "4:08:39", "remaining_time": "0:30:08", "throughput": 2315.33, "total_tokens": 34543048} {"current_steps": 59885, "total_steps": 67140, "loss": 0.4985, "lr": 1.7579235673361533e-06, "epoch": 8.919422103068216, "percentage": 89.19, "elapsed_time": "4:08:40", "remaining_time": "0:30:07", "throughput": 2315.37, "total_tokens": 34546312} {"current_steps": 59890, "total_steps": 67140, "loss": 0.4747, "lr": 1.755530436038752e-06, "epoch": 8.920166815609175, "percentage": 89.2, "elapsed_time": "4:08:41", "remaining_time": "0:30:06", "throughput": 2315.38, "total_tokens": 34549064} {"current_steps": 59895, "total_steps": 67140, "loss": 0.7472, "lr": 1.7531388755080951e-06, "epoch": 8.920911528150134, "percentage": 89.21, "elapsed_time": "4:08:42", "remaining_time": "0:30:05", "throughput": 2315.44, "total_tokens": 34553096} {"current_steps": 59900, "total_steps": 67140, "loss": 0.6203, "lr": 1.7507488859058035e-06, "epoch": 8.921656240691092, "percentage": 89.22, "elapsed_time": "4:08:44", "remaining_time": "0:30:03", "throughput": 2315.46, "total_tokens": 34556008} {"current_steps": 59905, "total_steps": 67140, "loss": 0.5505, "lr": 1.7483604673933756e-06, "epoch": 8.922400953232053, "percentage": 89.22, "elapsed_time": "4:08:45", "remaining_time": "0:30:02", "throughput": 2315.47, "total_tokens": 34558856} {"current_steps": 59910, "total_steps": 67140, "loss": 0.4576, "lr": 1.7459736201322158e-06, "epoch": 8.923145665773012, "percentage": 89.23, "elapsed_time": "4:08:46", "remaining_time": "0:30:01", "throughput": 2315.48, "total_tokens": 34561512} {"current_steps": 59915, "total_steps": 67140, "loss": 0.5902, "lr": 1.7435883442836086e-06, "epoch": 8.92389037831397, "percentage": 89.24, "elapsed_time": "4:08:47", "remaining_time": "0:30:00", "throughput": 2315.51, "total_tokens": 34564648} {"current_steps": 59920, "total_steps": 67140, "loss": 0.55, "lr": 1.7412046400087505e-06, "epoch": 8.92463509085493, "percentage": 89.25, "elapsed_time": "4:08:48", "remaining_time": "0:29:58", "throughput": 2315.52, "total_tokens": 34567432} {"current_steps": 59925, "total_steps": 67140, "loss": 0.4835, "lr": 1.7388225074687182e-06, "epoch": 8.92537980339589, "percentage": 89.25, "elapsed_time": "4:08:49", "remaining_time": "0:29:57", "throughput": 2315.53, "total_tokens": 34570152} {"current_steps": 59930, "total_steps": 67140, "loss": 0.4253, "lr": 1.736441946824488e-06, "epoch": 8.926124515936849, "percentage": 89.26, "elapsed_time": "4:08:50", "remaining_time": "0:29:56", "throughput": 2315.54, "total_tokens": 34572840} {"current_steps": 59935, "total_steps": 67140, "loss": 0.4966, "lr": 1.7340629582369316e-06, "epoch": 8.926869228477807, "percentage": 89.27, "elapsed_time": "4:08:51", "remaining_time": "0:29:55", "throughput": 2315.56, "total_tokens": 34575880} {"current_steps": 59940, "total_steps": 67140, "loss": 0.6025, "lr": 1.7316855418668038e-06, "epoch": 8.927613941018766, "percentage": 89.28, "elapsed_time": "4:08:53", "remaining_time": "0:29:53", "throughput": 2315.6, "total_tokens": 34579176} {"current_steps": 59945, "total_steps": 67140, "loss": 0.7317, "lr": 1.7293096978747703e-06, "epoch": 8.928358653559727, "percentage": 89.28, "elapsed_time": "4:08:54", "remaining_time": "0:29:52", "throughput": 2315.61, "total_tokens": 34581864} {"current_steps": 59950, "total_steps": 67140, "loss": 0.6694, "lr": 1.7269354264213694e-06, "epoch": 8.929103366100685, "percentage": 89.29, "elapsed_time": "4:08:55", "remaining_time": "0:29:51", "throughput": 2315.63, "total_tokens": 34584840} {"current_steps": 59955, "total_steps": 67140, "loss": 0.6805, "lr": 1.7245627276670535e-06, "epoch": 8.929848078641644, "percentage": 89.3, "elapsed_time": "4:08:56", "remaining_time": "0:29:49", "throughput": 2315.65, "total_tokens": 34587816} {"current_steps": 59960, "total_steps": 67140, "loss": 0.8479, "lr": 1.722191601772158e-06, "epoch": 8.930592791182603, "percentage": 89.31, "elapsed_time": "4:08:57", "remaining_time": "0:29:48", "throughput": 2315.67, "total_tokens": 34590792} {"current_steps": 59965, "total_steps": 67140, "loss": 0.6649, "lr": 1.7198220488969102e-06, "epoch": 8.931337503723563, "percentage": 89.31, "elapsed_time": "4:08:58", "remaining_time": "0:29:47", "throughput": 2315.69, "total_tokens": 34593640} {"current_steps": 59970, "total_steps": 67140, "loss": 0.4677, "lr": 1.7174540692014435e-06, "epoch": 8.932082216264522, "percentage": 89.32, "elapsed_time": "4:08:59", "remaining_time": "0:29:46", "throughput": 2315.69, "total_tokens": 34596232} {"current_steps": 59975, "total_steps": 67140, "loss": 0.6181, "lr": 1.7150876628457686e-06, "epoch": 8.932826928805481, "percentage": 89.33, "elapsed_time": "4:09:01", "remaining_time": "0:29:44", "throughput": 2315.69, "total_tokens": 34598792} {"current_steps": 59980, "total_steps": 67140, "loss": 0.6504, "lr": 1.7127228299897991e-06, "epoch": 8.93357164134644, "percentage": 89.34, "elapsed_time": "4:09:02", "remaining_time": "0:29:43", "throughput": 2315.71, "total_tokens": 34601704} {"current_steps": 59985, "total_steps": 67140, "loss": 0.6553, "lr": 1.7103595707933434e-06, "epoch": 8.9343163538874, "percentage": 89.34, "elapsed_time": "4:09:03", "remaining_time": "0:29:42", "throughput": 2315.72, "total_tokens": 34604392} {"current_steps": 59990, "total_steps": 67140, "loss": 0.5925, "lr": 1.707997885416096e-06, "epoch": 8.935061066428359, "percentage": 89.35, "elapsed_time": "4:09:04", "remaining_time": "0:29:41", "throughput": 2315.73, "total_tokens": 34607080} {"current_steps": 59995, "total_steps": 67140, "loss": 0.7789, "lr": 1.7056377740176543e-06, "epoch": 8.935805778969318, "percentage": 89.36, "elapsed_time": "4:09:05", "remaining_time": "0:29:39", "throughput": 2315.75, "total_tokens": 34609928} {"current_steps": 60000, "total_steps": 67140, "loss": 0.5172, "lr": 1.7032792367575047e-06, "epoch": 8.936550491510276, "percentage": 89.37, "elapsed_time": "4:09:06", "remaining_time": "0:29:38", "throughput": 2315.76, "total_tokens": 34612712} {"current_steps": 60005, "total_steps": 67140, "loss": 0.3764, "lr": 1.7009222737950276e-06, "epoch": 8.937295204051237, "percentage": 89.37, "elapsed_time": "4:09:07", "remaining_time": "0:29:37", "throughput": 2315.77, "total_tokens": 34615464} {"current_steps": 60010, "total_steps": 67140, "loss": 0.4118, "lr": 1.698566885289496e-06, "epoch": 8.938039916592196, "percentage": 89.38, "elapsed_time": "4:09:08", "remaining_time": "0:29:36", "throughput": 2315.78, "total_tokens": 34618248} {"current_steps": 60015, "total_steps": 67140, "loss": 0.6111, "lr": 1.696213071400074e-06, "epoch": 8.938784629133155, "percentage": 89.39, "elapsed_time": "4:09:09", "remaining_time": "0:29:34", "throughput": 2315.8, "total_tokens": 34621096} {"current_steps": 60020, "total_steps": 67140, "loss": 0.5128, "lr": 1.693860832285829e-06, "epoch": 8.939529341674113, "percentage": 89.4, "elapsed_time": "4:09:11", "remaining_time": "0:29:33", "throughput": 2315.83, "total_tokens": 34624296} {"current_steps": 60025, "total_steps": 67140, "loss": 0.436, "lr": 1.6915101681057144e-06, "epoch": 8.940274054215074, "percentage": 89.4, "elapsed_time": "4:09:12", "remaining_time": "0:29:32", "throughput": 2315.84, "total_tokens": 34627048} {"current_steps": 60030, "total_steps": 67140, "loss": 0.4207, "lr": 1.6891610790185752e-06, "epoch": 8.941018766756033, "percentage": 89.41, "elapsed_time": "4:09:13", "remaining_time": "0:29:31", "throughput": 2315.86, "total_tokens": 34629928} {"current_steps": 60035, "total_steps": 67140, "loss": 0.6819, "lr": 1.686813565183154e-06, "epoch": 8.941763479296991, "percentage": 89.42, "elapsed_time": "4:09:14", "remaining_time": "0:29:29", "throughput": 2315.89, "total_tokens": 34633224} {"current_steps": 60040, "total_steps": 67140, "loss": 0.616, "lr": 1.6844676267580932e-06, "epoch": 8.94250819183795, "percentage": 89.43, "elapsed_time": "4:09:15", "remaining_time": "0:29:28", "throughput": 2315.91, "total_tokens": 34636200} {"current_steps": 60045, "total_steps": 67140, "loss": 0.6531, "lr": 1.6821232639019107e-06, "epoch": 8.943252904378909, "percentage": 89.43, "elapsed_time": "4:09:16", "remaining_time": "0:29:27", "throughput": 2315.94, "total_tokens": 34639208} {"current_steps": 60050, "total_steps": 67140, "loss": 0.6102, "lr": 1.6797804767730352e-06, "epoch": 8.94399761691987, "percentage": 89.44, "elapsed_time": "4:09:18", "remaining_time": "0:29:26", "throughput": 2315.94, "total_tokens": 34641928} {"current_steps": 60055, "total_steps": 67140, "loss": 0.5985, "lr": 1.6774392655297817e-06, "epoch": 8.944742329460828, "percentage": 89.45, "elapsed_time": "4:09:19", "remaining_time": "0:29:24", "throughput": 2315.95, "total_tokens": 34644616} {"current_steps": 60060, "total_steps": 67140, "loss": 0.685, "lr": 1.6750996303303596e-06, "epoch": 8.945487042001787, "percentage": 89.45, "elapsed_time": "4:09:20", "remaining_time": "0:29:23", "throughput": 2315.98, "total_tokens": 34647656} {"current_steps": 60065, "total_steps": 67140, "loss": 0.6202, "lr": 1.6727615713328788e-06, "epoch": 8.946231754542747, "percentage": 89.46, "elapsed_time": "4:09:21", "remaining_time": "0:29:22", "throughput": 2316.0, "total_tokens": 34650664} {"current_steps": 60070, "total_steps": 67140, "loss": 0.6443, "lr": 1.670425088695321e-06, "epoch": 8.946976467083706, "percentage": 89.47, "elapsed_time": "4:09:22", "remaining_time": "0:29:21", "throughput": 2316.02, "total_tokens": 34653608} {"current_steps": 60075, "total_steps": 67140, "loss": 0.5249, "lr": 1.6680901825755908e-06, "epoch": 8.947721179624665, "percentage": 89.48, "elapsed_time": "4:09:23", "remaining_time": "0:29:19", "throughput": 2316.04, "total_tokens": 34656584} {"current_steps": 60080, "total_steps": 67140, "loss": 0.6776, "lr": 1.6657568531314615e-06, "epoch": 8.948465892165624, "percentage": 89.48, "elapsed_time": "4:09:24", "remaining_time": "0:29:18", "throughput": 2316.05, "total_tokens": 34659208} {"current_steps": 60085, "total_steps": 67140, "loss": 0.5909, "lr": 1.663425100520616e-06, "epoch": 8.949210604706582, "percentage": 89.49, "elapsed_time": "4:09:25", "remaining_time": "0:29:17", "throughput": 2316.05, "total_tokens": 34661864} {"current_steps": 60090, "total_steps": 67140, "loss": 0.7906, "lr": 1.661094924900619e-06, "epoch": 8.949955317247543, "percentage": 89.5, "elapsed_time": "4:09:27", "remaining_time": "0:29:15", "throughput": 2316.08, "total_tokens": 34665000} {"current_steps": 60095, "total_steps": 67140, "loss": 0.543, "lr": 1.65876632642894e-06, "epoch": 8.950700029788502, "percentage": 89.51, "elapsed_time": "4:09:28", "remaining_time": "0:29:14", "throughput": 2316.1, "total_tokens": 34667848} {"current_steps": 60100, "total_steps": 67140, "loss": 0.5994, "lr": 1.6564393052629384e-06, "epoch": 8.95144474232946, "percentage": 89.51, "elapsed_time": "4:09:29", "remaining_time": "0:29:13", "throughput": 2316.11, "total_tokens": 34670792} {"current_steps": 60105, "total_steps": 67140, "loss": 0.5074, "lr": 1.6541138615598585e-06, "epoch": 8.95218945487042, "percentage": 89.52, "elapsed_time": "4:09:30", "remaining_time": "0:29:12", "throughput": 2316.12, "total_tokens": 34673416} {"current_steps": 60110, "total_steps": 67140, "loss": 0.5224, "lr": 1.6517899954768434e-06, "epoch": 8.95293416741138, "percentage": 89.53, "elapsed_time": "4:09:31", "remaining_time": "0:29:10", "throughput": 2316.13, "total_tokens": 34676232} {"current_steps": 60115, "total_steps": 67140, "loss": 0.6109, "lr": 1.6494677071709347e-06, "epoch": 8.953678879952339, "percentage": 89.54, "elapsed_time": "4:09:32", "remaining_time": "0:29:09", "throughput": 2316.15, "total_tokens": 34679048} {"current_steps": 60120, "total_steps": 67140, "loss": 0.7743, "lr": 1.6471469967990622e-06, "epoch": 8.954423592493297, "percentage": 89.54, "elapsed_time": "4:09:33", "remaining_time": "0:29:08", "throughput": 2316.17, "total_tokens": 34681992} {"current_steps": 60125, "total_steps": 67140, "loss": 0.8659, "lr": 1.6448278645180477e-06, "epoch": 8.955168305034256, "percentage": 89.55, "elapsed_time": "4:09:34", "remaining_time": "0:29:07", "throughput": 2316.18, "total_tokens": 34684776} {"current_steps": 60130, "total_steps": 67140, "loss": 0.5815, "lr": 1.6425103104846128e-06, "epoch": 8.955913017575217, "percentage": 89.56, "elapsed_time": "4:09:36", "remaining_time": "0:29:05", "throughput": 2316.19, "total_tokens": 34687528} {"current_steps": 60135, "total_steps": 67140, "loss": 0.5495, "lr": 1.6401943348553688e-06, "epoch": 8.956657730116175, "percentage": 89.57, "elapsed_time": "4:09:37", "remaining_time": "0:29:04", "throughput": 2316.21, "total_tokens": 34690600} {"current_steps": 60140, "total_steps": 67140, "loss": 0.5294, "lr": 1.6378799377868155e-06, "epoch": 8.957402442657134, "percentage": 89.57, "elapsed_time": "4:09:38", "remaining_time": "0:29:03", "throughput": 2316.23, "total_tokens": 34693448} {"current_steps": 60145, "total_steps": 67140, "loss": 0.5779, "lr": 1.635567119435355e-06, "epoch": 8.958147155198093, "percentage": 89.58, "elapsed_time": "4:09:39", "remaining_time": "0:29:02", "throughput": 2316.25, "total_tokens": 34696520} {"current_steps": 60150, "total_steps": 67140, "loss": 0.5338, "lr": 1.6332558799572711e-06, "epoch": 8.958891867739053, "percentage": 89.59, "elapsed_time": "4:09:40", "remaining_time": "0:29:00", "throughput": 2316.26, "total_tokens": 34699240} {"current_steps": 60155, "total_steps": 67140, "loss": 0.589, "lr": 1.6309462195087555e-06, "epoch": 8.959636580280012, "percentage": 89.6, "elapsed_time": "4:09:41", "remaining_time": "0:28:59", "throughput": 2316.29, "total_tokens": 34702248} {"current_steps": 60160, "total_steps": 67140, "loss": 0.8711, "lr": 1.6286381382458803e-06, "epoch": 8.960381292820971, "percentage": 89.6, "elapsed_time": "4:09:43", "remaining_time": "0:28:58", "throughput": 2316.31, "total_tokens": 34705384} {"current_steps": 60165, "total_steps": 67140, "loss": 0.532, "lr": 1.6263316363246184e-06, "epoch": 8.96112600536193, "percentage": 89.61, "elapsed_time": "4:09:44", "remaining_time": "0:28:57", "throughput": 2316.33, "total_tokens": 34708168} {"current_steps": 60170, "total_steps": 67140, "loss": 0.3414, "lr": 1.624026713900839e-06, "epoch": 8.96187071790289, "percentage": 89.62, "elapsed_time": "4:09:45", "remaining_time": "0:28:55", "throughput": 2316.35, "total_tokens": 34711080} {"current_steps": 60175, "total_steps": 67140, "loss": 0.6088, "lr": 1.6217233711302904e-06, "epoch": 8.962615430443849, "percentage": 89.63, "elapsed_time": "4:09:46", "remaining_time": "0:28:54", "throughput": 2316.37, "total_tokens": 34714184} {"current_steps": 60180, "total_steps": 67140, "loss": 0.6179, "lr": 1.619421608168628e-06, "epoch": 8.963360142984808, "percentage": 89.63, "elapsed_time": "4:09:47", "remaining_time": "0:28:53", "throughput": 2316.39, "total_tokens": 34717000} {"current_steps": 60185, "total_steps": 67140, "loss": 0.8394, "lr": 1.6171214251713974e-06, "epoch": 8.964104855525767, "percentage": 89.64, "elapsed_time": "4:09:48", "remaining_time": "0:28:52", "throughput": 2316.4, "total_tokens": 34719816} {"current_steps": 60190, "total_steps": 67140, "loss": 0.5975, "lr": 1.6148228222940292e-06, "epoch": 8.964849568066727, "percentage": 89.65, "elapsed_time": "4:09:49", "remaining_time": "0:28:50", "throughput": 2316.4, "total_tokens": 34722376} {"current_steps": 60195, "total_steps": 67140, "loss": 0.4086, "lr": 1.6125257996918609e-06, "epoch": 8.965594280607686, "percentage": 89.66, "elapsed_time": "4:09:50", "remaining_time": "0:28:49", "throughput": 2316.41, "total_tokens": 34725128} {"current_steps": 60200, "total_steps": 67140, "loss": 0.5655, "lr": 1.6102303575201095e-06, "epoch": 8.966338993148645, "percentage": 89.66, "elapsed_time": "4:09:52", "remaining_time": "0:28:48", "throughput": 2316.45, "total_tokens": 34728392} {"current_steps": 60205, "total_steps": 67140, "loss": 0.4413, "lr": 1.6079364959338983e-06, "epoch": 8.967083705689603, "percentage": 89.67, "elapsed_time": "4:09:53", "remaining_time": "0:28:47", "throughput": 2316.45, "total_tokens": 34730984} {"current_steps": 60210, "total_steps": 67140, "loss": 0.6033, "lr": 1.6056442150882283e-06, "epoch": 8.967828418230564, "percentage": 89.68, "elapsed_time": "4:09:54", "remaining_time": "0:28:45", "throughput": 2316.47, "total_tokens": 34733864} {"current_steps": 60215, "total_steps": 67140, "loss": 0.7252, "lr": 1.6033535151380092e-06, "epoch": 8.968573130771523, "percentage": 89.69, "elapsed_time": "4:09:55", "remaining_time": "0:28:44", "throughput": 2316.48, "total_tokens": 34736584} {"current_steps": 60220, "total_steps": 67140, "loss": 0.509, "lr": 1.6010643962380362e-06, "epoch": 8.969317843312481, "percentage": 89.69, "elapsed_time": "4:09:56", "remaining_time": "0:28:43", "throughput": 2316.5, "total_tokens": 34739496} {"current_steps": 60225, "total_steps": 67140, "loss": 0.8502, "lr": 1.5987768585430025e-06, "epoch": 8.97006255585344, "percentage": 89.7, "elapsed_time": "4:09:57", "remaining_time": "0:28:42", "throughput": 2316.5, "total_tokens": 34742184} {"current_steps": 60230, "total_steps": 67140, "loss": 0.5281, "lr": 1.5964909022074815e-06, "epoch": 8.970807268394399, "percentage": 89.71, "elapsed_time": "4:09:58", "remaining_time": "0:28:40", "throughput": 2316.52, "total_tokens": 34745128} {"current_steps": 60235, "total_steps": 67140, "loss": 0.4491, "lr": 1.5942065273859552e-06, "epoch": 8.97155198093536, "percentage": 89.72, "elapsed_time": "4:09:59", "remaining_time": "0:28:39", "throughput": 2316.54, "total_tokens": 34748072} {"current_steps": 60240, "total_steps": 67140, "loss": 0.7975, "lr": 1.591923734232792e-06, "epoch": 8.972296693476318, "percentage": 89.72, "elapsed_time": "4:10:01", "remaining_time": "0:28:38", "throughput": 2316.55, "total_tokens": 34750792} {"current_steps": 60245, "total_steps": 67140, "loss": 0.5863, "lr": 1.5896425229022488e-06, "epoch": 8.973041406017277, "percentage": 89.73, "elapsed_time": "4:10:02", "remaining_time": "0:28:36", "throughput": 2316.56, "total_tokens": 34753480} {"current_steps": 60250, "total_steps": 67140, "loss": 0.563, "lr": 1.5873628935484858e-06, "epoch": 8.973786118558236, "percentage": 89.74, "elapsed_time": "4:10:03", "remaining_time": "0:28:35", "throughput": 2316.58, "total_tokens": 34756424} {"current_steps": 60255, "total_steps": 67140, "loss": 0.5856, "lr": 1.585084846325549e-06, "epoch": 8.974530831099196, "percentage": 89.75, "elapsed_time": "4:10:04", "remaining_time": "0:28:34", "throughput": 2316.58, "total_tokens": 34759112} {"current_steps": 60260, "total_steps": 67140, "loss": 0.5473, "lr": 1.5828083813873824e-06, "epoch": 8.975275543640155, "percentage": 89.75, "elapsed_time": "4:10:05", "remaining_time": "0:28:33", "throughput": 2316.6, "total_tokens": 34762056} {"current_steps": 60265, "total_steps": 67140, "loss": 0.5091, "lr": 1.580533498887818e-06, "epoch": 8.976020256181114, "percentage": 89.76, "elapsed_time": "4:10:06", "remaining_time": "0:28:31", "throughput": 2316.61, "total_tokens": 34764808} {"current_steps": 60270, "total_steps": 67140, "loss": 0.5987, "lr": 1.5782601989805857e-06, "epoch": 8.976764968722073, "percentage": 89.77, "elapsed_time": "4:10:07", "remaining_time": "0:28:30", "throughput": 2316.62, "total_tokens": 34767528} {"current_steps": 60275, "total_steps": 67140, "loss": 0.5621, "lr": 1.5759884818192988e-06, "epoch": 8.977509681263033, "percentage": 89.78, "elapsed_time": "4:10:09", "remaining_time": "0:28:29", "throughput": 2316.57, "total_tokens": 34770472} {"current_steps": 60280, "total_steps": 67140, "loss": 0.4052, "lr": 1.5737183475574762e-06, "epoch": 8.978254393803992, "percentage": 89.78, "elapsed_time": "4:10:10", "remaining_time": "0:28:28", "throughput": 2316.58, "total_tokens": 34773192} {"current_steps": 60285, "total_steps": 67140, "loss": 0.5281, "lr": 1.5714497963485203e-06, "epoch": 8.97899910634495, "percentage": 89.79, "elapsed_time": "4:10:11", "remaining_time": "0:28:26", "throughput": 2316.59, "total_tokens": 34775880} {"current_steps": 60290, "total_steps": 67140, "loss": 0.5112, "lr": 1.569182828345736e-06, "epoch": 8.97974381888591, "percentage": 89.8, "elapsed_time": "4:10:12", "remaining_time": "0:28:25", "throughput": 2316.6, "total_tokens": 34778600} {"current_steps": 60295, "total_steps": 67140, "loss": 0.4643, "lr": 1.5669174437023149e-06, "epoch": 8.98048853142687, "percentage": 89.8, "elapsed_time": "4:10:13", "remaining_time": "0:28:24", "throughput": 2316.61, "total_tokens": 34781512} {"current_steps": 60300, "total_steps": 67140, "loss": 0.5058, "lr": 1.5646536425713426e-06, "epoch": 8.981233243967829, "percentage": 89.81, "elapsed_time": "4:10:15", "remaining_time": "0:28:23", "throughput": 2316.64, "total_tokens": 34784680} {"current_steps": 60305, "total_steps": 67140, "loss": 0.3266, "lr": 1.5623914251057942e-06, "epoch": 8.981977956508787, "percentage": 89.82, "elapsed_time": "4:10:16", "remaining_time": "0:28:21", "throughput": 2316.66, "total_tokens": 34787560} {"current_steps": 60310, "total_steps": 67140, "loss": 0.6672, "lr": 1.5601307914585416e-06, "epoch": 8.982722669049746, "percentage": 89.83, "elapsed_time": "4:10:17", "remaining_time": "0:28:20", "throughput": 2316.67, "total_tokens": 34790344} {"current_steps": 60315, "total_steps": 67140, "loss": 0.5411, "lr": 1.5578717417823518e-06, "epoch": 8.983467381590707, "percentage": 89.83, "elapsed_time": "4:10:18", "remaining_time": "0:28:19", "throughput": 2316.68, "total_tokens": 34793096} {"current_steps": 60320, "total_steps": 67140, "loss": 0.6762, "lr": 1.5556142762298776e-06, "epoch": 8.984212094131665, "percentage": 89.84, "elapsed_time": "4:10:19", "remaining_time": "0:28:18", "throughput": 2316.69, "total_tokens": 34795912} {"current_steps": 60325, "total_steps": 67140, "loss": 0.6211, "lr": 1.5533583949536745e-06, "epoch": 8.984956806672624, "percentage": 89.85, "elapsed_time": "4:10:20", "remaining_time": "0:28:16", "throughput": 2316.73, "total_tokens": 34799112} {"current_steps": 60330, "total_steps": 67140, "loss": 0.5157, "lr": 1.5511040981061848e-06, "epoch": 8.985701519213583, "percentage": 89.86, "elapsed_time": "4:10:21", "remaining_time": "0:28:15", "throughput": 2316.74, "total_tokens": 34801832} {"current_steps": 60335, "total_steps": 67140, "loss": 0.5317, "lr": 1.5488513858397475e-06, "epoch": 8.986446231754543, "percentage": 89.86, "elapsed_time": "4:10:23", "remaining_time": "0:28:14", "throughput": 2316.76, "total_tokens": 34804808} {"current_steps": 60340, "total_steps": 67140, "loss": 0.7576, "lr": 1.5466002583065825e-06, "epoch": 8.987190944295502, "percentage": 89.87, "elapsed_time": "4:10:24", "remaining_time": "0:28:13", "throughput": 2316.77, "total_tokens": 34807688} {"current_steps": 60345, "total_steps": 67140, "loss": 0.4426, "lr": 1.544350715658821e-06, "epoch": 8.987935656836461, "percentage": 89.88, "elapsed_time": "4:10:25", "remaining_time": "0:28:11", "throughput": 2316.8, "total_tokens": 34810696} {"current_steps": 60350, "total_steps": 67140, "loss": 0.6207, "lr": 1.542102758048472e-06, "epoch": 8.98868036937742, "percentage": 89.89, "elapsed_time": "4:10:26", "remaining_time": "0:28:10", "throughput": 2316.82, "total_tokens": 34813640} {"current_steps": 60355, "total_steps": 67140, "loss": 0.8469, "lr": 1.5398563856274472e-06, "epoch": 8.98942508191838, "percentage": 89.89, "elapsed_time": "4:10:27", "remaining_time": "0:28:09", "throughput": 2316.83, "total_tokens": 34816520} {"current_steps": 60360, "total_steps": 67140, "loss": 0.6652, "lr": 1.5376115985475448e-06, "epoch": 8.990169794459339, "percentage": 89.9, "elapsed_time": "4:10:28", "remaining_time": "0:28:08", "throughput": 2316.84, "total_tokens": 34819144} {"current_steps": 60365, "total_steps": 67140, "loss": 0.6422, "lr": 1.535368396960457e-06, "epoch": 8.990914507000298, "percentage": 89.91, "elapsed_time": "4:10:29", "remaining_time": "0:28:06", "throughput": 2316.85, "total_tokens": 34821928} {"current_steps": 60370, "total_steps": 67140, "loss": 0.5667, "lr": 1.5331267810177797e-06, "epoch": 8.991659219541257, "percentage": 89.92, "elapsed_time": "4:10:30", "remaining_time": "0:28:05", "throughput": 2316.86, "total_tokens": 34824712} {"current_steps": 60375, "total_steps": 67140, "loss": 0.5405, "lr": 1.53088675087098e-06, "epoch": 8.992403932082215, "percentage": 89.92, "elapsed_time": "4:10:32", "remaining_time": "0:28:04", "throughput": 2316.88, "total_tokens": 34827592} {"current_steps": 60380, "total_steps": 67140, "loss": 0.434, "lr": 1.5286483066714347e-06, "epoch": 8.993148644623176, "percentage": 89.93, "elapsed_time": "4:10:33", "remaining_time": "0:28:03", "throughput": 2316.9, "total_tokens": 34830600} {"current_steps": 60385, "total_steps": 67140, "loss": 0.6811, "lr": 1.526411448570414e-06, "epoch": 8.993893357164135, "percentage": 89.94, "elapsed_time": "4:10:34", "remaining_time": "0:28:01", "throughput": 2316.92, "total_tokens": 34833416} {"current_steps": 60390, "total_steps": 67140, "loss": 0.6056, "lr": 1.5241761767190665e-06, "epoch": 8.994638069705093, "percentage": 89.95, "elapsed_time": "4:10:35", "remaining_time": "0:28:00", "throughput": 2316.92, "total_tokens": 34836104} {"current_steps": 60395, "total_steps": 67140, "loss": 0.8914, "lr": 1.5219424912684494e-06, "epoch": 8.995382782246054, "percentage": 89.95, "elapsed_time": "4:10:36", "remaining_time": "0:27:59", "throughput": 2316.94, "total_tokens": 34839048} {"current_steps": 60400, "total_steps": 67140, "loss": 0.594, "lr": 1.5197103923695e-06, "epoch": 8.996127494787013, "percentage": 89.96, "elapsed_time": "4:10:37", "remaining_time": "0:27:58", "throughput": 2316.96, "total_tokens": 34841832} {"current_steps": 60405, "total_steps": 67140, "loss": 0.634, "lr": 1.5174798801730644e-06, "epoch": 8.996872207327971, "percentage": 89.97, "elapsed_time": "4:10:38", "remaining_time": "0:27:56", "throughput": 2316.97, "total_tokens": 34844584} {"current_steps": 60410, "total_steps": 67140, "loss": 0.5215, "lr": 1.5152509548298639e-06, "epoch": 8.99761691986893, "percentage": 89.98, "elapsed_time": "4:10:40", "remaining_time": "0:27:55", "throughput": 2317.0, "total_tokens": 34847880} {"current_steps": 60415, "total_steps": 67140, "loss": 0.777, "lr": 1.5130236164905192e-06, "epoch": 8.998361632409889, "percentage": 89.98, "elapsed_time": "4:10:41", "remaining_time": "0:27:54", "throughput": 2317.02, "total_tokens": 34850984} {"current_steps": 60420, "total_steps": 67140, "loss": 0.6147, "lr": 1.5107978653055466e-06, "epoch": 8.99910634495085, "percentage": 89.99, "elapsed_time": "4:10:42", "remaining_time": "0:27:53", "throughput": 2317.04, "total_tokens": 34853736} {"current_steps": 60425, "total_steps": 67140, "loss": 0.465, "lr": 1.5085737014253586e-06, "epoch": 8.999851057491808, "percentage": 90.0, "elapsed_time": "4:10:43", "remaining_time": "0:27:51", "throughput": 2317.05, "total_tokens": 34856584} {"current_steps": 60426, "total_steps": 67140, "eval_loss": 0.6799556016921997, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "4:11:57", "remaining_time": "0:27:59", "throughput": 2305.65, "total_tokens": 34856680} {"current_steps": 60430, "total_steps": 67140, "loss": 0.6018, "lr": 1.5063511250002466e-06, "epoch": 9.000595770032767, "percentage": 90.01, "elapsed_time": "4:12:00", "remaining_time": "0:27:58", "throughput": 2305.37, "total_tokens": 34859112} {"current_steps": 60435, "total_steps": 67140, "loss": 0.4742, "lr": 1.5041301361804123e-06, "epoch": 9.001340482573726, "percentage": 90.01, "elapsed_time": "4:12:01", "remaining_time": "0:27:57", "throughput": 2305.39, "total_tokens": 34862024} {"current_steps": 60440, "total_steps": 67140, "loss": 0.5398, "lr": 1.5019107351159328e-06, "epoch": 9.002085195114686, "percentage": 90.02, "elapsed_time": "4:12:03", "remaining_time": "0:27:56", "throughput": 2305.43, "total_tokens": 34865224} {"current_steps": 60445, "total_steps": 67140, "loss": 0.5959, "lr": 1.4996929219567884e-06, "epoch": 9.002829907655645, "percentage": 90.03, "elapsed_time": "4:12:04", "remaining_time": "0:27:55", "throughput": 2305.46, "total_tokens": 34868520} {"current_steps": 60450, "total_steps": 67140, "loss": 0.5901, "lr": 1.4974766968528508e-06, "epoch": 9.003574620196604, "percentage": 90.04, "elapsed_time": "4:12:05", "remaining_time": "0:27:53", "throughput": 2305.48, "total_tokens": 34871400} {"current_steps": 60455, "total_steps": 67140, "loss": 0.5162, "lr": 1.4952620599538864e-06, "epoch": 9.004319332737563, "percentage": 90.04, "elapsed_time": "4:12:06", "remaining_time": "0:27:52", "throughput": 2305.5, "total_tokens": 34874344} {"current_steps": 60460, "total_steps": 67140, "loss": 0.5449, "lr": 1.4930490114095446e-06, "epoch": 9.005064045278523, "percentage": 90.05, "elapsed_time": "4:12:07", "remaining_time": "0:27:51", "throughput": 2305.51, "total_tokens": 34877064} {"current_steps": 60465, "total_steps": 67140, "loss": 0.5033, "lr": 1.490837551369384e-06, "epoch": 9.005808757819482, "percentage": 90.06, "elapsed_time": "4:12:08", "remaining_time": "0:27:50", "throughput": 2305.53, "total_tokens": 34880008} {"current_steps": 60470, "total_steps": 67140, "loss": 0.6758, "lr": 1.4886276799828402e-06, "epoch": 9.00655347036044, "percentage": 90.07, "elapsed_time": "4:12:09", "remaining_time": "0:27:48", "throughput": 2305.54, "total_tokens": 34882824} {"current_steps": 60475, "total_steps": 67140, "loss": 0.3898, "lr": 1.4864193973992441e-06, "epoch": 9.0072981829014, "percentage": 90.07, "elapsed_time": "4:12:11", "remaining_time": "0:27:47", "throughput": 2305.56, "total_tokens": 34885736} {"current_steps": 60480, "total_steps": 67140, "loss": 0.5228, "lr": 1.484212703767826e-06, "epoch": 9.00804289544236, "percentage": 90.08, "elapsed_time": "4:12:12", "remaining_time": "0:27:46", "throughput": 2305.59, "total_tokens": 34888904} {"current_steps": 60485, "total_steps": 67140, "loss": 0.5813, "lr": 1.482007599237706e-06, "epoch": 9.008787607983319, "percentage": 90.09, "elapsed_time": "4:12:13", "remaining_time": "0:27:45", "throughput": 2305.61, "total_tokens": 34891816} {"current_steps": 60490, "total_steps": 67140, "loss": 0.7235, "lr": 1.4798040839578946e-06, "epoch": 9.009532320524277, "percentage": 90.1, "elapsed_time": "4:12:14", "remaining_time": "0:27:43", "throughput": 2305.63, "total_tokens": 34894664} {"current_steps": 60495, "total_steps": 67140, "loss": 0.3818, "lr": 1.4776021580772958e-06, "epoch": 9.010277033065236, "percentage": 90.1, "elapsed_time": "4:12:15", "remaining_time": "0:27:42", "throughput": 2305.64, "total_tokens": 34897448} {"current_steps": 60500, "total_steps": 67140, "loss": 0.4924, "lr": 1.4754018217447125e-06, "epoch": 9.011021745606197, "percentage": 90.11, "elapsed_time": "4:12:16", "remaining_time": "0:27:41", "throughput": 2305.65, "total_tokens": 34900264} {"current_steps": 60505, "total_steps": 67140, "loss": 0.4275, "lr": 1.4732030751088255e-06, "epoch": 9.011766458147155, "percentage": 90.12, "elapsed_time": "4:12:17", "remaining_time": "0:27:40", "throughput": 2305.66, "total_tokens": 34902952} {"current_steps": 60510, "total_steps": 67140, "loss": 0.6031, "lr": 1.4710059183182274e-06, "epoch": 9.012511170688114, "percentage": 90.13, "elapsed_time": "4:12:19", "remaining_time": "0:27:38", "throughput": 2305.67, "total_tokens": 34905704} {"current_steps": 60515, "total_steps": 67140, "loss": 0.5243, "lr": 1.4688103515213824e-06, "epoch": 9.013255883229073, "percentage": 90.13, "elapsed_time": "4:12:20", "remaining_time": "0:27:37", "throughput": 2305.7, "total_tokens": 34908808} {"current_steps": 60520, "total_steps": 67140, "loss": 0.6775, "lr": 1.466616374866664e-06, "epoch": 9.014000595770034, "percentage": 90.14, "elapsed_time": "4:12:21", "remaining_time": "0:27:36", "throughput": 2305.72, "total_tokens": 34911656} {"current_steps": 60525, "total_steps": 67140, "loss": 0.4624, "lr": 1.4644239885023309e-06, "epoch": 9.014745308310992, "percentage": 90.15, "elapsed_time": "4:12:22", "remaining_time": "0:27:34", "throughput": 2305.74, "total_tokens": 34914568} {"current_steps": 60530, "total_steps": 67140, "loss": 0.5299, "lr": 1.4622331925765343e-06, "epoch": 9.015490020851951, "percentage": 90.15, "elapsed_time": "4:12:23", "remaining_time": "0:27:33", "throughput": 2305.76, "total_tokens": 34917544} {"current_steps": 60535, "total_steps": 67140, "loss": 0.6957, "lr": 1.460043987237325e-06, "epoch": 9.01623473339291, "percentage": 90.16, "elapsed_time": "4:12:24", "remaining_time": "0:27:32", "throughput": 2305.76, "total_tokens": 34920200} {"current_steps": 60540, "total_steps": 67140, "loss": 0.6404, "lr": 1.457856372632635e-06, "epoch": 9.01697944593387, "percentage": 90.17, "elapsed_time": "4:12:25", "remaining_time": "0:27:31", "throughput": 2305.78, "total_tokens": 34923016} {"current_steps": 60545, "total_steps": 67140, "loss": 0.484, "lr": 1.4556703489102958e-06, "epoch": 9.017724158474829, "percentage": 90.18, "elapsed_time": "4:12:26", "remaining_time": "0:27:29", "throughput": 2305.79, "total_tokens": 34925800} {"current_steps": 60550, "total_steps": 67140, "loss": 0.6748, "lr": 1.4534859162180308e-06, "epoch": 9.018468871015788, "percentage": 90.18, "elapsed_time": "4:12:28", "remaining_time": "0:27:28", "throughput": 2305.82, "total_tokens": 34929032} {"current_steps": 60555, "total_steps": 67140, "loss": 0.8661, "lr": 1.451303074703453e-06, "epoch": 9.019213583556747, "percentage": 90.19, "elapsed_time": "4:12:29", "remaining_time": "0:27:27", "throughput": 2305.85, "total_tokens": 34932104} {"current_steps": 60560, "total_steps": 67140, "loss": 0.524, "lr": 1.4491218245140715e-06, "epoch": 9.019958296097707, "percentage": 90.2, "elapsed_time": "4:12:30", "remaining_time": "0:27:26", "throughput": 2305.87, "total_tokens": 34934952} {"current_steps": 60565, "total_steps": 67140, "loss": 0.7224, "lr": 1.4469421657972855e-06, "epoch": 9.020703008638666, "percentage": 90.21, "elapsed_time": "4:12:31", "remaining_time": "0:27:24", "throughput": 2305.89, "total_tokens": 34937960} {"current_steps": 60570, "total_steps": 67140, "loss": 0.4835, "lr": 1.4447640987003935e-06, "epoch": 9.021447721179625, "percentage": 90.21, "elapsed_time": "4:12:32", "remaining_time": "0:27:23", "throughput": 2305.92, "total_tokens": 34941000} {"current_steps": 60575, "total_steps": 67140, "loss": 0.6879, "lr": 1.4425876233705698e-06, "epoch": 9.022192433720583, "percentage": 90.22, "elapsed_time": "4:12:33", "remaining_time": "0:27:22", "throughput": 2305.93, "total_tokens": 34943752} {"current_steps": 60580, "total_steps": 67140, "loss": 0.6599, "lr": 1.4404127399548966e-06, "epoch": 9.022937146261542, "percentage": 90.23, "elapsed_time": "4:12:34", "remaining_time": "0:27:21", "throughput": 2305.94, "total_tokens": 34946440} {"current_steps": 60585, "total_steps": 67140, "loss": 0.4263, "lr": 1.4382394486003454e-06, "epoch": 9.023681858802503, "percentage": 90.24, "elapsed_time": "4:12:36", "remaining_time": "0:27:19", "throughput": 2305.96, "total_tokens": 34949448} {"current_steps": 60590, "total_steps": 67140, "loss": 0.4933, "lr": 1.436067749453779e-06, "epoch": 9.024426571343461, "percentage": 90.24, "elapsed_time": "4:12:37", "remaining_time": "0:27:18", "throughput": 2305.98, "total_tokens": 34952424} {"current_steps": 60595, "total_steps": 67140, "loss": 0.5825, "lr": 1.4338976426619493e-06, "epoch": 9.02517128388442, "percentage": 90.25, "elapsed_time": "4:12:38", "remaining_time": "0:27:17", "throughput": 2306.01, "total_tokens": 34955528} {"current_steps": 60600, "total_steps": 67140, "loss": 0.707, "lr": 1.431729128371506e-06, "epoch": 9.025915996425379, "percentage": 90.26, "elapsed_time": "4:12:39", "remaining_time": "0:27:16", "throughput": 2306.04, "total_tokens": 34958760} {"current_steps": 60605, "total_steps": 67140, "loss": 0.5921, "lr": 1.4295622067289821e-06, "epoch": 9.02666070896634, "percentage": 90.27, "elapsed_time": "4:12:40", "remaining_time": "0:27:14", "throughput": 2306.06, "total_tokens": 34961640} {"current_steps": 60610, "total_steps": 67140, "loss": 0.4584, "lr": 1.4273968778808155e-06, "epoch": 9.027405421507298, "percentage": 90.27, "elapsed_time": "4:12:41", "remaining_time": "0:27:13", "throughput": 2306.09, "total_tokens": 34964808} {"current_steps": 60615, "total_steps": 67140, "loss": 0.6648, "lr": 1.4252331419733283e-06, "epoch": 9.028150134048257, "percentage": 90.28, "elapsed_time": "4:12:43", "remaining_time": "0:27:12", "throughput": 2306.09, "total_tokens": 34967464} {"current_steps": 60620, "total_steps": 67140, "loss": 0.4513, "lr": 1.423070999152737e-06, "epoch": 9.028894846589216, "percentage": 90.29, "elapsed_time": "4:12:44", "remaining_time": "0:27:10", "throughput": 2306.13, "total_tokens": 34970696} {"current_steps": 60625, "total_steps": 67140, "loss": 0.6166, "lr": 1.4209104495651492e-06, "epoch": 9.029639559130176, "percentage": 90.3, "elapsed_time": "4:12:45", "remaining_time": "0:27:09", "throughput": 2306.15, "total_tokens": 34973608} {"current_steps": 60630, "total_steps": 67140, "loss": 0.5713, "lr": 1.4187514933565738e-06, "epoch": 9.030384271671135, "percentage": 90.3, "elapsed_time": "4:12:46", "remaining_time": "0:27:08", "throughput": 2306.16, "total_tokens": 34976520} {"current_steps": 60635, "total_steps": 67140, "loss": 0.7396, "lr": 1.4165941306728963e-06, "epoch": 9.031128984212094, "percentage": 90.31, "elapsed_time": "4:12:47", "remaining_time": "0:27:07", "throughput": 2306.19, "total_tokens": 34979496} {"current_steps": 60640, "total_steps": 67140, "loss": 0.6434, "lr": 1.4144383616599033e-06, "epoch": 9.031873696753053, "percentage": 90.32, "elapsed_time": "4:12:48", "remaining_time": "0:27:05", "throughput": 2306.2, "total_tokens": 34982376} {"current_steps": 60645, "total_steps": 67140, "loss": 0.5892, "lr": 1.4122841864632724e-06, "epoch": 9.032618409294013, "percentage": 90.33, "elapsed_time": "4:12:49", "remaining_time": "0:27:04", "throughput": 2306.21, "total_tokens": 34985000} {"current_steps": 60650, "total_steps": 67140, "loss": 0.4236, "lr": 1.4101316052285734e-06, "epoch": 9.033363121834972, "percentage": 90.33, "elapsed_time": "4:12:51", "remaining_time": "0:27:03", "throughput": 2306.23, "total_tokens": 34987848} {"current_steps": 60655, "total_steps": 67140, "loss": 0.533, "lr": 1.4079806181012733e-06, "epoch": 9.03410783437593, "percentage": 90.34, "elapsed_time": "4:12:52", "remaining_time": "0:27:02", "throughput": 2306.23, "total_tokens": 34990376} {"current_steps": 60660, "total_steps": 67140, "loss": 0.6026, "lr": 1.4058312252267253e-06, "epoch": 9.03485254691689, "percentage": 90.35, "elapsed_time": "4:12:53", "remaining_time": "0:27:00", "throughput": 2306.24, "total_tokens": 34993032} {"current_steps": 60665, "total_steps": 67140, "loss": 0.5637, "lr": 1.4036834267501796e-06, "epoch": 9.03559725945785, "percentage": 90.36, "elapsed_time": "4:12:54", "remaining_time": "0:26:59", "throughput": 2306.25, "total_tokens": 34995816} {"current_steps": 60670, "total_steps": 67140, "loss": 0.5003, "lr": 1.4015372228167705e-06, "epoch": 9.036341971998809, "percentage": 90.36, "elapsed_time": "4:12:55", "remaining_time": "0:26:58", "throughput": 2306.26, "total_tokens": 34998440} {"current_steps": 60675, "total_steps": 67140, "loss": 0.6068, "lr": 1.399392613571529e-06, "epoch": 9.037086684539767, "percentage": 90.37, "elapsed_time": "4:12:56", "remaining_time": "0:26:57", "throughput": 2306.28, "total_tokens": 35001416} {"current_steps": 60680, "total_steps": 67140, "loss": 0.678, "lr": 1.3972495991593836e-06, "epoch": 9.037831397080726, "percentage": 90.38, "elapsed_time": "4:12:57", "remaining_time": "0:26:55", "throughput": 2306.29, "total_tokens": 35004232} {"current_steps": 60685, "total_steps": 67140, "loss": 0.6204, "lr": 1.3951081797251463e-06, "epoch": 9.038576109621687, "percentage": 90.39, "elapsed_time": "4:12:58", "remaining_time": "0:26:54", "throughput": 2306.31, "total_tokens": 35007016} {"current_steps": 60690, "total_steps": 67140, "loss": 0.6295, "lr": 1.3929683554135292e-06, "epoch": 9.039320822162646, "percentage": 90.39, "elapsed_time": "4:12:59", "remaining_time": "0:26:53", "throughput": 2306.32, "total_tokens": 35009800} {"current_steps": 60695, "total_steps": 67140, "loss": 0.3594, "lr": 1.3908301263691303e-06, "epoch": 9.040065534703604, "percentage": 90.4, "elapsed_time": "4:13:01", "remaining_time": "0:26:52", "throughput": 2306.34, "total_tokens": 35012680} {"current_steps": 60700, "total_steps": 67140, "loss": 0.6376, "lr": 1.3886934927364454e-06, "epoch": 9.040810247244563, "percentage": 90.41, "elapsed_time": "4:13:02", "remaining_time": "0:26:50", "throughput": 2306.34, "total_tokens": 35015304} {"current_steps": 60705, "total_steps": 67140, "loss": 0.4785, "lr": 1.3865584546598559e-06, "epoch": 9.041554959785524, "percentage": 90.42, "elapsed_time": "4:13:03", "remaining_time": "0:26:49", "throughput": 2306.36, "total_tokens": 35018056} {"current_steps": 60710, "total_steps": 67140, "loss": 0.4728, "lr": 1.384425012283644e-06, "epoch": 9.042299672326482, "percentage": 90.42, "elapsed_time": "4:13:04", "remaining_time": "0:26:48", "throughput": 2306.36, "total_tokens": 35020616} {"current_steps": 60715, "total_steps": 67140, "loss": 0.6856, "lr": 1.3822931657519744e-06, "epoch": 9.043044384867441, "percentage": 90.43, "elapsed_time": "4:13:05", "remaining_time": "0:26:46", "throughput": 2306.37, "total_tokens": 35023496} {"current_steps": 60720, "total_steps": 67140, "loss": 0.6666, "lr": 1.3801629152089073e-06, "epoch": 9.0437890974084, "percentage": 90.44, "elapsed_time": "4:13:06", "remaining_time": "0:26:45", "throughput": 2306.39, "total_tokens": 35026408} {"current_steps": 60725, "total_steps": 67140, "loss": 0.5868, "lr": 1.3780342607983999e-06, "epoch": 9.04453380994936, "percentage": 90.45, "elapsed_time": "4:13:07", "remaining_time": "0:26:44", "throughput": 2306.4, "total_tokens": 35029160} {"current_steps": 60730, "total_steps": 67140, "loss": 0.5993, "lr": 1.3759072026642978e-06, "epoch": 9.04527852249032, "percentage": 90.45, "elapsed_time": "4:13:08", "remaining_time": "0:26:43", "throughput": 2306.42, "total_tokens": 35031912} {"current_steps": 60735, "total_steps": 67140, "loss": 0.4536, "lr": 1.3737817409503417e-06, "epoch": 9.046023235031278, "percentage": 90.46, "elapsed_time": "4:13:10", "remaining_time": "0:26:41", "throughput": 2306.44, "total_tokens": 35034856} {"current_steps": 60740, "total_steps": 67140, "loss": 0.4001, "lr": 1.3716578758001557e-06, "epoch": 9.046767947572237, "percentage": 90.47, "elapsed_time": "4:13:11", "remaining_time": "0:26:40", "throughput": 2306.46, "total_tokens": 35037832} {"current_steps": 60745, "total_steps": 67140, "loss": 0.5706, "lr": 1.3695356073572612e-06, "epoch": 9.047512660113195, "percentage": 90.48, "elapsed_time": "4:13:12", "remaining_time": "0:26:39", "throughput": 2306.48, "total_tokens": 35040904} {"current_steps": 60750, "total_steps": 67140, "loss": 0.3884, "lr": 1.3674149357650822e-06, "epoch": 9.048257372654156, "percentage": 90.48, "elapsed_time": "4:13:13", "remaining_time": "0:26:38", "throughput": 2306.49, "total_tokens": 35043688} {"current_steps": 60755, "total_steps": 67140, "loss": 0.474, "lr": 1.3652958611669153e-06, "epoch": 9.049002085195115, "percentage": 90.49, "elapsed_time": "4:13:14", "remaining_time": "0:26:36", "throughput": 2306.52, "total_tokens": 35046696} {"current_steps": 60760, "total_steps": 67140, "loss": 0.4676, "lr": 1.3631783837059625e-06, "epoch": 9.049746797736073, "percentage": 90.5, "elapsed_time": "4:13:15", "remaining_time": "0:26:35", "throughput": 2306.55, "total_tokens": 35050088} {"current_steps": 60765, "total_steps": 67140, "loss": 0.6072, "lr": 1.3610625035253178e-06, "epoch": 9.050491510277032, "percentage": 90.5, "elapsed_time": "4:13:17", "remaining_time": "0:26:34", "throughput": 2306.57, "total_tokens": 35053000} {"current_steps": 60770, "total_steps": 67140, "loss": 0.6738, "lr": 1.3589482207679555e-06, "epoch": 9.051236222817993, "percentage": 90.51, "elapsed_time": "4:13:18", "remaining_time": "0:26:33", "throughput": 2306.58, "total_tokens": 35055752} {"current_steps": 60775, "total_steps": 67140, "loss": 0.598, "lr": 1.3568355355767559e-06, "epoch": 9.051980935358952, "percentage": 90.52, "elapsed_time": "4:13:19", "remaining_time": "0:26:31", "throughput": 2306.61, "total_tokens": 35058696} {"current_steps": 60780, "total_steps": 67140, "loss": 0.7388, "lr": 1.3547244480944826e-06, "epoch": 9.05272564789991, "percentage": 90.53, "elapsed_time": "4:13:20", "remaining_time": "0:26:30", "throughput": 2306.62, "total_tokens": 35061544} {"current_steps": 60785, "total_steps": 67140, "loss": 0.5125, "lr": 1.3526149584637993e-06, "epoch": 9.053470360440869, "percentage": 90.53, "elapsed_time": "4:13:21", "remaining_time": "0:26:29", "throughput": 2306.64, "total_tokens": 35064488} {"current_steps": 60790, "total_steps": 67140, "loss": 0.4077, "lr": 1.3505070668272556e-06, "epoch": 9.05421507298183, "percentage": 90.54, "elapsed_time": "4:13:22", "remaining_time": "0:26:28", "throughput": 2306.65, "total_tokens": 35067176} {"current_steps": 60795, "total_steps": 67140, "loss": 0.4534, "lr": 1.3484007733272908e-06, "epoch": 9.054959785522788, "percentage": 90.55, "elapsed_time": "4:13:23", "remaining_time": "0:26:26", "throughput": 2306.66, "total_tokens": 35069768} {"current_steps": 60800, "total_steps": 67140, "loss": 0.584, "lr": 1.3462960781062434e-06, "epoch": 9.055704498063747, "percentage": 90.56, "elapsed_time": "4:13:24", "remaining_time": "0:26:25", "throughput": 2306.67, "total_tokens": 35072680} {"current_steps": 60805, "total_steps": 67140, "loss": 0.701, "lr": 1.344192981306333e-06, "epoch": 9.056449210604706, "percentage": 90.56, "elapsed_time": "4:13:26", "remaining_time": "0:26:24", "throughput": 2306.7, "total_tokens": 35075688} {"current_steps": 60810, "total_steps": 67140, "loss": 0.5138, "lr": 1.3420914830696851e-06, "epoch": 9.057193923145666, "percentage": 90.57, "elapsed_time": "4:13:27", "remaining_time": "0:26:22", "throughput": 2306.72, "total_tokens": 35078664} {"current_steps": 60815, "total_steps": 67140, "loss": 0.4801, "lr": 1.339991583538308e-06, "epoch": 9.057938635686625, "percentage": 90.58, "elapsed_time": "4:13:28", "remaining_time": "0:26:21", "throughput": 2306.74, "total_tokens": 35081576} {"current_steps": 60820, "total_steps": 67140, "loss": 0.313, "lr": 1.337893282854108e-06, "epoch": 9.058683348227584, "percentage": 90.59, "elapsed_time": "4:13:29", "remaining_time": "0:26:20", "throughput": 2306.77, "total_tokens": 35084744} {"current_steps": 60825, "total_steps": 67140, "loss": 0.7659, "lr": 1.3357965811588741e-06, "epoch": 9.059428060768543, "percentage": 90.59, "elapsed_time": "4:13:30", "remaining_time": "0:26:19", "throughput": 2306.78, "total_tokens": 35087400} {"current_steps": 60830, "total_steps": 67140, "loss": 0.8584, "lr": 1.3337014785942985e-06, "epoch": 9.060172773309503, "percentage": 90.6, "elapsed_time": "4:13:31", "remaining_time": "0:26:17", "throughput": 2306.79, "total_tokens": 35090312} {"current_steps": 60835, "total_steps": 67140, "loss": 0.551, "lr": 1.33160797530196e-06, "epoch": 9.060917485850462, "percentage": 90.61, "elapsed_time": "4:13:32", "remaining_time": "0:26:16", "throughput": 2306.82, "total_tokens": 35093416} {"current_steps": 60840, "total_steps": 67140, "loss": 0.6428, "lr": 1.32951607142332e-06, "epoch": 9.06166219839142, "percentage": 90.62, "elapsed_time": "4:13:34", "remaining_time": "0:26:15", "throughput": 2306.83, "total_tokens": 35096264} {"current_steps": 60845, "total_steps": 67140, "loss": 0.3731, "lr": 1.3274257670997464e-06, "epoch": 9.06240691093238, "percentage": 90.62, "elapsed_time": "4:13:35", "remaining_time": "0:26:14", "throughput": 2306.86, "total_tokens": 35099208} {"current_steps": 60850, "total_steps": 67140, "loss": 0.5398, "lr": 1.3253370624724953e-06, "epoch": 9.06315162347334, "percentage": 90.63, "elapsed_time": "4:13:36", "remaining_time": "0:26:12", "throughput": 2306.87, "total_tokens": 35102024} {"current_steps": 60855, "total_steps": 67140, "loss": 0.5412, "lr": 1.3232499576827096e-06, "epoch": 9.063896336014299, "percentage": 90.64, "elapsed_time": "4:13:37", "remaining_time": "0:26:11", "throughput": 2306.9, "total_tokens": 35105288} {"current_steps": 60860, "total_steps": 67140, "loss": 0.5961, "lr": 1.321164452871429e-06, "epoch": 9.064641048555258, "percentage": 90.65, "elapsed_time": "4:13:38", "remaining_time": "0:26:10", "throughput": 2306.91, "total_tokens": 35107944} {"current_steps": 60865, "total_steps": 67140, "loss": 0.5119, "lr": 1.319080548179588e-06, "epoch": 9.065385761096216, "percentage": 90.65, "elapsed_time": "4:13:39", "remaining_time": "0:26:09", "throughput": 2306.95, "total_tokens": 35111400} {"current_steps": 60870, "total_steps": 67140, "loss": 0.4218, "lr": 1.316998243748005e-06, "epoch": 9.066130473637177, "percentage": 90.66, "elapsed_time": "4:13:40", "remaining_time": "0:26:07", "throughput": 2306.96, "total_tokens": 35114184} {"current_steps": 60875, "total_steps": 67140, "loss": 0.8118, "lr": 1.3149175397173891e-06, "epoch": 9.066875186178136, "percentage": 90.67, "elapsed_time": "4:13:42", "remaining_time": "0:26:06", "throughput": 2307.0, "total_tokens": 35117416} {"current_steps": 60880, "total_steps": 67140, "loss": 0.6919, "lr": 1.3128384362283474e-06, "epoch": 9.067619898719094, "percentage": 90.68, "elapsed_time": "4:13:43", "remaining_time": "0:26:05", "throughput": 2307.03, "total_tokens": 35120648} {"current_steps": 60885, "total_steps": 67140, "loss": 0.4356, "lr": 1.3107609334213816e-06, "epoch": 9.068364611260053, "percentage": 90.68, "elapsed_time": "4:13:44", "remaining_time": "0:26:04", "throughput": 2307.05, "total_tokens": 35123656} {"current_steps": 60890, "total_steps": 67140, "loss": 0.6024, "lr": 1.3086850314368764e-06, "epoch": 9.069109323801014, "percentage": 90.69, "elapsed_time": "4:13:45", "remaining_time": "0:26:02", "throughput": 2307.07, "total_tokens": 35126536} {"current_steps": 60895, "total_steps": 67140, "loss": 0.7147, "lr": 1.3066107304151142e-06, "epoch": 9.069854036341972, "percentage": 90.7, "elapsed_time": "4:13:46", "remaining_time": "0:26:01", "throughput": 2307.1, "total_tokens": 35129704} {"current_steps": 60900, "total_steps": 67140, "loss": 0.7039, "lr": 1.3045380304962745e-06, "epoch": 9.070598748882931, "percentage": 90.71, "elapsed_time": "4:13:47", "remaining_time": "0:26:00", "throughput": 2307.12, "total_tokens": 35132488} {"current_steps": 60905, "total_steps": 67140, "loss": 0.5707, "lr": 1.302466931820412e-06, "epoch": 9.07134346142389, "percentage": 90.71, "elapsed_time": "4:13:49", "remaining_time": "0:25:59", "throughput": 2307.14, "total_tokens": 35135496} {"current_steps": 60910, "total_steps": 67140, "loss": 0.5561, "lr": 1.3003974345274894e-06, "epoch": 9.07208817396485, "percentage": 90.72, "elapsed_time": "4:13:50", "remaining_time": "0:25:57", "throughput": 2307.15, "total_tokens": 35138344} {"current_steps": 60915, "total_steps": 67140, "loss": 0.5292, "lr": 1.2983295387573507e-06, "epoch": 9.07283288650581, "percentage": 90.73, "elapsed_time": "4:13:51", "remaining_time": "0:25:56", "throughput": 2307.16, "total_tokens": 35141000} {"current_steps": 60920, "total_steps": 67140, "loss": 0.3647, "lr": 1.296263244649737e-06, "epoch": 9.073577599046768, "percentage": 90.74, "elapsed_time": "4:13:52", "remaining_time": "0:25:55", "throughput": 2307.18, "total_tokens": 35143784} {"current_steps": 60925, "total_steps": 67140, "loss": 0.6901, "lr": 1.2941985523442806e-06, "epoch": 9.074322311587727, "percentage": 90.74, "elapsed_time": "4:13:53", "remaining_time": "0:25:53", "throughput": 2307.19, "total_tokens": 35146568} {"current_steps": 60930, "total_steps": 67140, "loss": 0.5341, "lr": 1.2921354619805066e-06, "epoch": 9.075067024128685, "percentage": 90.75, "elapsed_time": "4:13:54", "remaining_time": "0:25:52", "throughput": 2307.22, "total_tokens": 35149768} {"current_steps": 60935, "total_steps": 67140, "loss": 0.6102, "lr": 1.290073973697828e-06, "epoch": 9.075811736669646, "percentage": 90.76, "elapsed_time": "4:13:55", "remaining_time": "0:25:51", "throughput": 2307.22, "total_tokens": 35152424} {"current_steps": 60940, "total_steps": 67140, "loss": 0.5906, "lr": 1.288014087635553e-06, "epoch": 9.076556449210605, "percentage": 90.77, "elapsed_time": "4:13:56", "remaining_time": "0:25:50", "throughput": 2307.24, "total_tokens": 35155272} {"current_steps": 60945, "total_steps": 67140, "loss": 0.6939, "lr": 1.2859558039328784e-06, "epoch": 9.077301161751564, "percentage": 90.77, "elapsed_time": "4:13:58", "remaining_time": "0:25:48", "throughput": 2307.26, "total_tokens": 35158216} {"current_steps": 60950, "total_steps": 67140, "loss": 0.502, "lr": 1.2838991227289016e-06, "epoch": 9.078045874292522, "percentage": 90.78, "elapsed_time": "4:13:59", "remaining_time": "0:25:47", "throughput": 2307.28, "total_tokens": 35161096} {"current_steps": 60955, "total_steps": 67140, "loss": 0.6324, "lr": 1.2818440441625946e-06, "epoch": 9.078790586833483, "percentage": 90.79, "elapsed_time": "4:14:00", "remaining_time": "0:25:46", "throughput": 2307.29, "total_tokens": 35163848} {"current_steps": 60960, "total_steps": 67140, "loss": 0.6212, "lr": 1.2797905683728377e-06, "epoch": 9.079535299374442, "percentage": 90.8, "elapsed_time": "4:14:01", "remaining_time": "0:25:45", "throughput": 2307.31, "total_tokens": 35166856} {"current_steps": 60965, "total_steps": 67140, "loss": 0.6063, "lr": 1.2777386954983956e-06, "epoch": 9.0802800119154, "percentage": 90.8, "elapsed_time": "4:14:02", "remaining_time": "0:25:43", "throughput": 2307.34, "total_tokens": 35170024} {"current_steps": 60970, "total_steps": 67140, "loss": 0.5857, "lr": 1.2756884256779234e-06, "epoch": 9.081024724456359, "percentage": 90.81, "elapsed_time": "4:14:03", "remaining_time": "0:25:42", "throughput": 2307.35, "total_tokens": 35172712} {"current_steps": 60975, "total_steps": 67140, "loss": 0.5455, "lr": 1.2736397590499716e-06, "epoch": 9.08176943699732, "percentage": 90.82, "elapsed_time": "4:14:04", "remaining_time": "0:25:41", "throughput": 2307.36, "total_tokens": 35175464} {"current_steps": 60980, "total_steps": 67140, "loss": 0.5365, "lr": 1.2715926957529794e-06, "epoch": 9.082514149538278, "percentage": 90.83, "elapsed_time": "4:14:05", "remaining_time": "0:25:40", "throughput": 2307.36, "total_tokens": 35177992} {"current_steps": 60985, "total_steps": 67140, "loss": 0.7271, "lr": 1.2695472359252808e-06, "epoch": 9.083258862079237, "percentage": 90.83, "elapsed_time": "4:14:07", "remaining_time": "0:25:38", "throughput": 2307.37, "total_tokens": 35180680} {"current_steps": 60990, "total_steps": 67140, "loss": 0.4187, "lr": 1.267503379705104e-06, "epoch": 9.084003574620196, "percentage": 90.84, "elapsed_time": "4:14:08", "remaining_time": "0:25:37", "throughput": 2307.39, "total_tokens": 35183592} {"current_steps": 60995, "total_steps": 67140, "loss": 0.6706, "lr": 1.2654611272305521e-06, "epoch": 9.084748287161156, "percentage": 90.85, "elapsed_time": "4:14:09", "remaining_time": "0:25:36", "throughput": 2307.4, "total_tokens": 35186280} {"current_steps": 61000, "total_steps": 67140, "loss": 0.448, "lr": 1.2634204786396458e-06, "epoch": 9.085492999702115, "percentage": 90.85, "elapsed_time": "4:14:10", "remaining_time": "0:25:35", "throughput": 2307.42, "total_tokens": 35189352} {"current_steps": 61005, "total_steps": 67140, "loss": 0.4344, "lr": 1.2613814340702746e-06, "epoch": 9.086237712243074, "percentage": 90.86, "elapsed_time": "4:14:11", "remaining_time": "0:25:33", "throughput": 2307.44, "total_tokens": 35192232} {"current_steps": 61010, "total_steps": 67140, "loss": 0.3909, "lr": 1.2593439936602308e-06, "epoch": 9.086982424784033, "percentage": 90.87, "elapsed_time": "4:14:12", "remaining_time": "0:25:32", "throughput": 2307.45, "total_tokens": 35194856} {"current_steps": 61015, "total_steps": 67140, "loss": 0.5379, "lr": 1.2573081575471963e-06, "epoch": 9.087727137324993, "percentage": 90.88, "elapsed_time": "4:14:13", "remaining_time": "0:25:31", "throughput": 2307.46, "total_tokens": 35197704} {"current_steps": 61020, "total_steps": 67140, "loss": 0.5871, "lr": 1.2552739258687469e-06, "epoch": 9.088471849865952, "percentage": 90.88, "elapsed_time": "4:14:15", "remaining_time": "0:25:30", "throughput": 2307.49, "total_tokens": 35200840} {"current_steps": 61025, "total_steps": 67140, "loss": 0.7158, "lr": 1.2532412987623477e-06, "epoch": 9.08921656240691, "percentage": 90.89, "elapsed_time": "4:14:16", "remaining_time": "0:25:28", "throughput": 2307.51, "total_tokens": 35203784} {"current_steps": 61030, "total_steps": 67140, "loss": 0.4959, "lr": 1.2512102763653556e-06, "epoch": 9.08996127494787, "percentage": 90.9, "elapsed_time": "4:14:17", "remaining_time": "0:25:27", "throughput": 2307.52, "total_tokens": 35206600} {"current_steps": 61035, "total_steps": 67140, "loss": 0.4898, "lr": 1.249180858815019e-06, "epoch": 9.09070598748883, "percentage": 90.91, "elapsed_time": "4:14:18", "remaining_time": "0:25:26", "throughput": 2307.54, "total_tokens": 35209544} {"current_steps": 61040, "total_steps": 67140, "loss": 0.6687, "lr": 1.2471530462484727e-06, "epoch": 9.091450700029789, "percentage": 90.91, "elapsed_time": "4:14:19", "remaining_time": "0:25:24", "throughput": 2307.55, "total_tokens": 35212264} {"current_steps": 61045, "total_steps": 67140, "loss": 0.4517, "lr": 1.2451268388027514e-06, "epoch": 9.092195412570748, "percentage": 90.92, "elapsed_time": "4:14:20", "remaining_time": "0:25:23", "throughput": 2307.57, "total_tokens": 35215016} {"current_steps": 61050, "total_steps": 67140, "loss": 0.5731, "lr": 1.2431022366147766e-06, "epoch": 9.092940125111706, "percentage": 90.93, "elapsed_time": "4:14:21", "remaining_time": "0:25:22", "throughput": 2307.58, "total_tokens": 35217896} {"current_steps": 61055, "total_steps": 67140, "loss": 0.4466, "lr": 1.2410792398213662e-06, "epoch": 9.093684837652667, "percentage": 90.94, "elapsed_time": "4:14:22", "remaining_time": "0:25:21", "throughput": 2307.6, "total_tokens": 35220744} {"current_steps": 61060, "total_steps": 67140, "loss": 0.5805, "lr": 1.2390578485592246e-06, "epoch": 9.094429550193626, "percentage": 90.94, "elapsed_time": "4:14:24", "remaining_time": "0:25:19", "throughput": 2307.62, "total_tokens": 35223624} {"current_steps": 61065, "total_steps": 67140, "loss": 0.5882, "lr": 1.2370380629649486e-06, "epoch": 9.095174262734584, "percentage": 90.95, "elapsed_time": "4:14:25", "remaining_time": "0:25:18", "throughput": 2307.63, "total_tokens": 35226408} {"current_steps": 61070, "total_steps": 67140, "loss": 0.3072, "lr": 1.2350198831750259e-06, "epoch": 9.095918975275543, "percentage": 90.96, "elapsed_time": "4:14:26", "remaining_time": "0:25:17", "throughput": 2307.65, "total_tokens": 35229320} {"current_steps": 61075, "total_steps": 67140, "loss": 0.6634, "lr": 1.233003309325842e-06, "epoch": 9.096663687816504, "percentage": 90.97, "elapsed_time": "4:14:27", "remaining_time": "0:25:16", "throughput": 2307.67, "total_tokens": 35232360} {"current_steps": 61080, "total_steps": 67140, "loss": 0.6533, "lr": 1.23098834155366e-06, "epoch": 9.097408400357462, "percentage": 90.97, "elapsed_time": "4:14:28", "remaining_time": "0:25:14", "throughput": 2307.7, "total_tokens": 35235464} {"current_steps": 61085, "total_steps": 67140, "loss": 0.4048, "lr": 1.2289749799946487e-06, "epoch": 9.098153112898421, "percentage": 90.98, "elapsed_time": "4:14:29", "remaining_time": "0:25:13", "throughput": 2307.73, "total_tokens": 35238696} {"current_steps": 61090, "total_steps": 67140, "loss": 0.3483, "lr": 1.2269632247848633e-06, "epoch": 9.09889782543938, "percentage": 90.99, "elapsed_time": "4:14:30", "remaining_time": "0:25:12", "throughput": 2307.74, "total_tokens": 35241448} {"current_steps": 61095, "total_steps": 67140, "loss": 0.7581, "lr": 1.2249530760602534e-06, "epoch": 9.099642537980339, "percentage": 91.0, "elapsed_time": "4:14:32", "remaining_time": "0:25:11", "throughput": 2307.76, "total_tokens": 35244200} {"current_steps": 61100, "total_steps": 67140, "loss": 0.5555, "lr": 1.2229445339566465e-06, "epoch": 9.1003872505213, "percentage": 91.0, "elapsed_time": "4:14:33", "remaining_time": "0:25:09", "throughput": 2307.78, "total_tokens": 35247208} {"current_steps": 61105, "total_steps": 67140, "loss": 0.5968, "lr": 1.2209375986097782e-06, "epoch": 9.101131963062258, "percentage": 91.01, "elapsed_time": "4:14:34", "remaining_time": "0:25:08", "throughput": 2307.81, "total_tokens": 35250312} {"current_steps": 61110, "total_steps": 67140, "loss": 0.5091, "lr": 1.218932270155268e-06, "epoch": 9.101876675603217, "percentage": 91.02, "elapsed_time": "4:14:35", "remaining_time": "0:25:07", "throughput": 2307.84, "total_tokens": 35253672} {"current_steps": 61115, "total_steps": 67140, "loss": 0.8164, "lr": 1.2169285487286325e-06, "epoch": 9.102621388144176, "percentage": 91.03, "elapsed_time": "4:14:36", "remaining_time": "0:25:06", "throughput": 2307.88, "total_tokens": 35257064} {"current_steps": 61120, "total_steps": 67140, "loss": 0.5684, "lr": 1.214926434465266e-06, "epoch": 9.103366100685136, "percentage": 91.03, "elapsed_time": "4:14:37", "remaining_time": "0:25:04", "throughput": 2307.89, "total_tokens": 35259784} {"current_steps": 61125, "total_steps": 67140, "loss": 0.5527, "lr": 1.212925927500469e-06, "epoch": 9.104110813226095, "percentage": 91.04, "elapsed_time": "4:14:39", "remaining_time": "0:25:03", "throughput": 2307.91, "total_tokens": 35262632} {"current_steps": 61130, "total_steps": 67140, "loss": 0.6749, "lr": 1.21092702796943e-06, "epoch": 9.104855525767054, "percentage": 91.05, "elapsed_time": "4:14:40", "remaining_time": "0:25:02", "throughput": 2307.92, "total_tokens": 35265544} {"current_steps": 61135, "total_steps": 67140, "loss": 0.4203, "lr": 1.2089297360072193e-06, "epoch": 9.105600238308012, "percentage": 91.06, "elapsed_time": "4:14:41", "remaining_time": "0:25:01", "throughput": 2307.94, "total_tokens": 35268328} {"current_steps": 61140, "total_steps": 67140, "loss": 0.4821, "lr": 1.2069340517488093e-06, "epoch": 9.106344950848973, "percentage": 91.06, "elapsed_time": "4:14:42", "remaining_time": "0:24:59", "throughput": 2307.96, "total_tokens": 35271304} {"current_steps": 61145, "total_steps": 67140, "loss": 0.5325, "lr": 1.2049399753290612e-06, "epoch": 9.107089663389932, "percentage": 91.07, "elapsed_time": "4:14:43", "remaining_time": "0:24:58", "throughput": 2307.97, "total_tokens": 35274120} {"current_steps": 61150, "total_steps": 67140, "loss": 0.511, "lr": 1.2029475068827262e-06, "epoch": 9.10783437593089, "percentage": 91.08, "elapsed_time": "4:14:44", "remaining_time": "0:24:57", "throughput": 2307.98, "total_tokens": 35276680} {"current_steps": 61155, "total_steps": 67140, "loss": 0.6519, "lr": 1.2009566465444517e-06, "epoch": 9.10857908847185, "percentage": 91.09, "elapsed_time": "4:14:45", "remaining_time": "0:24:55", "throughput": 2307.99, "total_tokens": 35279400} {"current_steps": 61160, "total_steps": 67140, "loss": 0.6615, "lr": 1.1989673944487606e-06, "epoch": 9.10932380101281, "percentage": 91.09, "elapsed_time": "4:14:46", "remaining_time": "0:24:54", "throughput": 2308.01, "total_tokens": 35282312} {"current_steps": 61165, "total_steps": 67140, "loss": 0.5492, "lr": 1.19697975073009e-06, "epoch": 9.110068513553768, "percentage": 91.1, "elapsed_time": "4:14:48", "remaining_time": "0:24:53", "throughput": 2308.03, "total_tokens": 35285288} {"current_steps": 61170, "total_steps": 67140, "loss": 0.592, "lr": 1.194993715522749e-06, "epoch": 9.110813226094727, "percentage": 91.11, "elapsed_time": "4:14:49", "remaining_time": "0:24:52", "throughput": 2308.05, "total_tokens": 35288296} {"current_steps": 61175, "total_steps": 67140, "loss": 0.7288, "lr": 1.1930092889609473e-06, "epoch": 9.111557938635686, "percentage": 91.12, "elapsed_time": "4:14:50", "remaining_time": "0:24:50", "throughput": 2308.07, "total_tokens": 35291240} {"current_steps": 61180, "total_steps": 67140, "loss": 0.6167, "lr": 1.1910264711787855e-06, "epoch": 9.112302651176647, "percentage": 91.12, "elapsed_time": "4:14:51", "remaining_time": "0:24:49", "throughput": 2308.08, "total_tokens": 35293960} {"current_steps": 61185, "total_steps": 67140, "loss": 0.5396, "lr": 1.1890452623102566e-06, "epoch": 9.113047363717605, "percentage": 91.13, "elapsed_time": "4:14:52", "remaining_time": "0:24:48", "throughput": 2308.1, "total_tokens": 35296744} {"current_steps": 61190, "total_steps": 67140, "loss": 0.5763, "lr": 1.1870656624892397e-06, "epoch": 9.113792076258564, "percentage": 91.14, "elapsed_time": "4:14:53", "remaining_time": "0:24:47", "throughput": 2308.12, "total_tokens": 35299624} {"current_steps": 61195, "total_steps": 67140, "loss": 0.6154, "lr": 1.1850876718495107e-06, "epoch": 9.114536788799523, "percentage": 91.15, "elapsed_time": "4:14:54", "remaining_time": "0:24:45", "throughput": 2308.12, "total_tokens": 35302216} {"current_steps": 61200, "total_steps": 67140, "loss": 0.7602, "lr": 1.1831112905247327e-06, "epoch": 9.115281501340483, "percentage": 91.15, "elapsed_time": "4:14:55", "remaining_time": "0:24:44", "throughput": 2308.13, "total_tokens": 35305000} {"current_steps": 61205, "total_steps": 67140, "loss": 0.4601, "lr": 1.1811365186484595e-06, "epoch": 9.116026213881442, "percentage": 91.16, "elapsed_time": "4:14:57", "remaining_time": "0:24:43", "throughput": 2308.16, "total_tokens": 35308136} {"current_steps": 61210, "total_steps": 67140, "loss": 0.6184, "lr": 1.1791633563541404e-06, "epoch": 9.1167709264224, "percentage": 91.17, "elapsed_time": "4:14:58", "remaining_time": "0:24:42", "throughput": 2308.18, "total_tokens": 35311112} {"current_steps": 61215, "total_steps": 67140, "loss": 0.6797, "lr": 1.1771918037751128e-06, "epoch": 9.11751563896336, "percentage": 91.18, "elapsed_time": "4:14:59", "remaining_time": "0:24:40", "throughput": 2308.19, "total_tokens": 35313800} {"current_steps": 61220, "total_steps": 67140, "loss": 0.4783, "lr": 1.1752218610446037e-06, "epoch": 9.11826035150432, "percentage": 91.18, "elapsed_time": "4:15:00", "remaining_time": "0:24:39", "throughput": 2308.2, "total_tokens": 35316584} {"current_steps": 61225, "total_steps": 67140, "loss": 0.3994, "lr": 1.1732535282957397e-06, "epoch": 9.119005064045279, "percentage": 91.19, "elapsed_time": "4:15:01", "remaining_time": "0:24:38", "throughput": 2308.22, "total_tokens": 35319432} {"current_steps": 61230, "total_steps": 67140, "loss": 0.5349, "lr": 1.171286805661534e-06, "epoch": 9.119749776586238, "percentage": 91.2, "elapsed_time": "4:15:02", "remaining_time": "0:24:37", "throughput": 2308.23, "total_tokens": 35322216} {"current_steps": 61235, "total_steps": 67140, "loss": 0.5414, "lr": 1.169321693274883e-06, "epoch": 9.120494489127196, "percentage": 91.2, "elapsed_time": "4:15:03", "remaining_time": "0:24:35", "throughput": 2308.25, "total_tokens": 35325096} {"current_steps": 61240, "total_steps": 67140, "loss": 0.6466, "lr": 1.1673581912685805e-06, "epoch": 9.121239201668157, "percentage": 91.21, "elapsed_time": "4:15:04", "remaining_time": "0:24:34", "throughput": 2308.26, "total_tokens": 35327816} {"current_steps": 61245, "total_steps": 67140, "loss": 0.6708, "lr": 1.1653962997753148e-06, "epoch": 9.121983914209116, "percentage": 91.22, "elapsed_time": "4:15:06", "remaining_time": "0:24:33", "throughput": 2308.27, "total_tokens": 35330600} {"current_steps": 61250, "total_steps": 67140, "loss": 0.6077, "lr": 1.1634360189276632e-06, "epoch": 9.122728626750074, "percentage": 91.23, "elapsed_time": "4:15:07", "remaining_time": "0:24:31", "throughput": 2308.3, "total_tokens": 35333768} {"current_steps": 61255, "total_steps": 67140, "loss": 0.6844, "lr": 1.161477348858095e-06, "epoch": 9.123473339291033, "percentage": 91.23, "elapsed_time": "4:15:08", "remaining_time": "0:24:30", "throughput": 2308.31, "total_tokens": 35336488} {"current_steps": 61260, "total_steps": 67140, "loss": 0.5459, "lr": 1.1595202896989677e-06, "epoch": 9.124218051831992, "percentage": 91.24, "elapsed_time": "4:15:09", "remaining_time": "0:24:29", "throughput": 2308.33, "total_tokens": 35339272} {"current_steps": 61265, "total_steps": 67140, "loss": 0.5923, "lr": 1.1575648415825285e-06, "epoch": 9.124962764372953, "percentage": 91.25, "elapsed_time": "4:15:10", "remaining_time": "0:24:28", "throughput": 2308.35, "total_tokens": 35342216} {"current_steps": 61270, "total_steps": 67140, "loss": 0.6042, "lr": 1.1556110046409218e-06, "epoch": 9.125707476913911, "percentage": 91.26, "elapsed_time": "4:15:11", "remaining_time": "0:24:26", "throughput": 2308.37, "total_tokens": 35345160} {"current_steps": 61275, "total_steps": 67140, "loss": 0.625, "lr": 1.153658779006181e-06, "epoch": 9.12645218945487, "percentage": 91.26, "elapsed_time": "4:15:12", "remaining_time": "0:24:25", "throughput": 2308.38, "total_tokens": 35347944} {"current_steps": 61280, "total_steps": 67140, "loss": 0.5977, "lr": 1.151708164810228e-06, "epoch": 9.127196901995829, "percentage": 91.27, "elapsed_time": "4:15:14", "remaining_time": "0:24:24", "throughput": 2308.4, "total_tokens": 35350920} {"current_steps": 61285, "total_steps": 67140, "loss": 0.4927, "lr": 1.1497591621848741e-06, "epoch": 9.12794161453679, "percentage": 91.28, "elapsed_time": "4:15:15", "remaining_time": "0:24:23", "throughput": 2308.42, "total_tokens": 35353800} {"current_steps": 61290, "total_steps": 67140, "loss": 0.5004, "lr": 1.1478117712618281e-06, "epoch": 9.128686327077748, "percentage": 91.29, "elapsed_time": "4:15:16", "remaining_time": "0:24:21", "throughput": 2308.44, "total_tokens": 35356840} {"current_steps": 61295, "total_steps": 67140, "loss": 0.5851, "lr": 1.14586599217269e-06, "epoch": 9.129431039618707, "percentage": 91.29, "elapsed_time": "4:15:17", "remaining_time": "0:24:20", "throughput": 2308.44, "total_tokens": 35359400} {"current_steps": 61300, "total_steps": 67140, "loss": 0.4292, "lr": 1.1439218250489408e-06, "epoch": 9.130175752159666, "percentage": 91.3, "elapsed_time": "4:15:18", "remaining_time": "0:24:19", "throughput": 2308.46, "total_tokens": 35362312} {"current_steps": 61305, "total_steps": 67140, "loss": 0.6739, "lr": 1.1419792700219644e-06, "epoch": 9.130920464700626, "percentage": 91.31, "elapsed_time": "4:15:19", "remaining_time": "0:24:18", "throughput": 2308.48, "total_tokens": 35365384} {"current_steps": 61310, "total_steps": 67140, "loss": 0.6263, "lr": 1.1400383272230281e-06, "epoch": 9.131665177241585, "percentage": 91.32, "elapsed_time": "4:15:20", "remaining_time": "0:24:16", "throughput": 2308.51, "total_tokens": 35368424} {"current_steps": 61315, "total_steps": 67140, "loss": 0.8308, "lr": 1.1380989967832962e-06, "epoch": 9.132409889782544, "percentage": 91.32, "elapsed_time": "4:15:22", "remaining_time": "0:24:15", "throughput": 2308.53, "total_tokens": 35371496} {"current_steps": 61320, "total_steps": 67140, "loss": 0.4271, "lr": 1.1361612788338166e-06, "epoch": 9.133154602323502, "percentage": 91.33, "elapsed_time": "4:15:23", "remaining_time": "0:24:14", "throughput": 2308.54, "total_tokens": 35374312} {"current_steps": 61325, "total_steps": 67140, "loss": 0.6092, "lr": 1.134225173505535e-06, "epoch": 9.133899314864463, "percentage": 91.34, "elapsed_time": "4:15:24", "remaining_time": "0:24:13", "throughput": 2308.56, "total_tokens": 35377128} {"current_steps": 61330, "total_steps": 67140, "loss": 0.5332, "lr": 1.1322906809292877e-06, "epoch": 9.134644027405422, "percentage": 91.35, "elapsed_time": "4:15:25", "remaining_time": "0:24:11", "throughput": 2308.58, "total_tokens": 35380168} {"current_steps": 61335, "total_steps": 67140, "loss": 0.6729, "lr": 1.130357801235793e-06, "epoch": 9.13538873994638, "percentage": 91.35, "elapsed_time": "4:15:26", "remaining_time": "0:24:10", "throughput": 2308.59, "total_tokens": 35382856} {"current_steps": 61340, "total_steps": 67140, "loss": 0.6068, "lr": 1.128426534555674e-06, "epoch": 9.13613345248734, "percentage": 91.36, "elapsed_time": "4:15:27", "remaining_time": "0:24:09", "throughput": 2308.61, "total_tokens": 35385960} {"current_steps": 61345, "total_steps": 67140, "loss": 0.5711, "lr": 1.1264968810194315e-06, "epoch": 9.1368781650283, "percentage": 91.37, "elapsed_time": "4:15:28", "remaining_time": "0:24:08", "throughput": 2308.64, "total_tokens": 35389064} {"current_steps": 61350, "total_steps": 67140, "loss": 0.5407, "lr": 1.12456884075747e-06, "epoch": 9.137622877569259, "percentage": 91.38, "elapsed_time": "4:15:30", "remaining_time": "0:24:06", "throughput": 2308.66, "total_tokens": 35391944} {"current_steps": 61355, "total_steps": 67140, "loss": 0.377, "lr": 1.1226424139000797e-06, "epoch": 9.138367590110217, "percentage": 91.38, "elapsed_time": "4:15:31", "remaining_time": "0:24:05", "throughput": 2308.68, "total_tokens": 35395016} {"current_steps": 61360, "total_steps": 67140, "loss": 0.6507, "lr": 1.120717600577431e-06, "epoch": 9.139112302651176, "percentage": 91.39, "elapsed_time": "4:15:32", "remaining_time": "0:24:04", "throughput": 2308.7, "total_tokens": 35397864} {"current_steps": 61365, "total_steps": 67140, "loss": 0.5267, "lr": 1.1187944009196038e-06, "epoch": 9.139857015192137, "percentage": 91.4, "elapsed_time": "4:15:33", "remaining_time": "0:24:03", "throughput": 2308.71, "total_tokens": 35400648} {"current_steps": 61370, "total_steps": 67140, "loss": 0.7458, "lr": 1.116872815056555e-06, "epoch": 9.140601727733095, "percentage": 91.41, "elapsed_time": "4:15:34", "remaining_time": "0:24:01", "throughput": 2308.72, "total_tokens": 35403432} {"current_steps": 61375, "total_steps": 67140, "loss": 0.6991, "lr": 1.1149528431181417e-06, "epoch": 9.141346440274054, "percentage": 91.41, "elapsed_time": "4:15:35", "remaining_time": "0:24:00", "throughput": 2308.75, "total_tokens": 35406728} {"current_steps": 61380, "total_steps": 67140, "loss": 0.6446, "lr": 1.1130344852341017e-06, "epoch": 9.142091152815013, "percentage": 91.42, "elapsed_time": "4:15:36", "remaining_time": "0:23:59", "throughput": 2308.78, "total_tokens": 35409672} {"current_steps": 61385, "total_steps": 67140, "loss": 0.7527, "lr": 1.1111177415340762e-06, "epoch": 9.142835865355973, "percentage": 91.43, "elapsed_time": "4:15:38", "remaining_time": "0:23:57", "throughput": 2308.81, "total_tokens": 35412872} {"current_steps": 61390, "total_steps": 67140, "loss": 0.5999, "lr": 1.109202612147589e-06, "epoch": 9.143580577896932, "percentage": 91.44, "elapsed_time": "4:15:39", "remaining_time": "0:23:56", "throughput": 2308.82, "total_tokens": 35415624} {"current_steps": 61395, "total_steps": 67140, "loss": 0.4476, "lr": 1.1072890972040588e-06, "epoch": 9.14432529043789, "percentage": 91.44, "elapsed_time": "4:15:40", "remaining_time": "0:23:55", "throughput": 2308.83, "total_tokens": 35418408} {"current_steps": 61400, "total_steps": 67140, "loss": 0.4639, "lr": 1.1053771968327908e-06, "epoch": 9.14507000297885, "percentage": 91.45, "elapsed_time": "4:15:41", "remaining_time": "0:23:54", "throughput": 2308.84, "total_tokens": 35421160} {"current_steps": 61405, "total_steps": 67140, "loss": 0.9122, "lr": 1.1034669111629787e-06, "epoch": 9.14581471551981, "percentage": 91.46, "elapsed_time": "4:15:42", "remaining_time": "0:23:52", "throughput": 2308.87, "total_tokens": 35424200} {"current_steps": 61410, "total_steps": 67140, "loss": 0.6923, "lr": 1.101558240323719e-06, "epoch": 9.146559428060769, "percentage": 91.47, "elapsed_time": "4:15:43", "remaining_time": "0:23:51", "throughput": 2308.88, "total_tokens": 35426952} {"current_steps": 61415, "total_steps": 67140, "loss": 0.5759, "lr": 1.0996511844439867e-06, "epoch": 9.147304140601728, "percentage": 91.47, "elapsed_time": "4:15:44", "remaining_time": "0:23:50", "throughput": 2308.89, "total_tokens": 35429640} {"current_steps": 61420, "total_steps": 67140, "loss": 0.5329, "lr": 1.097745743652659e-06, "epoch": 9.148048853142686, "percentage": 91.48, "elapsed_time": "4:15:46", "remaining_time": "0:23:49", "throughput": 2308.92, "total_tokens": 35432904} {"current_steps": 61425, "total_steps": 67140, "loss": 0.5572, "lr": 1.095841918078494e-06, "epoch": 9.148793565683647, "percentage": 91.49, "elapsed_time": "4:15:47", "remaining_time": "0:23:47", "throughput": 2308.93, "total_tokens": 35435688} {"current_steps": 61430, "total_steps": 67140, "loss": 0.6109, "lr": 1.0939397078501445e-06, "epoch": 9.149538278224606, "percentage": 91.5, "elapsed_time": "4:15:48", "remaining_time": "0:23:46", "throughput": 2308.95, "total_tokens": 35438504} {"current_steps": 61435, "total_steps": 67140, "loss": 0.5099, "lr": 1.0920391130961577e-06, "epoch": 9.150282990765565, "percentage": 91.5, "elapsed_time": "4:15:49", "remaining_time": "0:23:45", "throughput": 2308.97, "total_tokens": 35441384} {"current_steps": 61440, "total_steps": 67140, "loss": 0.5785, "lr": 1.0901401339449613e-06, "epoch": 9.151027703306523, "percentage": 91.51, "elapsed_time": "4:15:50", "remaining_time": "0:23:44", "throughput": 2308.97, "total_tokens": 35444008} {"current_steps": 61445, "total_steps": 67140, "loss": 0.817, "lr": 1.0882427705248832e-06, "epoch": 9.151772415847482, "percentage": 91.52, "elapsed_time": "4:15:51", "remaining_time": "0:23:42", "throughput": 2308.99, "total_tokens": 35446856} {"current_steps": 61450, "total_steps": 67140, "loss": 0.5414, "lr": 1.0863470229641403e-06, "epoch": 9.152517128388443, "percentage": 91.53, "elapsed_time": "4:15:52", "remaining_time": "0:23:41", "throughput": 2309.01, "total_tokens": 35449800} {"current_steps": 61455, "total_steps": 67140, "loss": 0.5262, "lr": 1.0844528913908414e-06, "epoch": 9.153261840929401, "percentage": 91.53, "elapsed_time": "4:15:53", "remaining_time": "0:23:40", "throughput": 2309.03, "total_tokens": 35452712} {"current_steps": 61460, "total_steps": 67140, "loss": 0.6263, "lr": 1.0825603759329866e-06, "epoch": 9.15400655347036, "percentage": 91.54, "elapsed_time": "4:15:55", "remaining_time": "0:23:39", "throughput": 2309.04, "total_tokens": 35455624} {"current_steps": 61465, "total_steps": 67140, "loss": 0.5129, "lr": 1.0806694767184545e-06, "epoch": 9.154751266011319, "percentage": 91.55, "elapsed_time": "4:15:56", "remaining_time": "0:23:37", "throughput": 2309.07, "total_tokens": 35458760} {"current_steps": 61470, "total_steps": 67140, "loss": 0.372, "lr": 1.0787801938750314e-06, "epoch": 9.15549597855228, "percentage": 91.55, "elapsed_time": "4:15:57", "remaining_time": "0:23:36", "throughput": 2309.09, "total_tokens": 35461576} {"current_steps": 61475, "total_steps": 67140, "loss": 0.5913, "lr": 1.0768925275303903e-06, "epoch": 9.156240691093238, "percentage": 91.56, "elapsed_time": "4:15:58", "remaining_time": "0:23:35", "throughput": 2309.11, "total_tokens": 35464552} {"current_steps": 61480, "total_steps": 67140, "loss": 0.4829, "lr": 1.0750064778120822e-06, "epoch": 9.156985403634197, "percentage": 91.57, "elapsed_time": "4:15:59", "remaining_time": "0:23:34", "throughput": 2309.13, "total_tokens": 35467560} {"current_steps": 61485, "total_steps": 67140, "loss": 0.8246, "lr": 1.073122044847566e-06, "epoch": 9.157730116175156, "percentage": 91.58, "elapsed_time": "4:16:00", "remaining_time": "0:23:32", "throughput": 2309.15, "total_tokens": 35470632} {"current_steps": 61490, "total_steps": 67140, "loss": 0.6749, "lr": 1.0712392287641842e-06, "epoch": 9.158474828716116, "percentage": 91.58, "elapsed_time": "4:16:02", "remaining_time": "0:23:31", "throughput": 2309.17, "total_tokens": 35473640} {"current_steps": 61495, "total_steps": 67140, "loss": 0.4549, "lr": 1.0693580296891686e-06, "epoch": 9.159219541257075, "percentage": 91.59, "elapsed_time": "4:16:03", "remaining_time": "0:23:30", "throughput": 2309.19, "total_tokens": 35476520} {"current_steps": 61500, "total_steps": 67140, "loss": 0.4265, "lr": 1.0674784477496396e-06, "epoch": 9.159964253798034, "percentage": 91.6, "elapsed_time": "4:16:04", "remaining_time": "0:23:29", "throughput": 2309.2, "total_tokens": 35479144} {"current_steps": 61505, "total_steps": 67140, "loss": 0.4114, "lr": 1.0656004830726153e-06, "epoch": 9.160708966338992, "percentage": 91.61, "elapsed_time": "4:16:05", "remaining_time": "0:23:27", "throughput": 2309.21, "total_tokens": 35481864} {"current_steps": 61510, "total_steps": 67140, "loss": 0.4029, "lr": 1.0637241357849993e-06, "epoch": 9.161453678879953, "percentage": 91.61, "elapsed_time": "4:16:06", "remaining_time": "0:23:26", "throughput": 2309.24, "total_tokens": 35484936} {"current_steps": 61515, "total_steps": 67140, "loss": 0.5622, "lr": 1.061849406013593e-06, "epoch": 9.162198391420912, "percentage": 91.62, "elapsed_time": "4:16:07", "remaining_time": "0:23:25", "throughput": 2309.25, "total_tokens": 35487880} {"current_steps": 61520, "total_steps": 67140, "loss": 0.4849, "lr": 1.059976293885076e-06, "epoch": 9.16294310396187, "percentage": 91.63, "elapsed_time": "4:16:08", "remaining_time": "0:23:23", "throughput": 2309.27, "total_tokens": 35490824} {"current_steps": 61525, "total_steps": 67140, "loss": 0.4317, "lr": 1.0581047995260246e-06, "epoch": 9.16368781650283, "percentage": 91.64, "elapsed_time": "4:16:09", "remaining_time": "0:23:22", "throughput": 2309.29, "total_tokens": 35493704} {"current_steps": 61530, "total_steps": 67140, "loss": 0.7865, "lr": 1.0562349230629154e-06, "epoch": 9.16443252904379, "percentage": 91.64, "elapsed_time": "4:16:11", "remaining_time": "0:23:21", "throughput": 2309.31, "total_tokens": 35496712} {"current_steps": 61535, "total_steps": 67140, "loss": 0.5503, "lr": 1.0543666646221002e-06, "epoch": 9.165177241584749, "percentage": 91.65, "elapsed_time": "4:16:12", "remaining_time": "0:23:20", "throughput": 2309.33, "total_tokens": 35499464} {"current_steps": 61540, "total_steps": 67140, "loss": 0.442, "lr": 1.0525000243298278e-06, "epoch": 9.165921954125707, "percentage": 91.66, "elapsed_time": "4:16:13", "remaining_time": "0:23:18", "throughput": 2309.34, "total_tokens": 35502216} {"current_steps": 61545, "total_steps": 67140, "loss": 0.4025, "lr": 1.050635002312239e-06, "epoch": 9.166666666666666, "percentage": 91.67, "elapsed_time": "4:16:14", "remaining_time": "0:23:17", "throughput": 2309.35, "total_tokens": 35504936} {"current_steps": 61550, "total_steps": 67140, "loss": 0.6444, "lr": 1.0487715986953695e-06, "epoch": 9.167411379207627, "percentage": 91.67, "elapsed_time": "4:16:15", "remaining_time": "0:23:16", "throughput": 2309.36, "total_tokens": 35507688} {"current_steps": 61555, "total_steps": 67140, "loss": 0.4941, "lr": 1.0469098136051375e-06, "epoch": 9.168156091748585, "percentage": 91.68, "elapsed_time": "4:16:16", "remaining_time": "0:23:15", "throughput": 2309.37, "total_tokens": 35510536} {"current_steps": 61560, "total_steps": 67140, "loss": 0.5535, "lr": 1.045049647167351e-06, "epoch": 9.168900804289544, "percentage": 91.69, "elapsed_time": "4:16:17", "remaining_time": "0:23:13", "throughput": 2309.39, "total_tokens": 35513352} {"current_steps": 61565, "total_steps": 67140, "loss": 0.6527, "lr": 1.0431910995077205e-06, "epoch": 9.169645516830503, "percentage": 91.7, "elapsed_time": "4:16:18", "remaining_time": "0:23:12", "throughput": 2309.41, "total_tokens": 35516392} {"current_steps": 61570, "total_steps": 67140, "loss": 0.6573, "lr": 1.0413341707518287e-06, "epoch": 9.170390229371463, "percentage": 91.7, "elapsed_time": "4:16:20", "remaining_time": "0:23:11", "throughput": 2309.43, "total_tokens": 35519240} {"current_steps": 61575, "total_steps": 67140, "loss": 0.3718, "lr": 1.039478861025167e-06, "epoch": 9.171134941912422, "percentage": 91.71, "elapsed_time": "4:16:21", "remaining_time": "0:23:10", "throughput": 2309.45, "total_tokens": 35522184} {"current_steps": 61580, "total_steps": 67140, "loss": 0.5007, "lr": 1.0376251704531049e-06, "epoch": 9.171879654453381, "percentage": 91.72, "elapsed_time": "4:16:22", "remaining_time": "0:23:08", "throughput": 2309.46, "total_tokens": 35524968} {"current_steps": 61585, "total_steps": 67140, "loss": 0.3004, "lr": 1.035773099160911e-06, "epoch": 9.17262436699434, "percentage": 91.73, "elapsed_time": "4:16:23", "remaining_time": "0:23:07", "throughput": 2309.49, "total_tokens": 35528136} {"current_steps": 61590, "total_steps": 67140, "loss": 0.539, "lr": 1.033922647273744e-06, "epoch": 9.1733690795353, "percentage": 91.73, "elapsed_time": "4:16:24", "remaining_time": "0:23:06", "throughput": 2309.5, "total_tokens": 35530856} {"current_steps": 61595, "total_steps": 67140, "loss": 0.6204, "lr": 1.0320738149166397e-06, "epoch": 9.174113792076259, "percentage": 91.74, "elapsed_time": "4:16:25", "remaining_time": "0:23:05", "throughput": 2309.52, "total_tokens": 35533640} {"current_steps": 61600, "total_steps": 67140, "loss": 0.7811, "lr": 1.0302266022145457e-06, "epoch": 9.174858504617218, "percentage": 91.75, "elapsed_time": "4:16:26", "remaining_time": "0:23:03", "throughput": 2309.52, "total_tokens": 35536232} {"current_steps": 61605, "total_steps": 67140, "loss": 0.7214, "lr": 1.0283810092922812e-06, "epoch": 9.175603217158177, "percentage": 91.76, "elapsed_time": "4:16:27", "remaining_time": "0:23:02", "throughput": 2309.52, "total_tokens": 35538696} {"current_steps": 61610, "total_steps": 67140, "loss": 0.4105, "lr": 1.0265370362745663e-06, "epoch": 9.176347929699135, "percentage": 91.76, "elapsed_time": "4:16:29", "remaining_time": "0:23:01", "throughput": 2309.54, "total_tokens": 35541608} {"current_steps": 61615, "total_steps": 67140, "loss": 0.6046, "lr": 1.0246946832860093e-06, "epoch": 9.177092642240096, "percentage": 91.77, "elapsed_time": "4:16:30", "remaining_time": "0:23:00", "throughput": 2309.57, "total_tokens": 35544840} {"current_steps": 61620, "total_steps": 67140, "loss": 0.8139, "lr": 1.0228539504511082e-06, "epoch": 9.177837354781055, "percentage": 91.78, "elapsed_time": "4:16:31", "remaining_time": "0:22:58", "throughput": 2309.59, "total_tokens": 35547752} {"current_steps": 61625, "total_steps": 67140, "loss": 0.5477, "lr": 1.0210148378942573e-06, "epoch": 9.178582067322013, "percentage": 91.79, "elapsed_time": "4:16:32", "remaining_time": "0:22:57", "throughput": 2309.61, "total_tokens": 35550600} {"current_steps": 61630, "total_steps": 67140, "loss": 0.3375, "lr": 1.0191773457397274e-06, "epoch": 9.179326779862972, "percentage": 91.79, "elapsed_time": "4:16:33", "remaining_time": "0:22:56", "throughput": 2309.64, "total_tokens": 35553800} {"current_steps": 61635, "total_steps": 67140, "loss": 0.4479, "lr": 1.0173414741116994e-06, "epoch": 9.180071492403933, "percentage": 91.8, "elapsed_time": "4:16:34", "remaining_time": "0:22:55", "throughput": 2309.66, "total_tokens": 35556776} {"current_steps": 61640, "total_steps": 67140, "loss": 0.5401, "lr": 1.015507223134224e-06, "epoch": 9.180816204944891, "percentage": 91.81, "elapsed_time": "4:16:35", "remaining_time": "0:22:53", "throughput": 2309.67, "total_tokens": 35559496} {"current_steps": 61645, "total_steps": 67140, "loss": 0.4916, "lr": 1.0136745929312546e-06, "epoch": 9.18156091748585, "percentage": 91.82, "elapsed_time": "4:16:37", "remaining_time": "0:22:52", "throughput": 2309.69, "total_tokens": 35562408} {"current_steps": 61650, "total_steps": 67140, "loss": 0.5346, "lr": 1.011843583626637e-06, "epoch": 9.182305630026809, "percentage": 91.82, "elapsed_time": "4:16:38", "remaining_time": "0:22:51", "throughput": 2309.71, "total_tokens": 35565416} {"current_steps": 61655, "total_steps": 67140, "loss": 0.6585, "lr": 1.010014195344103e-06, "epoch": 9.18305034256777, "percentage": 91.83, "elapsed_time": "4:16:39", "remaining_time": "0:22:49", "throughput": 2309.72, "total_tokens": 35568136} {"current_steps": 61660, "total_steps": 67140, "loss": 0.4611, "lr": 1.0081864282072722e-06, "epoch": 9.183795055108728, "percentage": 91.84, "elapsed_time": "4:16:40", "remaining_time": "0:22:48", "throughput": 2309.75, "total_tokens": 35571208} {"current_steps": 61665, "total_steps": 67140, "loss": 0.6557, "lr": 1.0063602823396578e-06, "epoch": 9.184539767649687, "percentage": 91.85, "elapsed_time": "4:16:41", "remaining_time": "0:22:47", "throughput": 2309.77, "total_tokens": 35574152} {"current_steps": 61670, "total_steps": 67140, "loss": 0.5176, "lr": 1.0045357578646664e-06, "epoch": 9.185284480190646, "percentage": 91.85, "elapsed_time": "4:16:42", "remaining_time": "0:22:46", "throughput": 2309.77, "total_tokens": 35576808} {"current_steps": 61675, "total_steps": 67140, "loss": 0.6185, "lr": 1.0027128549055881e-06, "epoch": 9.186029192731606, "percentage": 91.86, "elapsed_time": "4:16:43", "remaining_time": "0:22:44", "throughput": 2309.81, "total_tokens": 35580168} {"current_steps": 61680, "total_steps": 67140, "loss": 0.6613, "lr": 1.0008915735856134e-06, "epoch": 9.186773905272565, "percentage": 91.87, "elapsed_time": "4:16:45", "remaining_time": "0:22:43", "throughput": 2309.84, "total_tokens": 35583272} {"current_steps": 61685, "total_steps": 67140, "loss": 0.4956, "lr": 9.990719140278077e-07, "epoch": 9.187518617813524, "percentage": 91.88, "elapsed_time": "4:16:46", "remaining_time": "0:22:42", "throughput": 2309.85, "total_tokens": 35586120} {"current_steps": 61690, "total_steps": 67140, "loss": 0.5309, "lr": 9.972538763551448e-07, "epoch": 9.188263330354483, "percentage": 91.88, "elapsed_time": "4:16:47", "remaining_time": "0:22:41", "throughput": 2309.87, "total_tokens": 35589160} {"current_steps": 61695, "total_steps": 67140, "loss": 0.7577, "lr": 9.954374606904765e-07, "epoch": 9.189008042895443, "percentage": 91.89, "elapsed_time": "4:16:48", "remaining_time": "0:22:39", "throughput": 2309.88, "total_tokens": 35591912} {"current_steps": 61700, "total_steps": 67140, "loss": 0.616, "lr": 9.936226671565491e-07, "epoch": 9.189752755436402, "percentage": 91.9, "elapsed_time": "4:16:49", "remaining_time": "0:22:38", "throughput": 2309.89, "total_tokens": 35594664} {"current_steps": 61705, "total_steps": 67140, "loss": 0.459, "lr": 9.91809495875995e-07, "epoch": 9.19049746797736, "percentage": 91.9, "elapsed_time": "4:16:50", "remaining_time": "0:22:37", "throughput": 2309.91, "total_tokens": 35597576} {"current_steps": 61710, "total_steps": 67140, "loss": 0.6297, "lr": 9.899979469713494e-07, "epoch": 9.19124218051832, "percentage": 91.91, "elapsed_time": "4:16:52", "remaining_time": "0:22:36", "throughput": 2309.94, "total_tokens": 35600776} {"current_steps": 61715, "total_steps": 67140, "loss": 0.2641, "lr": 9.88188020565023e-07, "epoch": 9.19198689305928, "percentage": 91.92, "elapsed_time": "4:16:53", "remaining_time": "0:22:34", "throughput": 2309.95, "total_tokens": 35603656} {"current_steps": 61720, "total_steps": 67140, "loss": 0.3169, "lr": 9.863797167793286e-07, "epoch": 9.192731605600239, "percentage": 91.93, "elapsed_time": "4:16:54", "remaining_time": "0:22:33", "throughput": 2309.96, "total_tokens": 35606280} {"current_steps": 61725, "total_steps": 67140, "loss": 0.5639, "lr": 9.84573035736455e-07, "epoch": 9.193476318141197, "percentage": 91.93, "elapsed_time": "4:16:55", "remaining_time": "0:22:32", "throughput": 2309.97, "total_tokens": 35609064} {"current_steps": 61730, "total_steps": 67140, "loss": 0.5956, "lr": 9.827679775585019e-07, "epoch": 9.194221030682156, "percentage": 91.94, "elapsed_time": "4:16:56", "remaining_time": "0:22:31", "throughput": 2310.0, "total_tokens": 35612168} {"current_steps": 61735, "total_steps": 67140, "loss": 0.4776, "lr": 9.80964542367438e-07, "epoch": 9.194965743223117, "percentage": 91.95, "elapsed_time": "4:16:57", "remaining_time": "0:22:29", "throughput": 2310.01, "total_tokens": 35614984} {"current_steps": 61740, "total_steps": 67140, "loss": 0.5065, "lr": 9.79162730285138e-07, "epoch": 9.195710455764075, "percentage": 91.96, "elapsed_time": "4:16:58", "remaining_time": "0:22:28", "throughput": 2310.02, "total_tokens": 35617640} {"current_steps": 61745, "total_steps": 67140, "loss": 0.5824, "lr": 9.773625414333576e-07, "epoch": 9.196455168305034, "percentage": 91.96, "elapsed_time": "4:16:59", "remaining_time": "0:22:27", "throughput": 2310.04, "total_tokens": 35620616} {"current_steps": 61750, "total_steps": 67140, "loss": 0.5419, "lr": 9.755639759337466e-07, "epoch": 9.197199880845993, "percentage": 91.97, "elapsed_time": "4:17:01", "remaining_time": "0:22:26", "throughput": 2310.05, "total_tokens": 35623336} {"current_steps": 61755, "total_steps": 67140, "loss": 0.4193, "lr": 9.737670339078491e-07, "epoch": 9.197944593386953, "percentage": 91.98, "elapsed_time": "4:17:02", "remaining_time": "0:22:24", "throughput": 2310.07, "total_tokens": 35626248} {"current_steps": 61760, "total_steps": 67140, "loss": 0.5156, "lr": 9.719717154770908e-07, "epoch": 9.198689305927912, "percentage": 91.99, "elapsed_time": "4:17:03", "remaining_time": "0:22:23", "throughput": 2310.08, "total_tokens": 35629032} {"current_steps": 61765, "total_steps": 67140, "loss": 0.6978, "lr": 9.701780207627963e-07, "epoch": 9.199434018468871, "percentage": 91.99, "elapsed_time": "4:17:04", "remaining_time": "0:22:22", "throughput": 2310.11, "total_tokens": 35632104} {"current_steps": 61770, "total_steps": 67140, "loss": 0.5622, "lr": 9.683859498861691e-07, "epoch": 9.20017873100983, "percentage": 92.0, "elapsed_time": "4:17:05", "remaining_time": "0:22:21", "throughput": 2310.13, "total_tokens": 35635080} {"current_steps": 61775, "total_steps": 67140, "loss": 0.4637, "lr": 9.665955029683122e-07, "epoch": 9.200923443550789, "percentage": 92.01, "elapsed_time": "4:17:06", "remaining_time": "0:22:19", "throughput": 2310.15, "total_tokens": 35637960} {"current_steps": 61780, "total_steps": 67140, "loss": 0.7576, "lr": 9.648066801302202e-07, "epoch": 9.201668156091749, "percentage": 92.02, "elapsed_time": "4:17:07", "remaining_time": "0:22:18", "throughput": 2310.17, "total_tokens": 35641096} {"current_steps": 61785, "total_steps": 67140, "loss": 0.609, "lr": 9.630194814927718e-07, "epoch": 9.202412868632708, "percentage": 92.02, "elapsed_time": "4:17:09", "remaining_time": "0:22:17", "throughput": 2310.2, "total_tokens": 35644136} {"current_steps": 61790, "total_steps": 67140, "loss": 0.5237, "lr": 9.612339071767451e-07, "epoch": 9.203157581173667, "percentage": 92.03, "elapsed_time": "4:17:10", "remaining_time": "0:22:16", "throughput": 2310.22, "total_tokens": 35647176} {"current_steps": 61795, "total_steps": 67140, "loss": 0.423, "lr": 9.59449957302791e-07, "epoch": 9.203902293714625, "percentage": 92.04, "elapsed_time": "4:17:11", "remaining_time": "0:22:14", "throughput": 2310.23, "total_tokens": 35649928} {"current_steps": 61800, "total_steps": 67140, "loss": 0.6227, "lr": 9.576676319914713e-07, "epoch": 9.204647006255586, "percentage": 92.05, "elapsed_time": "4:17:12", "remaining_time": "0:22:13", "throughput": 2310.26, "total_tokens": 35652936} {"current_steps": 61805, "total_steps": 67140, "loss": 0.3585, "lr": 9.558869313632202e-07, "epoch": 9.205391718796545, "percentage": 92.05, "elapsed_time": "4:17:13", "remaining_time": "0:22:12", "throughput": 2310.28, "total_tokens": 35655912} {"current_steps": 61810, "total_steps": 67140, "loss": 0.4314, "lr": 9.541078555383747e-07, "epoch": 9.206136431337503, "percentage": 92.06, "elapsed_time": "4:17:14", "remaining_time": "0:22:10", "throughput": 2310.29, "total_tokens": 35658632} {"current_steps": 61815, "total_steps": 67140, "loss": 0.6061, "lr": 9.523304046371556e-07, "epoch": 9.206881143878462, "percentage": 92.07, "elapsed_time": "4:17:15", "remaining_time": "0:22:09", "throughput": 2310.3, "total_tokens": 35661384} {"current_steps": 61820, "total_steps": 67140, "loss": 0.4805, "lr": 9.505545787796777e-07, "epoch": 9.207625856419423, "percentage": 92.08, "elapsed_time": "4:17:16", "remaining_time": "0:22:08", "throughput": 2310.31, "total_tokens": 35664200} {"current_steps": 61825, "total_steps": 67140, "loss": 0.5145, "lr": 9.48780378085945e-07, "epoch": 9.208370568960381, "percentage": 92.08, "elapsed_time": "4:17:18", "remaining_time": "0:22:07", "throughput": 2310.33, "total_tokens": 35667048} {"current_steps": 61830, "total_steps": 67140, "loss": 0.5813, "lr": 9.470078026758477e-07, "epoch": 9.20911528150134, "percentage": 92.09, "elapsed_time": "4:17:19", "remaining_time": "0:22:05", "throughput": 2310.35, "total_tokens": 35670088} {"current_steps": 61835, "total_steps": 67140, "loss": 0.4368, "lr": 9.452368526691735e-07, "epoch": 9.209859994042299, "percentage": 92.1, "elapsed_time": "4:17:20", "remaining_time": "0:22:04", "throughput": 2310.36, "total_tokens": 35672744} {"current_steps": 61840, "total_steps": 67140, "loss": 0.4926, "lr": 9.434675281855932e-07, "epoch": 9.21060470658326, "percentage": 92.11, "elapsed_time": "4:17:21", "remaining_time": "0:22:03", "throughput": 2310.37, "total_tokens": 35675592} {"current_steps": 61845, "total_steps": 67140, "loss": 0.3611, "lr": 9.416998293446666e-07, "epoch": 9.211349419124218, "percentage": 92.11, "elapsed_time": "4:17:22", "remaining_time": "0:22:02", "throughput": 2310.37, "total_tokens": 35678088} {"current_steps": 61850, "total_steps": 67140, "loss": 0.4071, "lr": 9.399337562658539e-07, "epoch": 9.212094131665177, "percentage": 92.12, "elapsed_time": "4:17:23", "remaining_time": "0:22:00", "throughput": 2310.39, "total_tokens": 35680840} {"current_steps": 61855, "total_steps": 67140, "loss": 0.5636, "lr": 9.381693090684957e-07, "epoch": 9.212838844206136, "percentage": 92.13, "elapsed_time": "4:17:24", "remaining_time": "0:21:59", "throughput": 2310.4, "total_tokens": 35683752} {"current_steps": 61860, "total_steps": 67140, "loss": 0.4944, "lr": 9.364064878718298e-07, "epoch": 9.213583556747096, "percentage": 92.14, "elapsed_time": "4:17:25", "remaining_time": "0:21:58", "throughput": 2310.42, "total_tokens": 35686568} {"current_steps": 61865, "total_steps": 67140, "loss": 0.7263, "lr": 9.346452927949778e-07, "epoch": 9.214328269288055, "percentage": 92.14, "elapsed_time": "4:17:27", "remaining_time": "0:21:57", "throughput": 2310.43, "total_tokens": 35689320} {"current_steps": 61870, "total_steps": 67140, "loss": 0.6056, "lr": 9.328857239569527e-07, "epoch": 9.215072981829014, "percentage": 92.15, "elapsed_time": "4:17:28", "remaining_time": "0:21:55", "throughput": 2310.44, "total_tokens": 35692200} {"current_steps": 61875, "total_steps": 67140, "loss": 0.4737, "lr": 9.311277814766595e-07, "epoch": 9.215817694369973, "percentage": 92.16, "elapsed_time": "4:17:29", "remaining_time": "0:21:54", "throughput": 2310.45, "total_tokens": 35694888} {"current_steps": 61880, "total_steps": 67140, "loss": 0.5923, "lr": 9.293714654728974e-07, "epoch": 9.216562406910933, "percentage": 92.17, "elapsed_time": "4:17:30", "remaining_time": "0:21:53", "throughput": 2310.48, "total_tokens": 35698024} {"current_steps": 61885, "total_steps": 67140, "loss": 0.549, "lr": 9.276167760643439e-07, "epoch": 9.217307119451892, "percentage": 92.17, "elapsed_time": "4:17:31", "remaining_time": "0:21:52", "throughput": 2310.49, "total_tokens": 35700744} {"current_steps": 61890, "total_steps": 67140, "loss": 0.5796, "lr": 9.258637133695791e-07, "epoch": 9.21805183199285, "percentage": 92.18, "elapsed_time": "4:17:32", "remaining_time": "0:21:50", "throughput": 2310.52, "total_tokens": 35703752} {"current_steps": 61895, "total_steps": 67140, "loss": 0.5582, "lr": 9.241122775070693e-07, "epoch": 9.21879654453381, "percentage": 92.19, "elapsed_time": "4:17:33", "remaining_time": "0:21:49", "throughput": 2310.52, "total_tokens": 35706440} {"current_steps": 61900, "total_steps": 67140, "loss": 0.6201, "lr": 9.223624685951615e-07, "epoch": 9.21954125707477, "percentage": 92.2, "elapsed_time": "4:17:34", "remaining_time": "0:21:48", "throughput": 2310.54, "total_tokens": 35709352} {"current_steps": 61905, "total_steps": 67140, "loss": 0.6018, "lr": 9.206142867521084e-07, "epoch": 9.220285969615729, "percentage": 92.2, "elapsed_time": "4:17:36", "remaining_time": "0:21:47", "throughput": 2310.57, "total_tokens": 35712456} {"current_steps": 61910, "total_steps": 67140, "loss": 0.5022, "lr": 9.188677320960404e-07, "epoch": 9.221030682156687, "percentage": 92.21, "elapsed_time": "4:17:37", "remaining_time": "0:21:45", "throughput": 2310.58, "total_tokens": 35715336} {"current_steps": 61915, "total_steps": 67140, "loss": 0.5993, "lr": 9.171228047449825e-07, "epoch": 9.221775394697646, "percentage": 92.22, "elapsed_time": "4:17:38", "remaining_time": "0:21:44", "throughput": 2310.59, "total_tokens": 35718152} {"current_steps": 61920, "total_steps": 67140, "loss": 0.7143, "lr": 9.153795048168573e-07, "epoch": 9.222520107238607, "percentage": 92.23, "elapsed_time": "4:17:39", "remaining_time": "0:21:43", "throughput": 2310.6, "total_tokens": 35720808} {"current_steps": 61925, "total_steps": 67140, "loss": 0.6665, "lr": 9.136378324294592e-07, "epoch": 9.223264819779565, "percentage": 92.23, "elapsed_time": "4:17:40", "remaining_time": "0:21:42", "throughput": 2310.62, "total_tokens": 35723592} {"current_steps": 61930, "total_steps": 67140, "loss": 0.5746, "lr": 9.118977877004942e-07, "epoch": 9.224009532320524, "percentage": 92.24, "elapsed_time": "4:17:41", "remaining_time": "0:21:40", "throughput": 2310.63, "total_tokens": 35726472} {"current_steps": 61935, "total_steps": 67140, "loss": 0.4253, "lr": 9.101593707475376e-07, "epoch": 9.224754244861483, "percentage": 92.25, "elapsed_time": "4:17:42", "remaining_time": "0:21:39", "throughput": 2310.64, "total_tokens": 35729192} {"current_steps": 61940, "total_steps": 67140, "loss": 0.5418, "lr": 9.084225816880677e-07, "epoch": 9.225498957402444, "percentage": 92.25, "elapsed_time": "4:17:44", "remaining_time": "0:21:38", "throughput": 2310.67, "total_tokens": 35732264} {"current_steps": 61945, "total_steps": 67140, "loss": 0.5934, "lr": 9.066874206394488e-07, "epoch": 9.226243669943402, "percentage": 92.26, "elapsed_time": "4:17:45", "remaining_time": "0:21:36", "throughput": 2310.68, "total_tokens": 35735112} {"current_steps": 61950, "total_steps": 67140, "loss": 0.5442, "lr": 9.049538877189401e-07, "epoch": 9.226988382484361, "percentage": 92.27, "elapsed_time": "4:17:46", "remaining_time": "0:21:35", "throughput": 2310.7, "total_tokens": 35738024} {"current_steps": 61955, "total_steps": 67140, "loss": 0.6954, "lr": 9.032219830436867e-07, "epoch": 9.22773309502532, "percentage": 92.28, "elapsed_time": "4:17:47", "remaining_time": "0:21:34", "throughput": 2310.72, "total_tokens": 35740840} {"current_steps": 61960, "total_steps": 67140, "loss": 0.6035, "lr": 9.014917067307227e-07, "epoch": 9.228477807566279, "percentage": 92.28, "elapsed_time": "4:17:48", "remaining_time": "0:21:33", "throughput": 2310.73, "total_tokens": 35743752} {"current_steps": 61965, "total_steps": 67140, "loss": 0.4694, "lr": 8.997630588969686e-07, "epoch": 9.229222520107239, "percentage": 92.29, "elapsed_time": "4:17:49", "remaining_time": "0:21:31", "throughput": 2310.76, "total_tokens": 35746856} {"current_steps": 61970, "total_steps": 67140, "loss": 0.3353, "lr": 8.980360396592419e-07, "epoch": 9.229967232648198, "percentage": 92.3, "elapsed_time": "4:17:50", "remaining_time": "0:21:30", "throughput": 2310.8, "total_tokens": 35750184} {"current_steps": 61975, "total_steps": 67140, "loss": 0.5308, "lr": 8.963106491342466e-07, "epoch": 9.230711945189157, "percentage": 92.31, "elapsed_time": "4:17:52", "remaining_time": "0:21:29", "throughput": 2310.81, "total_tokens": 35752936} {"current_steps": 61980, "total_steps": 67140, "loss": 0.6677, "lr": 8.94586887438581e-07, "epoch": 9.231456657730115, "percentage": 92.31, "elapsed_time": "4:17:53", "remaining_time": "0:21:28", "throughput": 2310.82, "total_tokens": 35755720} {"current_steps": 61985, "total_steps": 67140, "loss": 0.5916, "lr": 8.928647546887269e-07, "epoch": 9.232201370271076, "percentage": 92.32, "elapsed_time": "4:17:54", "remaining_time": "0:21:26", "throughput": 2310.84, "total_tokens": 35758632} {"current_steps": 61990, "total_steps": 67140, "loss": 0.6052, "lr": 8.911442510010637e-07, "epoch": 9.232946082812035, "percentage": 92.33, "elapsed_time": "4:17:55", "remaining_time": "0:21:25", "throughput": 2310.85, "total_tokens": 35761288} {"current_steps": 61995, "total_steps": 67140, "loss": 0.6485, "lr": 8.894253764918509e-07, "epoch": 9.233690795352993, "percentage": 92.34, "elapsed_time": "4:17:56", "remaining_time": "0:21:24", "throughput": 2310.86, "total_tokens": 35764040} {"current_steps": 62000, "total_steps": 67140, "loss": 0.5716, "lr": 8.877081312772456e-07, "epoch": 9.234435507893952, "percentage": 92.34, "elapsed_time": "4:17:57", "remaining_time": "0:21:23", "throughput": 2310.88, "total_tokens": 35766920} {"current_steps": 62005, "total_steps": 67140, "loss": 0.613, "lr": 8.859925154732885e-07, "epoch": 9.235180220434913, "percentage": 92.35, "elapsed_time": "4:17:58", "remaining_time": "0:21:21", "throughput": 2310.9, "total_tokens": 35770024} {"current_steps": 62010, "total_steps": 67140, "loss": 0.6907, "lr": 8.842785291959199e-07, "epoch": 9.235924932975871, "percentage": 92.36, "elapsed_time": "4:17:59", "remaining_time": "0:21:20", "throughput": 2310.91, "total_tokens": 35772776} {"current_steps": 62015, "total_steps": 67140, "loss": 0.717, "lr": 8.825661725609585e-07, "epoch": 9.23666964551683, "percentage": 92.37, "elapsed_time": "4:18:01", "remaining_time": "0:21:19", "throughput": 2310.93, "total_tokens": 35775528} {"current_steps": 62020, "total_steps": 67140, "loss": 0.6404, "lr": 8.808554456841201e-07, "epoch": 9.237414358057789, "percentage": 92.37, "elapsed_time": "4:18:02", "remaining_time": "0:21:18", "throughput": 2310.95, "total_tokens": 35778632} {"current_steps": 62025, "total_steps": 67140, "loss": 0.5922, "lr": 8.79146348681012e-07, "epoch": 9.23815907059875, "percentage": 92.38, "elapsed_time": "4:18:03", "remaining_time": "0:21:16", "throughput": 2310.96, "total_tokens": 35781416} {"current_steps": 62030, "total_steps": 67140, "loss": 0.6023, "lr": 8.774388816671253e-07, "epoch": 9.238903783139708, "percentage": 92.39, "elapsed_time": "4:18:04", "remaining_time": "0:21:15", "throughput": 2310.97, "total_tokens": 35784136} {"current_steps": 62035, "total_steps": 67140, "loss": 0.692, "lr": 8.757330447578399e-07, "epoch": 9.239648495680667, "percentage": 92.4, "elapsed_time": "4:18:05", "remaining_time": "0:21:14", "throughput": 2310.99, "total_tokens": 35787112} {"current_steps": 62040, "total_steps": 67140, "loss": 0.5854, "lr": 8.740288380684386e-07, "epoch": 9.240393208221626, "percentage": 92.4, "elapsed_time": "4:18:06", "remaining_time": "0:21:13", "throughput": 2311.02, "total_tokens": 35790312} {"current_steps": 62045, "total_steps": 67140, "loss": 0.7117, "lr": 8.723262617140765e-07, "epoch": 9.241137920762586, "percentage": 92.41, "elapsed_time": "4:18:07", "remaining_time": "0:21:11", "throughput": 2311.03, "total_tokens": 35793032} {"current_steps": 62050, "total_steps": 67140, "loss": 0.6413, "lr": 8.706253158098088e-07, "epoch": 9.241882633303545, "percentage": 92.42, "elapsed_time": "4:18:08", "remaining_time": "0:21:10", "throughput": 2311.04, "total_tokens": 35795688} {"current_steps": 62055, "total_steps": 67140, "loss": 0.4765, "lr": 8.689260004705823e-07, "epoch": 9.242627345844504, "percentage": 92.43, "elapsed_time": "4:18:10", "remaining_time": "0:21:09", "throughput": 2311.07, "total_tokens": 35798888} {"current_steps": 62060, "total_steps": 67140, "loss": 0.4968, "lr": 8.672283158112249e-07, "epoch": 9.243372058385463, "percentage": 92.43, "elapsed_time": "4:18:11", "remaining_time": "0:21:08", "throughput": 2311.08, "total_tokens": 35801544} {"current_steps": 62065, "total_steps": 67140, "loss": 0.7369, "lr": 8.655322619464612e-07, "epoch": 9.244116770926423, "percentage": 92.44, "elapsed_time": "4:18:12", "remaining_time": "0:21:06", "throughput": 2311.09, "total_tokens": 35804424} {"current_steps": 62070, "total_steps": 67140, "loss": 0.5115, "lr": 8.638378389909052e-07, "epoch": 9.244861483467382, "percentage": 92.45, "elapsed_time": "4:18:13", "remaining_time": "0:21:05", "throughput": 2311.13, "total_tokens": 35807752} {"current_steps": 62075, "total_steps": 67140, "loss": 0.4687, "lr": 8.621450470590542e-07, "epoch": 9.24560619600834, "percentage": 92.46, "elapsed_time": "4:18:14", "remaining_time": "0:21:04", "throughput": 2311.14, "total_tokens": 35810632} {"current_steps": 62080, "total_steps": 67140, "loss": 0.4537, "lr": 8.604538862653084e-07, "epoch": 9.2463509085493, "percentage": 92.46, "elapsed_time": "4:18:15", "remaining_time": "0:21:03", "throughput": 2311.15, "total_tokens": 35813384} {"current_steps": 62085, "total_steps": 67140, "loss": 0.5282, "lr": 8.5876435672394e-07, "epoch": 9.24709562109026, "percentage": 92.47, "elapsed_time": "4:18:17", "remaining_time": "0:21:01", "throughput": 2311.17, "total_tokens": 35816168} {"current_steps": 62090, "total_steps": 67140, "loss": 0.4257, "lr": 8.570764585491275e-07, "epoch": 9.247840333631219, "percentage": 92.48, "elapsed_time": "4:18:18", "remaining_time": "0:21:00", "throughput": 2311.19, "total_tokens": 35819112} {"current_steps": 62095, "total_steps": 67140, "loss": 0.4739, "lr": 8.553901918549323e-07, "epoch": 9.248585046172177, "percentage": 92.49, "elapsed_time": "4:18:19", "remaining_time": "0:20:59", "throughput": 2311.2, "total_tokens": 35821992} {"current_steps": 62100, "total_steps": 67140, "loss": 0.5143, "lr": 8.537055567552993e-07, "epoch": 9.249329758713136, "percentage": 92.49, "elapsed_time": "4:18:20", "remaining_time": "0:20:58", "throughput": 2311.22, "total_tokens": 35824904} {"current_steps": 62105, "total_steps": 67140, "loss": 0.5846, "lr": 8.520225533640735e-07, "epoch": 9.250074471254097, "percentage": 92.5, "elapsed_time": "4:18:21", "remaining_time": "0:20:56", "throughput": 2311.24, "total_tokens": 35827784} {"current_steps": 62110, "total_steps": 67140, "loss": 0.4419, "lr": 8.503411817949863e-07, "epoch": 9.250819183795056, "percentage": 92.51, "elapsed_time": "4:18:22", "remaining_time": "0:20:55", "throughput": 2311.25, "total_tokens": 35830664} {"current_steps": 62115, "total_steps": 67140, "loss": 0.8084, "lr": 8.486614421616551e-07, "epoch": 9.251563896336014, "percentage": 92.52, "elapsed_time": "4:18:23", "remaining_time": "0:20:54", "throughput": 2311.27, "total_tokens": 35833544} {"current_steps": 62120, "total_steps": 67140, "loss": 0.7066, "lr": 8.469833345775946e-07, "epoch": 9.252308608876973, "percentage": 92.52, "elapsed_time": "4:18:24", "remaining_time": "0:20:52", "throughput": 2311.28, "total_tokens": 35836264} {"current_steps": 62125, "total_steps": 67140, "loss": 0.5957, "lr": 8.453068591562003e-07, "epoch": 9.253053321417934, "percentage": 92.53, "elapsed_time": "4:18:26", "remaining_time": "0:20:51", "throughput": 2311.29, "total_tokens": 35839080} {"current_steps": 62130, "total_steps": 67140, "loss": 0.7597, "lr": 8.436320160107619e-07, "epoch": 9.253798033958892, "percentage": 92.54, "elapsed_time": "4:18:27", "remaining_time": "0:20:50", "throughput": 2311.3, "total_tokens": 35841832} {"current_steps": 62135, "total_steps": 67140, "loss": 0.6112, "lr": 8.419588052544586e-07, "epoch": 9.254542746499851, "percentage": 92.55, "elapsed_time": "4:18:28", "remaining_time": "0:20:49", "throughput": 2311.31, "total_tokens": 35844520} {"current_steps": 62140, "total_steps": 67140, "loss": 0.6309, "lr": 8.402872270003582e-07, "epoch": 9.25528745904081, "percentage": 92.55, "elapsed_time": "4:18:29", "remaining_time": "0:20:47", "throughput": 2311.33, "total_tokens": 35847400} {"current_steps": 62145, "total_steps": 67140, "loss": 0.607, "lr": 8.386172813614229e-07, "epoch": 9.256032171581769, "percentage": 92.56, "elapsed_time": "4:18:30", "remaining_time": "0:20:46", "throughput": 2311.34, "total_tokens": 35850184} {"current_steps": 62150, "total_steps": 67140, "loss": 0.6525, "lr": 8.369489684504961e-07, "epoch": 9.25677688412273, "percentage": 92.57, "elapsed_time": "4:18:31", "remaining_time": "0:20:45", "throughput": 2311.37, "total_tokens": 35853256} {"current_steps": 62155, "total_steps": 67140, "loss": 0.6186, "lr": 8.352822883803235e-07, "epoch": 9.257521596663688, "percentage": 92.58, "elapsed_time": "4:18:32", "remaining_time": "0:20:44", "throughput": 2311.38, "total_tokens": 35856104} {"current_steps": 62160, "total_steps": 67140, "loss": 0.4633, "lr": 8.336172412635263e-07, "epoch": 9.258266309204647, "percentage": 92.58, "elapsed_time": "4:18:33", "remaining_time": "0:20:42", "throughput": 2311.38, "total_tokens": 35858664} {"current_steps": 62165, "total_steps": 67140, "loss": 0.7699, "lr": 8.319538272126198e-07, "epoch": 9.259011021745605, "percentage": 92.59, "elapsed_time": "4:18:35", "remaining_time": "0:20:41", "throughput": 2311.4, "total_tokens": 35861512} {"current_steps": 62170, "total_steps": 67140, "loss": 0.5172, "lr": 8.302920463400143e-07, "epoch": 9.259755734286566, "percentage": 92.6, "elapsed_time": "4:18:36", "remaining_time": "0:20:40", "throughput": 2311.42, "total_tokens": 35864328} {"current_steps": 62175, "total_steps": 67140, "loss": 0.5373, "lr": 8.286318987580061e-07, "epoch": 9.260500446827525, "percentage": 92.61, "elapsed_time": "4:18:37", "remaining_time": "0:20:39", "throughput": 2311.43, "total_tokens": 35867144} {"current_steps": 62180, "total_steps": 67140, "loss": 0.5115, "lr": 8.269733845787775e-07, "epoch": 9.261245159368483, "percentage": 92.61, "elapsed_time": "4:18:38", "remaining_time": "0:20:37", "throughput": 2311.45, "total_tokens": 35870056} {"current_steps": 62185, "total_steps": 67140, "loss": 0.6282, "lr": 8.253165039144111e-07, "epoch": 9.261989871909442, "percentage": 92.62, "elapsed_time": "4:18:39", "remaining_time": "0:20:36", "throughput": 2311.47, "total_tokens": 35873000} {"current_steps": 62190, "total_steps": 67140, "loss": 0.6288, "lr": 8.236612568768676e-07, "epoch": 9.262734584450403, "percentage": 92.63, "elapsed_time": "4:18:40", "remaining_time": "0:20:35", "throughput": 2311.49, "total_tokens": 35875976} {"current_steps": 62195, "total_steps": 67140, "loss": 0.6318, "lr": 8.220076435780016e-07, "epoch": 9.263479296991362, "percentage": 92.63, "elapsed_time": "4:18:41", "remaining_time": "0:20:34", "throughput": 2311.5, "total_tokens": 35878696} {"current_steps": 62200, "total_steps": 67140, "loss": 0.6212, "lr": 8.203556641295601e-07, "epoch": 9.26422400953232, "percentage": 92.64, "elapsed_time": "4:18:43", "remaining_time": "0:20:32", "throughput": 2311.52, "total_tokens": 35881800} {"current_steps": 62205, "total_steps": 67140, "loss": 0.6018, "lr": 8.187053186431731e-07, "epoch": 9.264968722073279, "percentage": 92.65, "elapsed_time": "4:18:44", "remaining_time": "0:20:31", "throughput": 2311.56, "total_tokens": 35885160} {"current_steps": 62210, "total_steps": 67140, "loss": 0.5694, "lr": 8.170566072303681e-07, "epoch": 9.26571343461424, "percentage": 92.66, "elapsed_time": "4:18:45", "remaining_time": "0:20:30", "throughput": 2311.58, "total_tokens": 35888008} {"current_steps": 62215, "total_steps": 67140, "loss": 0.4628, "lr": 8.15409530002556e-07, "epoch": 9.266458147155198, "percentage": 92.66, "elapsed_time": "4:18:46", "remaining_time": "0:20:29", "throughput": 2311.6, "total_tokens": 35891112} {"current_steps": 62220, "total_steps": 67140, "loss": 0.6374, "lr": 8.137640870710395e-07, "epoch": 9.267202859696157, "percentage": 92.67, "elapsed_time": "4:18:47", "remaining_time": "0:20:27", "throughput": 2311.61, "total_tokens": 35893768} {"current_steps": 62225, "total_steps": 67140, "loss": 0.6369, "lr": 8.121202785470156e-07, "epoch": 9.267947572237116, "percentage": 92.68, "elapsed_time": "4:18:48", "remaining_time": "0:20:26", "throughput": 2311.62, "total_tokens": 35896616} {"current_steps": 62230, "total_steps": 67140, "loss": 0.4074, "lr": 8.104781045415594e-07, "epoch": 9.268692284778076, "percentage": 92.69, "elapsed_time": "4:18:49", "remaining_time": "0:20:25", "throughput": 2311.64, "total_tokens": 35899400} {"current_steps": 62235, "total_steps": 67140, "loss": 0.4642, "lr": 8.08837565165646e-07, "epoch": 9.269436997319035, "percentage": 92.69, "elapsed_time": "4:18:51", "remaining_time": "0:20:24", "throughput": 2311.65, "total_tokens": 35902312} {"current_steps": 62240, "total_steps": 67140, "loss": 0.6055, "lr": 8.071986605301396e-07, "epoch": 9.270181709859994, "percentage": 92.7, "elapsed_time": "4:18:52", "remaining_time": "0:20:22", "throughput": 2311.68, "total_tokens": 35905448} {"current_steps": 62245, "total_steps": 67140, "loss": 0.4472, "lr": 8.055613907457821e-07, "epoch": 9.270926422400953, "percentage": 92.71, "elapsed_time": "4:18:53", "remaining_time": "0:20:21", "throughput": 2311.71, "total_tokens": 35908680} {"current_steps": 62250, "total_steps": 67140, "loss": 0.5838, "lr": 8.039257559232182e-07, "epoch": 9.271671134941913, "percentage": 92.72, "elapsed_time": "4:18:54", "remaining_time": "0:20:20", "throughput": 2311.73, "total_tokens": 35911688} {"current_steps": 62255, "total_steps": 67140, "loss": 0.612, "lr": 8.022917561729793e-07, "epoch": 9.272415847482872, "percentage": 92.72, "elapsed_time": "4:18:55", "remaining_time": "0:20:19", "throughput": 2311.75, "total_tokens": 35914536} {"current_steps": 62260, "total_steps": 67140, "loss": 0.4488, "lr": 8.00659391605485e-07, "epoch": 9.27316056002383, "percentage": 92.73, "elapsed_time": "4:18:56", "remaining_time": "0:20:17", "throughput": 2311.77, "total_tokens": 35917576} {"current_steps": 62265, "total_steps": 67140, "loss": 0.5044, "lr": 7.990286623310389e-07, "epoch": 9.27390527256479, "percentage": 92.74, "elapsed_time": "4:18:57", "remaining_time": "0:20:16", "throughput": 2311.78, "total_tokens": 35920296} {"current_steps": 62270, "total_steps": 67140, "loss": 0.6314, "lr": 7.973995684598418e-07, "epoch": 9.27464998510575, "percentage": 92.75, "elapsed_time": "4:18:59", "remaining_time": "0:20:15", "throughput": 2311.79, "total_tokens": 35923112} {"current_steps": 62275, "total_steps": 67140, "loss": 0.5372, "lr": 7.957721101019805e-07, "epoch": 9.275394697646709, "percentage": 92.75, "elapsed_time": "4:19:00", "remaining_time": "0:20:14", "throughput": 2311.82, "total_tokens": 35926248} {"current_steps": 62280, "total_steps": 67140, "loss": 0.599, "lr": 7.941462873674338e-07, "epoch": 9.276139410187668, "percentage": 92.76, "elapsed_time": "4:19:01", "remaining_time": "0:20:12", "throughput": 2311.84, "total_tokens": 35929256} {"current_steps": 62285, "total_steps": 67140, "loss": 0.4746, "lr": 7.925221003660694e-07, "epoch": 9.276884122728626, "percentage": 92.77, "elapsed_time": "4:19:02", "remaining_time": "0:20:11", "throughput": 2311.84, "total_tokens": 35931784} {"current_steps": 62290, "total_steps": 67140, "loss": 0.5058, "lr": 7.90899549207641e-07, "epoch": 9.277628835269585, "percentage": 92.78, "elapsed_time": "4:19:03", "remaining_time": "0:20:10", "throughput": 2311.86, "total_tokens": 35934696} {"current_steps": 62295, "total_steps": 67140, "loss": 0.4586, "lr": 7.892786340017916e-07, "epoch": 9.278373547810546, "percentage": 92.78, "elapsed_time": "4:19:04", "remaining_time": "0:20:08", "throughput": 2311.87, "total_tokens": 35937512} {"current_steps": 62300, "total_steps": 67140, "loss": 0.7586, "lr": 7.876593548580585e-07, "epoch": 9.279118260351504, "percentage": 92.79, "elapsed_time": "4:19:05", "remaining_time": "0:20:07", "throughput": 2311.89, "total_tokens": 35940392} {"current_steps": 62305, "total_steps": 67140, "loss": 0.5596, "lr": 7.860417118858654e-07, "epoch": 9.279862972892463, "percentage": 92.8, "elapsed_time": "4:19:07", "remaining_time": "0:20:06", "throughput": 2311.9, "total_tokens": 35943240} {"current_steps": 62310, "total_steps": 67140, "loss": 0.5183, "lr": 7.844257051945275e-07, "epoch": 9.280607685433422, "percentage": 92.81, "elapsed_time": "4:19:08", "remaining_time": "0:20:05", "throughput": 2311.93, "total_tokens": 35946280} {"current_steps": 62315, "total_steps": 67140, "loss": 0.5901, "lr": 7.828113348932464e-07, "epoch": 9.281352397974382, "percentage": 92.81, "elapsed_time": "4:19:09", "remaining_time": "0:20:03", "throughput": 2311.94, "total_tokens": 35948936} {"current_steps": 62320, "total_steps": 67140, "loss": 0.5103, "lr": 7.811986010911182e-07, "epoch": 9.282097110515341, "percentage": 92.82, "elapsed_time": "4:19:10", "remaining_time": "0:20:02", "throughput": 2311.97, "total_tokens": 35952392} {"current_steps": 62325, "total_steps": 67140, "loss": 0.4427, "lr": 7.795875038971223e-07, "epoch": 9.2828418230563, "percentage": 92.83, "elapsed_time": "4:19:11", "remaining_time": "0:20:01", "throughput": 2311.98, "total_tokens": 35955112} {"current_steps": 62330, "total_steps": 67140, "loss": 0.5382, "lr": 7.779780434201273e-07, "epoch": 9.283586535597259, "percentage": 92.84, "elapsed_time": "4:19:12", "remaining_time": "0:20:00", "throughput": 2312.0, "total_tokens": 35957928} {"current_steps": 62335, "total_steps": 67140, "loss": 0.5175, "lr": 7.76370219768896e-07, "epoch": 9.28433124813822, "percentage": 92.84, "elapsed_time": "4:19:13", "remaining_time": "0:19:58", "throughput": 2312.03, "total_tokens": 35961032} {"current_steps": 62340, "total_steps": 67140, "loss": 0.4535, "lr": 7.747640330520805e-07, "epoch": 9.285075960679178, "percentage": 92.85, "elapsed_time": "4:19:15", "remaining_time": "0:19:57", "throughput": 2312.05, "total_tokens": 35964040} {"current_steps": 62345, "total_steps": 67140, "loss": 0.429, "lr": 7.731594833782191e-07, "epoch": 9.285820673220137, "percentage": 92.86, "elapsed_time": "4:19:16", "remaining_time": "0:19:56", "throughput": 2312.05, "total_tokens": 35966696} {"current_steps": 62350, "total_steps": 67140, "loss": 0.3777, "lr": 7.715565708557387e-07, "epoch": 9.286565385761095, "percentage": 92.87, "elapsed_time": "4:19:17", "remaining_time": "0:19:55", "throughput": 2312.07, "total_tokens": 35969480} {"current_steps": 62355, "total_steps": 67140, "loss": 0.7001, "lr": 7.69955295592964e-07, "epoch": 9.287310098302056, "percentage": 92.87, "elapsed_time": "4:19:18", "remaining_time": "0:19:53", "throughput": 2312.08, "total_tokens": 35972296} {"current_steps": 62360, "total_steps": 67140, "loss": 0.4779, "lr": 7.683556576980944e-07, "epoch": 9.288054810843015, "percentage": 92.88, "elapsed_time": "4:19:19", "remaining_time": "0:19:52", "throughput": 2312.1, "total_tokens": 35975144} {"current_steps": 62365, "total_steps": 67140, "loss": 0.6264, "lr": 7.667576572792323e-07, "epoch": 9.288799523383974, "percentage": 92.89, "elapsed_time": "4:19:20", "remaining_time": "0:19:51", "throughput": 2312.11, "total_tokens": 35977896} {"current_steps": 62370, "total_steps": 67140, "loss": 0.4331, "lr": 7.651612944443609e-07, "epoch": 9.289544235924932, "percentage": 92.9, "elapsed_time": "4:19:21", "remaining_time": "0:19:50", "throughput": 2312.12, "total_tokens": 35980712} {"current_steps": 62375, "total_steps": 67140, "loss": 0.666, "lr": 7.635665693013577e-07, "epoch": 9.290288948465893, "percentage": 92.9, "elapsed_time": "4:19:22", "remaining_time": "0:19:48", "throughput": 2312.13, "total_tokens": 35983496} {"current_steps": 62380, "total_steps": 67140, "loss": 0.5153, "lr": 7.619734819579893e-07, "epoch": 9.291033661006852, "percentage": 92.91, "elapsed_time": "4:19:23", "remaining_time": "0:19:47", "throughput": 2312.14, "total_tokens": 35986024} {"current_steps": 62385, "total_steps": 67140, "loss": 0.7145, "lr": 7.603820325219058e-07, "epoch": 9.29177837354781, "percentage": 92.92, "elapsed_time": "4:19:25", "remaining_time": "0:19:46", "throughput": 2312.15, "total_tokens": 35988808} {"current_steps": 62390, "total_steps": 67140, "loss": 0.4448, "lr": 7.58792221100657e-07, "epoch": 9.292523086088769, "percentage": 92.93, "elapsed_time": "4:19:26", "remaining_time": "0:19:45", "throughput": 2312.17, "total_tokens": 35991720} {"current_steps": 62395, "total_steps": 67140, "loss": 0.6077, "lr": 7.572040478016712e-07, "epoch": 9.29326779862973, "percentage": 92.93, "elapsed_time": "4:19:27", "remaining_time": "0:19:43", "throughput": 2312.17, "total_tokens": 35994440} {"current_steps": 62400, "total_steps": 67140, "loss": 0.5792, "lr": 7.556175127322707e-07, "epoch": 9.294012511170688, "percentage": 92.94, "elapsed_time": "4:19:28", "remaining_time": "0:19:42", "throughput": 2312.18, "total_tokens": 35997096} {"current_steps": 62405, "total_steps": 67140, "loss": 0.5178, "lr": 7.540326159996697e-07, "epoch": 9.294757223711647, "percentage": 92.95, "elapsed_time": "4:19:29", "remaining_time": "0:19:41", "throughput": 2312.21, "total_tokens": 36000168} {"current_steps": 62410, "total_steps": 67140, "loss": 0.5274, "lr": 7.524493577109659e-07, "epoch": 9.295501936252606, "percentage": 92.96, "elapsed_time": "4:19:30", "remaining_time": "0:19:40", "throughput": 2312.22, "total_tokens": 36003080} {"current_steps": 62415, "total_steps": 67140, "loss": 0.4357, "lr": 7.508677379731515e-07, "epoch": 9.296246648793566, "percentage": 92.96, "elapsed_time": "4:19:31", "remaining_time": "0:19:38", "throughput": 2312.24, "total_tokens": 36005896} {"current_steps": 62420, "total_steps": 67140, "loss": 0.6418, "lr": 7.49287756893105e-07, "epoch": 9.296991361334525, "percentage": 92.97, "elapsed_time": "4:19:33", "remaining_time": "0:19:37", "throughput": 2312.25, "total_tokens": 36008744} {"current_steps": 62425, "total_steps": 67140, "loss": 0.5708, "lr": 7.477094145775993e-07, "epoch": 9.297736073875484, "percentage": 92.98, "elapsed_time": "4:19:34", "remaining_time": "0:19:36", "throughput": 2312.28, "total_tokens": 36011912} {"current_steps": 62430, "total_steps": 67140, "loss": 0.6933, "lr": 7.46132711133285e-07, "epoch": 9.298480786416443, "percentage": 92.98, "elapsed_time": "4:19:35", "remaining_time": "0:19:35", "throughput": 2312.3, "total_tokens": 36014920} {"current_steps": 62435, "total_steps": 67140, "loss": 0.6135, "lr": 7.445576466667131e-07, "epoch": 9.299225498957403, "percentage": 92.99, "elapsed_time": "4:19:36", "remaining_time": "0:19:33", "throughput": 2312.32, "total_tokens": 36017992} {"current_steps": 62440, "total_steps": 67140, "loss": 0.5608, "lr": 7.429842212843208e-07, "epoch": 9.299970211498362, "percentage": 93.0, "elapsed_time": "4:19:37", "remaining_time": "0:19:32", "throughput": 2312.33, "total_tokens": 36020744} {"current_steps": 62445, "total_steps": 67140, "loss": 0.4737, "lr": 7.41412435092434e-07, "epoch": 9.30071492403932, "percentage": 93.01, "elapsed_time": "4:19:38", "remaining_time": "0:19:31", "throughput": 2312.34, "total_tokens": 36023304} {"current_steps": 62450, "total_steps": 67140, "loss": 0.5704, "lr": 7.39842288197265e-07, "epoch": 9.30145963658028, "percentage": 93.01, "elapsed_time": "4:19:39", "remaining_time": "0:19:30", "throughput": 2312.35, "total_tokens": 36026056} {"current_steps": 62455, "total_steps": 67140, "loss": 0.5323, "lr": 7.382737807049233e-07, "epoch": 9.30220434912124, "percentage": 93.02, "elapsed_time": "4:19:40", "remaining_time": "0:19:28", "throughput": 2312.35, "total_tokens": 36028680} {"current_steps": 62460, "total_steps": 67140, "loss": 0.7652, "lr": 7.367069127213938e-07, "epoch": 9.302949061662199, "percentage": 93.03, "elapsed_time": "4:19:42", "remaining_time": "0:19:27", "throughput": 2312.37, "total_tokens": 36031560} {"current_steps": 62465, "total_steps": 67140, "loss": 0.7079, "lr": 7.351416843525638e-07, "epoch": 9.303693774203158, "percentage": 93.04, "elapsed_time": "4:19:43", "remaining_time": "0:19:26", "throughput": 2312.38, "total_tokens": 36034440} {"current_steps": 62470, "total_steps": 67140, "loss": 0.6945, "lr": 7.335780957042071e-07, "epoch": 9.304438486744116, "percentage": 93.04, "elapsed_time": "4:19:44", "remaining_time": "0:19:25", "throughput": 2312.4, "total_tokens": 36037288} {"current_steps": 62475, "total_steps": 67140, "loss": 0.6867, "lr": 7.320161468819808e-07, "epoch": 9.305183199285075, "percentage": 93.05, "elapsed_time": "4:19:45", "remaining_time": "0:19:23", "throughput": 2312.42, "total_tokens": 36040264} {"current_steps": 62480, "total_steps": 67140, "loss": 0.7724, "lr": 7.304558379914395e-07, "epoch": 9.305927911826036, "percentage": 93.06, "elapsed_time": "4:19:46", "remaining_time": "0:19:22", "throughput": 2312.43, "total_tokens": 36043016} {"current_steps": 62485, "total_steps": 67140, "loss": 0.4535, "lr": 7.288971691380209e-07, "epoch": 9.306672624366994, "percentage": 93.07, "elapsed_time": "4:19:47", "remaining_time": "0:19:21", "throughput": 2312.44, "total_tokens": 36045800} {"current_steps": 62490, "total_steps": 67140, "loss": 0.5408, "lr": 7.273401404270519e-07, "epoch": 9.307417336907953, "percentage": 93.07, "elapsed_time": "4:19:48", "remaining_time": "0:19:20", "throughput": 2312.46, "total_tokens": 36048776} {"current_steps": 62495, "total_steps": 67140, "loss": 0.4508, "lr": 7.257847519637484e-07, "epoch": 9.308162049448912, "percentage": 93.08, "elapsed_time": "4:19:50", "remaining_time": "0:19:18", "throughput": 2312.49, "total_tokens": 36051816} {"current_steps": 62500, "total_steps": 67140, "loss": 0.5765, "lr": 7.24231003853218e-07, "epoch": 9.308906761989872, "percentage": 93.09, "elapsed_time": "4:19:51", "remaining_time": "0:19:17", "throughput": 2312.49, "total_tokens": 36054472} {"current_steps": 62505, "total_steps": 67140, "loss": 0.6653, "lr": 7.2267889620046e-07, "epoch": 9.309651474530831, "percentage": 93.1, "elapsed_time": "4:19:52", "remaining_time": "0:19:16", "throughput": 2312.5, "total_tokens": 36057256} {"current_steps": 62510, "total_steps": 67140, "loss": 0.4502, "lr": 7.21128429110357e-07, "epoch": 9.31039618707179, "percentage": 93.1, "elapsed_time": "4:19:53", "remaining_time": "0:19:14", "throughput": 2312.53, "total_tokens": 36060264} {"current_steps": 62515, "total_steps": 67140, "loss": 0.4056, "lr": 7.195796026876866e-07, "epoch": 9.311140899612749, "percentage": 93.11, "elapsed_time": "4:19:54", "remaining_time": "0:19:13", "throughput": 2312.54, "total_tokens": 36063016} {"current_steps": 62520, "total_steps": 67140, "loss": 0.5183, "lr": 7.180324170371095e-07, "epoch": 9.31188561215371, "percentage": 93.12, "elapsed_time": "4:19:55", "remaining_time": "0:19:12", "throughput": 2312.55, "total_tokens": 36065832} {"current_steps": 62525, "total_steps": 67140, "loss": 0.4562, "lr": 7.164868722631807e-07, "epoch": 9.312630324694668, "percentage": 93.13, "elapsed_time": "4:19:56", "remaining_time": "0:19:11", "throughput": 2312.57, "total_tokens": 36068744} {"current_steps": 62530, "total_steps": 67140, "loss": 0.5801, "lr": 7.149429684703335e-07, "epoch": 9.313375037235627, "percentage": 93.13, "elapsed_time": "4:19:57", "remaining_time": "0:19:09", "throughput": 2312.59, "total_tokens": 36071656} {"current_steps": 62535, "total_steps": 67140, "loss": 0.6306, "lr": 7.134007057629066e-07, "epoch": 9.314119749776586, "percentage": 93.14, "elapsed_time": "4:19:59", "remaining_time": "0:19:08", "throughput": 2312.6, "total_tokens": 36074440} {"current_steps": 62540, "total_steps": 67140, "loss": 0.63, "lr": 7.118600842451195e-07, "epoch": 9.314864462317546, "percentage": 93.15, "elapsed_time": "4:20:00", "remaining_time": "0:19:07", "throughput": 2312.63, "total_tokens": 36077672} {"current_steps": 62545, "total_steps": 67140, "loss": 0.7677, "lr": 7.103211040210778e-07, "epoch": 9.315609174858505, "percentage": 93.16, "elapsed_time": "4:20:01", "remaining_time": "0:19:06", "throughput": 2312.64, "total_tokens": 36080360} {"current_steps": 62550, "total_steps": 67140, "loss": 0.4269, "lr": 7.087837651947815e-07, "epoch": 9.316353887399464, "percentage": 93.16, "elapsed_time": "4:20:02", "remaining_time": "0:19:04", "throughput": 2312.66, "total_tokens": 36083336} {"current_steps": 62555, "total_steps": 67140, "loss": 0.4686, "lr": 7.072480678701198e-07, "epoch": 9.317098599940422, "percentage": 93.17, "elapsed_time": "4:20:03", "remaining_time": "0:19:03", "throughput": 2312.68, "total_tokens": 36086312} {"current_steps": 62560, "total_steps": 67140, "loss": 0.5503, "lr": 7.057140121508627e-07, "epoch": 9.317843312481383, "percentage": 93.18, "elapsed_time": "4:20:04", "remaining_time": "0:19:02", "throughput": 2312.69, "total_tokens": 36089064} {"current_steps": 62565, "total_steps": 67140, "loss": 0.7989, "lr": 7.041815981406852e-07, "epoch": 9.318588025022342, "percentage": 93.19, "elapsed_time": "4:20:05", "remaining_time": "0:19:01", "throughput": 2312.7, "total_tokens": 36091784} {"current_steps": 62570, "total_steps": 67140, "loss": 0.6101, "lr": 7.026508259431297e-07, "epoch": 9.3193327375633, "percentage": 93.19, "elapsed_time": "4:20:07", "remaining_time": "0:18:59", "throughput": 2312.71, "total_tokens": 36094536} {"current_steps": 62575, "total_steps": 67140, "loss": 0.4412, "lr": 7.011216956616467e-07, "epoch": 9.32007745010426, "percentage": 93.2, "elapsed_time": "4:20:08", "remaining_time": "0:18:58", "throughput": 2312.73, "total_tokens": 36097512} {"current_steps": 62580, "total_steps": 67140, "loss": 0.574, "lr": 6.995942073995676e-07, "epoch": 9.32082216264522, "percentage": 93.21, "elapsed_time": "4:20:09", "remaining_time": "0:18:57", "throughput": 2312.74, "total_tokens": 36100200} {"current_steps": 62585, "total_steps": 67140, "loss": 0.6606, "lr": 6.980683612601152e-07, "epoch": 9.321566875186178, "percentage": 93.22, "elapsed_time": "4:20:10", "remaining_time": "0:18:56", "throughput": 2312.75, "total_tokens": 36103016} {"current_steps": 62590, "total_steps": 67140, "loss": 0.8758, "lr": 6.965441573463988e-07, "epoch": 9.322311587727137, "percentage": 93.22, "elapsed_time": "4:20:11", "remaining_time": "0:18:54", "throughput": 2312.76, "total_tokens": 36105736} {"current_steps": 62595, "total_steps": 67140, "loss": 0.5546, "lr": 6.950215957614164e-07, "epoch": 9.323056300268096, "percentage": 93.23, "elapsed_time": "4:20:12", "remaining_time": "0:18:53", "throughput": 2312.77, "total_tokens": 36108552} {"current_steps": 62600, "total_steps": 67140, "loss": 0.718, "lr": 6.935006766080582e-07, "epoch": 9.323801012809056, "percentage": 93.24, "elapsed_time": "4:20:13", "remaining_time": "0:18:52", "throughput": 2312.79, "total_tokens": 36111432} {"current_steps": 62605, "total_steps": 67140, "loss": 0.5733, "lr": 6.919813999891028e-07, "epoch": 9.324545725350015, "percentage": 93.25, "elapsed_time": "4:20:14", "remaining_time": "0:18:51", "throughput": 2312.8, "total_tokens": 36114088} {"current_steps": 62610, "total_steps": 67140, "loss": 0.3682, "lr": 6.904637660072128e-07, "epoch": 9.325290437890974, "percentage": 93.25, "elapsed_time": "4:20:16", "remaining_time": "0:18:49", "throughput": 2312.82, "total_tokens": 36117064} {"current_steps": 62615, "total_steps": 67140, "loss": 0.4568, "lr": 6.889477747649447e-07, "epoch": 9.326035150431933, "percentage": 93.26, "elapsed_time": "4:20:17", "remaining_time": "0:18:48", "throughput": 2312.85, "total_tokens": 36120232} {"current_steps": 62620, "total_steps": 67140, "loss": 0.7356, "lr": 6.874334263647503e-07, "epoch": 9.326779862972893, "percentage": 93.27, "elapsed_time": "4:20:18", "remaining_time": "0:18:47", "throughput": 2312.86, "total_tokens": 36122888} {"current_steps": 62625, "total_steps": 67140, "loss": 0.3514, "lr": 6.859207209089502e-07, "epoch": 9.327524575513852, "percentage": 93.28, "elapsed_time": "4:20:19", "remaining_time": "0:18:46", "throughput": 2312.88, "total_tokens": 36125864} {"current_steps": 62630, "total_steps": 67140, "loss": 0.7322, "lr": 6.844096584997767e-07, "epoch": 9.32826928805481, "percentage": 93.28, "elapsed_time": "4:20:20", "remaining_time": "0:18:44", "throughput": 2312.89, "total_tokens": 36128584} {"current_steps": 62635, "total_steps": 67140, "loss": 0.7375, "lr": 6.829002392393396e-07, "epoch": 9.32901400059577, "percentage": 93.29, "elapsed_time": "4:20:21", "remaining_time": "0:18:43", "throughput": 2312.9, "total_tokens": 36131336} {"current_steps": 62640, "total_steps": 67140, "loss": 0.4542, "lr": 6.813924632296353e-07, "epoch": 9.32975871313673, "percentage": 93.3, "elapsed_time": "4:20:22", "remaining_time": "0:18:42", "throughput": 2312.91, "total_tokens": 36134216} {"current_steps": 62645, "total_steps": 67140, "loss": 0.8253, "lr": 6.798863305725628e-07, "epoch": 9.330503425677689, "percentage": 93.31, "elapsed_time": "4:20:23", "remaining_time": "0:18:41", "throughput": 2312.92, "total_tokens": 36136872} {"current_steps": 62650, "total_steps": 67140, "loss": 0.7182, "lr": 6.783818413698878e-07, "epoch": 9.331248138218648, "percentage": 93.31, "elapsed_time": "4:20:25", "remaining_time": "0:18:39", "throughput": 2312.96, "total_tokens": 36140264} {"current_steps": 62655, "total_steps": 67140, "loss": 0.5033, "lr": 6.768789957232874e-07, "epoch": 9.331992850759606, "percentage": 93.32, "elapsed_time": "4:20:26", "remaining_time": "0:18:38", "throughput": 2312.97, "total_tokens": 36143048} {"current_steps": 62660, "total_steps": 67140, "loss": 0.5418, "lr": 6.753777937343109e-07, "epoch": 9.332737563300565, "percentage": 93.33, "elapsed_time": "4:20:27", "remaining_time": "0:18:37", "throughput": 2312.98, "total_tokens": 36145768} {"current_steps": 62665, "total_steps": 67140, "loss": 0.7531, "lr": 6.738782355044049e-07, "epoch": 9.333482275841526, "percentage": 93.33, "elapsed_time": "4:20:28", "remaining_time": "0:18:36", "throughput": 2313.0, "total_tokens": 36148712} {"current_steps": 62670, "total_steps": 67140, "loss": 0.4752, "lr": 6.72380321134905e-07, "epoch": 9.334226988382484, "percentage": 93.34, "elapsed_time": "4:20:29", "remaining_time": "0:18:34", "throughput": 2313.02, "total_tokens": 36151496} {"current_steps": 62675, "total_steps": 67140, "loss": 0.5982, "lr": 6.708840507270359e-07, "epoch": 9.334971700923443, "percentage": 93.35, "elapsed_time": "4:20:30", "remaining_time": "0:18:33", "throughput": 2313.03, "total_tokens": 36154280} {"current_steps": 62680, "total_steps": 67140, "loss": 0.6149, "lr": 6.693894243819082e-07, "epoch": 9.335716413464402, "percentage": 93.36, "elapsed_time": "4:20:31", "remaining_time": "0:18:32", "throughput": 2313.05, "total_tokens": 36157256} {"current_steps": 62685, "total_steps": 67140, "loss": 0.545, "lr": 6.678964422005218e-07, "epoch": 9.336461126005362, "percentage": 93.36, "elapsed_time": "4:20:32", "remaining_time": "0:18:31", "throughput": 2313.07, "total_tokens": 36160264} {"current_steps": 62690, "total_steps": 67140, "loss": 0.4481, "lr": 6.66405104283771e-07, "epoch": 9.337205838546321, "percentage": 93.37, "elapsed_time": "4:20:34", "remaining_time": "0:18:29", "throughput": 2313.08, "total_tokens": 36163016} {"current_steps": 62695, "total_steps": 67140, "loss": 0.4476, "lr": 6.649154107324251e-07, "epoch": 9.33795055108728, "percentage": 93.38, "elapsed_time": "4:20:35", "remaining_time": "0:18:28", "throughput": 2313.1, "total_tokens": 36165896} {"current_steps": 62700, "total_steps": 67140, "loss": 0.5208, "lr": 6.634273616471565e-07, "epoch": 9.338695263628239, "percentage": 93.39, "elapsed_time": "4:20:36", "remaining_time": "0:18:27", "throughput": 2313.12, "total_tokens": 36168904} {"current_steps": 62705, "total_steps": 67140, "loss": 0.6315, "lr": 6.619409571285206e-07, "epoch": 9.3394399761692, "percentage": 93.39, "elapsed_time": "4:20:37", "remaining_time": "0:18:26", "throughput": 2313.14, "total_tokens": 36171880} {"current_steps": 62710, "total_steps": 67140, "loss": 0.5294, "lr": 6.604561972769652e-07, "epoch": 9.340184688710158, "percentage": 93.4, "elapsed_time": "4:20:38", "remaining_time": "0:18:24", "throughput": 2313.15, "total_tokens": 36174632} {"current_steps": 62715, "total_steps": 67140, "loss": 0.4264, "lr": 6.589730821928208e-07, "epoch": 9.340929401251117, "percentage": 93.41, "elapsed_time": "4:20:39", "remaining_time": "0:18:23", "throughput": 2313.18, "total_tokens": 36177800} {"current_steps": 62720, "total_steps": 67140, "loss": 0.6613, "lr": 6.574916119763158e-07, "epoch": 9.341674113792076, "percentage": 93.42, "elapsed_time": "4:20:41", "remaining_time": "0:18:22", "throughput": 2313.21, "total_tokens": 36180936} {"current_steps": 62725, "total_steps": 67140, "loss": 0.5176, "lr": 6.560117867275561e-07, "epoch": 9.342418826333036, "percentage": 93.42, "elapsed_time": "4:20:42", "remaining_time": "0:18:20", "throughput": 2313.21, "total_tokens": 36183560} {"current_steps": 62730, "total_steps": 67140, "loss": 0.4743, "lr": 6.545336065465451e-07, "epoch": 9.343163538873995, "percentage": 93.43, "elapsed_time": "4:20:43", "remaining_time": "0:18:19", "throughput": 2313.23, "total_tokens": 36186440} {"current_steps": 62735, "total_steps": 67140, "loss": 0.5497, "lr": 6.530570715331696e-07, "epoch": 9.343908251414954, "percentage": 93.44, "elapsed_time": "4:20:44", "remaining_time": "0:18:18", "throughput": 2313.24, "total_tokens": 36189256} {"current_steps": 62740, "total_steps": 67140, "loss": 0.5926, "lr": 6.515821817872109e-07, "epoch": 9.344652963955912, "percentage": 93.45, "elapsed_time": "4:20:45", "remaining_time": "0:18:17", "throughput": 2313.27, "total_tokens": 36192264} {"current_steps": 62745, "total_steps": 67140, "loss": 0.5009, "lr": 6.501089374083336e-07, "epoch": 9.345397676496873, "percentage": 93.45, "elapsed_time": "4:20:46", "remaining_time": "0:18:15", "throughput": 2313.28, "total_tokens": 36195048} {"current_steps": 62750, "total_steps": 67140, "loss": 0.6998, "lr": 6.48637338496097e-07, "epoch": 9.346142389037832, "percentage": 93.46, "elapsed_time": "4:20:47", "remaining_time": "0:18:14", "throughput": 2313.29, "total_tokens": 36197896} {"current_steps": 62755, "total_steps": 67140, "loss": 0.6275, "lr": 6.471673851499438e-07, "epoch": 9.34688710157879, "percentage": 93.47, "elapsed_time": "4:20:48", "remaining_time": "0:18:13", "throughput": 2313.31, "total_tokens": 36200808} {"current_steps": 62760, "total_steps": 67140, "loss": 0.4348, "lr": 6.456990774692057e-07, "epoch": 9.34763181411975, "percentage": 93.48, "elapsed_time": "4:20:50", "remaining_time": "0:18:12", "throughput": 2313.33, "total_tokens": 36203880} {"current_steps": 62765, "total_steps": 67140, "loss": 0.4758, "lr": 6.442324155531088e-07, "epoch": 9.34837652666071, "percentage": 93.48, "elapsed_time": "4:20:51", "remaining_time": "0:18:10", "throughput": 2313.35, "total_tokens": 36206888} {"current_steps": 62770, "total_steps": 67140, "loss": 0.7488, "lr": 6.4276739950076e-07, "epoch": 9.349121239201668, "percentage": 93.49, "elapsed_time": "4:20:52", "remaining_time": "0:18:09", "throughput": 2313.37, "total_tokens": 36209800} {"current_steps": 62775, "total_steps": 67140, "loss": 0.5035, "lr": 6.413040294111605e-07, "epoch": 9.349865951742627, "percentage": 93.5, "elapsed_time": "4:20:53", "remaining_time": "0:18:08", "throughput": 2313.39, "total_tokens": 36212648} {"current_steps": 62780, "total_steps": 67140, "loss": 0.4474, "lr": 6.398423053832009e-07, "epoch": 9.350610664283586, "percentage": 93.51, "elapsed_time": "4:20:54", "remaining_time": "0:18:07", "throughput": 2313.41, "total_tokens": 36215528} {"current_steps": 62785, "total_steps": 67140, "loss": 0.4956, "lr": 6.383822275156576e-07, "epoch": 9.351355376824547, "percentage": 93.51, "elapsed_time": "4:20:55", "remaining_time": "0:18:05", "throughput": 2313.41, "total_tokens": 36218120} {"current_steps": 62790, "total_steps": 67140, "loss": 0.4581, "lr": 6.369237959071933e-07, "epoch": 9.352100089365505, "percentage": 93.52, "elapsed_time": "4:20:56", "remaining_time": "0:18:04", "throughput": 2313.42, "total_tokens": 36220808} {"current_steps": 62795, "total_steps": 67140, "loss": 0.5594, "lr": 6.354670106563681e-07, "epoch": 9.352844801906464, "percentage": 93.53, "elapsed_time": "4:20:57", "remaining_time": "0:18:03", "throughput": 2313.45, "total_tokens": 36223944} {"current_steps": 62800, "total_steps": 67140, "loss": 0.621, "lr": 6.340118718616228e-07, "epoch": 9.353589514447423, "percentage": 93.54, "elapsed_time": "4:20:59", "remaining_time": "0:18:02", "throughput": 2313.46, "total_tokens": 36226696} {"current_steps": 62805, "total_steps": 67140, "loss": 0.4663, "lr": 6.325583796212925e-07, "epoch": 9.354334226988382, "percentage": 93.54, "elapsed_time": "4:21:00", "remaining_time": "0:18:00", "throughput": 2313.49, "total_tokens": 36229832} {"current_steps": 62810, "total_steps": 67140, "loss": 0.6855, "lr": 6.311065340335931e-07, "epoch": 9.355078939529342, "percentage": 93.55, "elapsed_time": "4:21:01", "remaining_time": "0:17:59", "throughput": 2313.51, "total_tokens": 36232776} {"current_steps": 62815, "total_steps": 67140, "loss": 0.7163, "lr": 6.296563351966378e-07, "epoch": 9.3558236520703, "percentage": 93.56, "elapsed_time": "4:21:02", "remaining_time": "0:17:58", "throughput": 2313.52, "total_tokens": 36235592} {"current_steps": 62820, "total_steps": 67140, "loss": 0.615, "lr": 6.282077832084259e-07, "epoch": 9.35656836461126, "percentage": 93.57, "elapsed_time": "4:21:03", "remaining_time": "0:17:57", "throughput": 2313.53, "total_tokens": 36238280} {"current_steps": 62825, "total_steps": 67140, "loss": 0.6424, "lr": 6.267608781668433e-07, "epoch": 9.357313077152218, "percentage": 93.57, "elapsed_time": "4:21:04", "remaining_time": "0:17:55", "throughput": 2313.54, "total_tokens": 36241064} {"current_steps": 62830, "total_steps": 67140, "loss": 0.8155, "lr": 6.253156201696669e-07, "epoch": 9.358057789693179, "percentage": 93.58, "elapsed_time": "4:21:05", "remaining_time": "0:17:54", "throughput": 2313.55, "total_tokens": 36243880} {"current_steps": 62835, "total_steps": 67140, "loss": 0.7144, "lr": 6.238720093145578e-07, "epoch": 9.358802502234138, "percentage": 93.59, "elapsed_time": "4:21:06", "remaining_time": "0:17:53", "throughput": 2313.56, "total_tokens": 36246472} {"current_steps": 62840, "total_steps": 67140, "loss": 0.5381, "lr": 6.22430045699074e-07, "epoch": 9.359547214775096, "percentage": 93.6, "elapsed_time": "4:21:08", "remaining_time": "0:17:52", "throughput": 2313.57, "total_tokens": 36249224} {"current_steps": 62845, "total_steps": 67140, "loss": 0.6512, "lr": 6.20989729420654e-07, "epoch": 9.360291927316055, "percentage": 93.6, "elapsed_time": "4:21:09", "remaining_time": "0:17:50", "throughput": 2313.58, "total_tokens": 36251944} {"current_steps": 62850, "total_steps": 67140, "loss": 0.5032, "lr": 6.195510605766342e-07, "epoch": 9.361036639857016, "percentage": 93.61, "elapsed_time": "4:21:10", "remaining_time": "0:17:49", "throughput": 2313.59, "total_tokens": 36254824} {"current_steps": 62855, "total_steps": 67140, "loss": 0.5762, "lr": 6.181140392642309e-07, "epoch": 9.361781352397974, "percentage": 93.62, "elapsed_time": "4:21:11", "remaining_time": "0:17:48", "throughput": 2313.61, "total_tokens": 36257800} {"current_steps": 62860, "total_steps": 67140, "loss": 0.5667, "lr": 6.166786655805473e-07, "epoch": 9.362526064938933, "percentage": 93.63, "elapsed_time": "4:21:12", "remaining_time": "0:17:47", "throughput": 2313.63, "total_tokens": 36260840} {"current_steps": 62865, "total_steps": 67140, "loss": 0.6744, "lr": 6.152449396225834e-07, "epoch": 9.363270777479892, "percentage": 93.63, "elapsed_time": "4:21:13", "remaining_time": "0:17:45", "throughput": 2313.65, "total_tokens": 36263752} {"current_steps": 62870, "total_steps": 67140, "loss": 0.4388, "lr": 6.138128614872258e-07, "epoch": 9.364015490020853, "percentage": 93.64, "elapsed_time": "4:21:14", "remaining_time": "0:17:44", "throughput": 2313.66, "total_tokens": 36266440} {"current_steps": 62875, "total_steps": 67140, "loss": 0.5702, "lr": 6.123824312712494e-07, "epoch": 9.364760202561811, "percentage": 93.65, "elapsed_time": "4:21:16", "remaining_time": "0:17:43", "throughput": 2313.66, "total_tokens": 36268968} {"current_steps": 62880, "total_steps": 67140, "loss": 0.6159, "lr": 6.109536490713136e-07, "epoch": 9.36550491510277, "percentage": 93.66, "elapsed_time": "4:21:17", "remaining_time": "0:17:42", "throughput": 2313.66, "total_tokens": 36271560} {"current_steps": 62885, "total_steps": 67140, "loss": 0.48, "lr": 6.095265149839769e-07, "epoch": 9.366249627643729, "percentage": 93.66, "elapsed_time": "4:21:18", "remaining_time": "0:17:40", "throughput": 2313.69, "total_tokens": 36274696} {"current_steps": 62890, "total_steps": 67140, "loss": 0.5899, "lr": 6.081010291056705e-07, "epoch": 9.36699434018469, "percentage": 93.67, "elapsed_time": "4:21:19", "remaining_time": "0:17:39", "throughput": 2313.69, "total_tokens": 36277288} {"current_steps": 62895, "total_steps": 67140, "loss": 0.6013, "lr": 6.066771915327257e-07, "epoch": 9.367739052725648, "percentage": 93.68, "elapsed_time": "4:21:20", "remaining_time": "0:17:38", "throughput": 2313.72, "total_tokens": 36280328} {"current_steps": 62900, "total_steps": 67140, "loss": 0.7128, "lr": 6.052550023613601e-07, "epoch": 9.368483765266607, "percentage": 93.68, "elapsed_time": "4:21:21", "remaining_time": "0:17:37", "throughput": 2313.73, "total_tokens": 36283112} {"current_steps": 62905, "total_steps": 67140, "loss": 0.5538, "lr": 6.038344616876801e-07, "epoch": 9.369228477807566, "percentage": 93.69, "elapsed_time": "4:21:22", "remaining_time": "0:17:35", "throughput": 2313.74, "total_tokens": 36285928} {"current_steps": 62910, "total_steps": 67140, "loss": 0.5892, "lr": 6.024155696076784e-07, "epoch": 9.369973190348526, "percentage": 93.7, "elapsed_time": "4:21:23", "remaining_time": "0:17:34", "throughput": 2313.75, "total_tokens": 36288712} {"current_steps": 62915, "total_steps": 67140, "loss": 0.589, "lr": 6.009983262172392e-07, "epoch": 9.370717902889485, "percentage": 93.71, "elapsed_time": "4:21:25", "remaining_time": "0:17:33", "throughput": 2313.76, "total_tokens": 36291368} {"current_steps": 62920, "total_steps": 67140, "loss": 0.5978, "lr": 5.995827316121388e-07, "epoch": 9.371462615430444, "percentage": 93.71, "elapsed_time": "4:21:26", "remaining_time": "0:17:32", "throughput": 2313.78, "total_tokens": 36294280} {"current_steps": 62925, "total_steps": 67140, "loss": 0.5008, "lr": 5.981687858880258e-07, "epoch": 9.372207327971402, "percentage": 93.72, "elapsed_time": "4:21:27", "remaining_time": "0:17:30", "throughput": 2313.79, "total_tokens": 36297000} {"current_steps": 62930, "total_steps": 67140, "loss": 0.5176, "lr": 5.967564891404626e-07, "epoch": 9.372952040512363, "percentage": 93.73, "elapsed_time": "4:21:28", "remaining_time": "0:17:29", "throughput": 2313.8, "total_tokens": 36299784} {"current_steps": 62935, "total_steps": 67140, "loss": 0.6454, "lr": 5.953458414648755e-07, "epoch": 9.373696753053322, "percentage": 93.74, "elapsed_time": "4:21:29", "remaining_time": "0:17:28", "throughput": 2313.81, "total_tokens": 36302312} {"current_steps": 62940, "total_steps": 67140, "loss": 0.4293, "lr": 5.939368429565911e-07, "epoch": 9.37444146559428, "percentage": 93.74, "elapsed_time": "4:21:30", "remaining_time": "0:17:27", "throughput": 2313.83, "total_tokens": 36305448} {"current_steps": 62945, "total_steps": 67140, "loss": 0.4265, "lr": 5.925294937108306e-07, "epoch": 9.37518617813524, "percentage": 93.75, "elapsed_time": "4:21:31", "remaining_time": "0:17:25", "throughput": 2313.85, "total_tokens": 36308424} {"current_steps": 62950, "total_steps": 67140, "loss": 0.5565, "lr": 5.911237938226954e-07, "epoch": 9.3759308906762, "percentage": 93.76, "elapsed_time": "4:21:32", "remaining_time": "0:17:24", "throughput": 2313.87, "total_tokens": 36311336} {"current_steps": 62955, "total_steps": 67140, "loss": 0.558, "lr": 5.897197433871709e-07, "epoch": 9.376675603217159, "percentage": 93.77, "elapsed_time": "4:21:33", "remaining_time": "0:17:23", "throughput": 2313.87, "total_tokens": 36313800} {"current_steps": 62960, "total_steps": 67140, "loss": 0.3307, "lr": 5.883173424991423e-07, "epoch": 9.377420315758117, "percentage": 93.77, "elapsed_time": "4:21:35", "remaining_time": "0:17:22", "throughput": 2313.88, "total_tokens": 36316712} {"current_steps": 62965, "total_steps": 67140, "loss": 0.5891, "lr": 5.86916591253378e-07, "epoch": 9.378165028299076, "percentage": 93.78, "elapsed_time": "4:21:36", "remaining_time": "0:17:20", "throughput": 2313.91, "total_tokens": 36319976} {"current_steps": 62970, "total_steps": 67140, "loss": 0.4658, "lr": 5.855174897445359e-07, "epoch": 9.378909740840037, "percentage": 93.79, "elapsed_time": "4:21:37", "remaining_time": "0:17:19", "throughput": 2313.94, "total_tokens": 36323016} {"current_steps": 62975, "total_steps": 67140, "loss": 0.4124, "lr": 5.841200380671569e-07, "epoch": 9.379654453380995, "percentage": 93.8, "elapsed_time": "4:21:38", "remaining_time": "0:17:18", "throughput": 2313.96, "total_tokens": 36326024} {"current_steps": 62980, "total_steps": 67140, "loss": 0.4163, "lr": 5.827242363156793e-07, "epoch": 9.380399165921954, "percentage": 93.8, "elapsed_time": "4:21:39", "remaining_time": "0:17:17", "throughput": 2313.99, "total_tokens": 36329224} {"current_steps": 62985, "total_steps": 67140, "loss": 0.6154, "lr": 5.813300845844249e-07, "epoch": 9.381143878462913, "percentage": 93.81, "elapsed_time": "4:21:41", "remaining_time": "0:17:15", "throughput": 2314.01, "total_tokens": 36332360} {"current_steps": 62990, "total_steps": 67140, "loss": 0.4802, "lr": 5.799375829676018e-07, "epoch": 9.381888591003872, "percentage": 93.82, "elapsed_time": "4:21:42", "remaining_time": "0:17:14", "throughput": 2314.02, "total_tokens": 36335016} {"current_steps": 62995, "total_steps": 67140, "loss": 0.5386, "lr": 5.785467315593124e-07, "epoch": 9.382633303544832, "percentage": 93.83, "elapsed_time": "4:21:43", "remaining_time": "0:17:13", "throughput": 2314.03, "total_tokens": 36337768} {"current_steps": 63000, "total_steps": 67140, "loss": 0.6712, "lr": 5.771575304535453e-07, "epoch": 9.383378016085791, "percentage": 93.83, "elapsed_time": "4:21:44", "remaining_time": "0:17:12", "throughput": 2314.05, "total_tokens": 36340680} {"current_steps": 63005, "total_steps": 67140, "loss": 0.4669, "lr": 5.757699797441757e-07, "epoch": 9.38412272862675, "percentage": 93.84, "elapsed_time": "4:21:45", "remaining_time": "0:17:10", "throughput": 2314.06, "total_tokens": 36343400} {"current_steps": 63010, "total_steps": 67140, "loss": 0.5288, "lr": 5.743840795249727e-07, "epoch": 9.384867441167708, "percentage": 93.85, "elapsed_time": "4:21:46", "remaining_time": "0:17:09", "throughput": 2314.08, "total_tokens": 36346408} {"current_steps": 63015, "total_steps": 67140, "loss": 0.5919, "lr": 5.729998298895839e-07, "epoch": 9.385612153708669, "percentage": 93.86, "elapsed_time": "4:21:47", "remaining_time": "0:17:08", "throughput": 2314.09, "total_tokens": 36349064} {"current_steps": 63020, "total_steps": 67140, "loss": 0.4986, "lr": 5.716172309315537e-07, "epoch": 9.386356866249628, "percentage": 93.86, "elapsed_time": "4:21:48", "remaining_time": "0:17:06", "throughput": 2314.1, "total_tokens": 36351784} {"current_steps": 63025, "total_steps": 67140, "loss": 0.4763, "lr": 5.702362827443131e-07, "epoch": 9.387101578790586, "percentage": 93.87, "elapsed_time": "4:21:49", "remaining_time": "0:17:05", "throughput": 2314.12, "total_tokens": 36354760} {"current_steps": 63030, "total_steps": 67140, "loss": 0.5866, "lr": 5.68856985421179e-07, "epoch": 9.387846291331545, "percentage": 93.88, "elapsed_time": "4:21:51", "remaining_time": "0:17:04", "throughput": 2314.14, "total_tokens": 36357832} {"current_steps": 63035, "total_steps": 67140, "loss": 0.5274, "lr": 5.674793390553601e-07, "epoch": 9.388591003872506, "percentage": 93.89, "elapsed_time": "4:21:52", "remaining_time": "0:17:03", "throughput": 2314.16, "total_tokens": 36360712} {"current_steps": 63040, "total_steps": 67140, "loss": 0.4542, "lr": 5.661033437399516e-07, "epoch": 9.389335716413465, "percentage": 93.89, "elapsed_time": "4:21:53", "remaining_time": "0:17:01", "throughput": 2314.17, "total_tokens": 36363432} {"current_steps": 63045, "total_steps": 67140, "loss": 0.6746, "lr": 5.647289995679372e-07, "epoch": 9.390080428954423, "percentage": 93.9, "elapsed_time": "4:21:54", "remaining_time": "0:17:00", "throughput": 2314.18, "total_tokens": 36366280} {"current_steps": 63050, "total_steps": 67140, "loss": 0.4183, "lr": 5.633563066321956e-07, "epoch": 9.390825141495382, "percentage": 93.91, "elapsed_time": "4:21:55", "remaining_time": "0:16:59", "throughput": 2314.19, "total_tokens": 36368968} {"current_steps": 63055, "total_steps": 67140, "loss": 0.633, "lr": 5.619852650254803e-07, "epoch": 9.391569854036343, "percentage": 93.92, "elapsed_time": "4:21:56", "remaining_time": "0:16:58", "throughput": 2314.21, "total_tokens": 36371912} {"current_steps": 63060, "total_steps": 67140, "loss": 0.5438, "lr": 5.606158748404423e-07, "epoch": 9.392314566577301, "percentage": 93.92, "elapsed_time": "4:21:57", "remaining_time": "0:16:56", "throughput": 2314.23, "total_tokens": 36374696} {"current_steps": 63065, "total_steps": 67140, "loss": 0.6185, "lr": 5.592481361696183e-07, "epoch": 9.39305927911826, "percentage": 93.93, "elapsed_time": "4:21:58", "remaining_time": "0:16:55", "throughput": 2314.24, "total_tokens": 36377480} {"current_steps": 63070, "total_steps": 67140, "loss": 0.4206, "lr": 5.578820491054376e-07, "epoch": 9.393803991659219, "percentage": 93.94, "elapsed_time": "4:22:00", "remaining_time": "0:16:54", "throughput": 2314.25, "total_tokens": 36380296} {"current_steps": 63075, "total_steps": 67140, "loss": 0.5525, "lr": 5.565176137402123e-07, "epoch": 9.39454870420018, "percentage": 93.95, "elapsed_time": "4:22:01", "remaining_time": "0:16:53", "throughput": 2314.26, "total_tokens": 36383048} {"current_steps": 63080, "total_steps": 67140, "loss": 0.5541, "lr": 5.551548301661492e-07, "epoch": 9.395293416741138, "percentage": 93.95, "elapsed_time": "4:22:02", "remaining_time": "0:16:51", "throughput": 2314.28, "total_tokens": 36385896} {"current_steps": 63085, "total_steps": 67140, "loss": 0.3473, "lr": 5.537936984753384e-07, "epoch": 9.396038129282097, "percentage": 93.96, "elapsed_time": "4:22:03", "remaining_time": "0:16:50", "throughput": 2314.31, "total_tokens": 36389032} {"current_steps": 63090, "total_steps": 67140, "loss": 0.4505, "lr": 5.524342187597564e-07, "epoch": 9.396782841823056, "percentage": 93.97, "elapsed_time": "4:22:04", "remaining_time": "0:16:49", "throughput": 2314.33, "total_tokens": 36392008} {"current_steps": 63095, "total_steps": 67140, "loss": 0.7627, "lr": 5.510763911112743e-07, "epoch": 9.397527554364016, "percentage": 93.98, "elapsed_time": "4:22:05", "remaining_time": "0:16:48", "throughput": 2314.34, "total_tokens": 36394824} {"current_steps": 63100, "total_steps": 67140, "loss": 0.5665, "lr": 5.497202156216463e-07, "epoch": 9.398272266904975, "percentage": 93.98, "elapsed_time": "4:22:06", "remaining_time": "0:16:46", "throughput": 2314.35, "total_tokens": 36397512} {"current_steps": 63105, "total_steps": 67140, "loss": 0.6885, "lr": 5.483656923825159e-07, "epoch": 9.399016979445934, "percentage": 93.99, "elapsed_time": "4:22:08", "remaining_time": "0:16:45", "throughput": 2314.36, "total_tokens": 36400424} {"current_steps": 63110, "total_steps": 67140, "loss": 0.6425, "lr": 5.470128214854236e-07, "epoch": 9.399761691986892, "percentage": 94.0, "elapsed_time": "4:22:09", "remaining_time": "0:16:44", "throughput": 2314.38, "total_tokens": 36403240} {"current_steps": 63115, "total_steps": 67140, "loss": 0.5119, "lr": 5.456616030217853e-07, "epoch": 9.400506404527853, "percentage": 94.01, "elapsed_time": "4:22:10", "remaining_time": "0:16:43", "throughput": 2314.39, "total_tokens": 36406024} {"current_steps": 63120, "total_steps": 67140, "loss": 0.6284, "lr": 5.443120370829114e-07, "epoch": 9.401251117068812, "percentage": 94.01, "elapsed_time": "4:22:11", "remaining_time": "0:16:41", "throughput": 2314.41, "total_tokens": 36409000} {"current_steps": 63125, "total_steps": 67140, "loss": 0.7907, "lr": 5.429641237599981e-07, "epoch": 9.40199582960977, "percentage": 94.02, "elapsed_time": "4:22:12", "remaining_time": "0:16:40", "throughput": 2314.43, "total_tokens": 36411976} {"current_steps": 63130, "total_steps": 67140, "loss": 0.5701, "lr": 5.416178631441393e-07, "epoch": 9.40274054215073, "percentage": 94.03, "elapsed_time": "4:22:13", "remaining_time": "0:16:39", "throughput": 2314.44, "total_tokens": 36414760} {"current_steps": 63135, "total_steps": 67140, "loss": 0.6145, "lr": 5.402732553263012e-07, "epoch": 9.40348525469169, "percentage": 94.03, "elapsed_time": "4:22:14", "remaining_time": "0:16:38", "throughput": 2314.45, "total_tokens": 36417544} {"current_steps": 63140, "total_steps": 67140, "loss": 0.6092, "lr": 5.389303003973501e-07, "epoch": 9.404229967232649, "percentage": 94.04, "elapsed_time": "4:22:16", "remaining_time": "0:16:36", "throughput": 2314.47, "total_tokens": 36420520} {"current_steps": 63145, "total_steps": 67140, "loss": 0.7305, "lr": 5.375889984480381e-07, "epoch": 9.404974679773607, "percentage": 94.05, "elapsed_time": "4:22:17", "remaining_time": "0:16:35", "throughput": 2314.48, "total_tokens": 36423240} {"current_steps": 63150, "total_steps": 67140, "loss": 0.4665, "lr": 5.362493495690069e-07, "epoch": 9.405719392314566, "percentage": 94.06, "elapsed_time": "4:22:18", "remaining_time": "0:16:34", "throughput": 2314.51, "total_tokens": 36426376} {"current_steps": 63155, "total_steps": 67140, "loss": 0.7191, "lr": 5.349113538507783e-07, "epoch": 9.406464104855527, "percentage": 94.06, "elapsed_time": "4:22:19", "remaining_time": "0:16:33", "throughput": 2314.52, "total_tokens": 36429320} {"current_steps": 63160, "total_steps": 67140, "loss": 0.5427, "lr": 5.335750113837745e-07, "epoch": 9.407208817396485, "percentage": 94.07, "elapsed_time": "4:22:20", "remaining_time": "0:16:31", "throughput": 2314.55, "total_tokens": 36432360} {"current_steps": 63165, "total_steps": 67140, "loss": 0.4657, "lr": 5.322403222582984e-07, "epoch": 9.407953529937444, "percentage": 94.08, "elapsed_time": "4:22:21", "remaining_time": "0:16:30", "throughput": 2314.57, "total_tokens": 36435496} {"current_steps": 63170, "total_steps": 67140, "loss": 0.4385, "lr": 5.309072865645442e-07, "epoch": 9.408698242478403, "percentage": 94.09, "elapsed_time": "4:22:22", "remaining_time": "0:16:29", "throughput": 2314.58, "total_tokens": 36438248} {"current_steps": 63175, "total_steps": 67140, "loss": 0.7601, "lr": 5.295759043925902e-07, "epoch": 9.409442955019362, "percentage": 94.09, "elapsed_time": "4:22:24", "remaining_time": "0:16:28", "throughput": 2314.6, "total_tokens": 36441288} {"current_steps": 63180, "total_steps": 67140, "loss": 0.5208, "lr": 5.282461758324058e-07, "epoch": 9.410187667560322, "percentage": 94.1, "elapsed_time": "4:22:25", "remaining_time": "0:16:26", "throughput": 2314.62, "total_tokens": 36444200} {"current_steps": 63185, "total_steps": 67140, "loss": 0.4357, "lr": 5.269181009738527e-07, "epoch": 9.410932380101281, "percentage": 94.11, "elapsed_time": "4:22:26", "remaining_time": "0:16:25", "throughput": 2314.65, "total_tokens": 36447400} {"current_steps": 63190, "total_steps": 67140, "loss": 0.5133, "lr": 5.255916799066729e-07, "epoch": 9.41167709264224, "percentage": 94.12, "elapsed_time": "4:22:27", "remaining_time": "0:16:24", "throughput": 2314.68, "total_tokens": 36450600} {"current_steps": 63195, "total_steps": 67140, "loss": 0.4998, "lr": 5.242669127205002e-07, "epoch": 9.412421805183198, "percentage": 94.12, "elapsed_time": "4:22:28", "remaining_time": "0:16:23", "throughput": 2314.7, "total_tokens": 36453448} {"current_steps": 63200, "total_steps": 67140, "loss": 0.3407, "lr": 5.229437995048603e-07, "epoch": 9.413166517724159, "percentage": 94.13, "elapsed_time": "4:22:29", "remaining_time": "0:16:21", "throughput": 2314.71, "total_tokens": 36456168} {"current_steps": 63205, "total_steps": 67140, "loss": 0.4807, "lr": 5.216223403491593e-07, "epoch": 9.413911230265118, "percentage": 94.14, "elapsed_time": "4:22:30", "remaining_time": "0:16:20", "throughput": 2314.73, "total_tokens": 36459336} {"current_steps": 63210, "total_steps": 67140, "loss": 0.4594, "lr": 5.203025353427038e-07, "epoch": 9.414655942806077, "percentage": 94.15, "elapsed_time": "4:22:32", "remaining_time": "0:16:19", "throughput": 2314.74, "total_tokens": 36461992} {"current_steps": 63215, "total_steps": 67140, "loss": 0.6104, "lr": 5.189843845746723e-07, "epoch": 9.415400655347035, "percentage": 94.15, "elapsed_time": "4:22:33", "remaining_time": "0:16:18", "throughput": 2314.77, "total_tokens": 36465192} {"current_steps": 63220, "total_steps": 67140, "loss": 0.6529, "lr": 5.176678881341435e-07, "epoch": 9.416145367887996, "percentage": 94.16, "elapsed_time": "4:22:34", "remaining_time": "0:16:16", "throughput": 2314.78, "total_tokens": 36468008} {"current_steps": 63225, "total_steps": 67140, "loss": 0.7215, "lr": 5.163530461100824e-07, "epoch": 9.416890080428955, "percentage": 94.17, "elapsed_time": "4:22:35", "remaining_time": "0:16:15", "throughput": 2314.81, "total_tokens": 36471080} {"current_steps": 63230, "total_steps": 67140, "loss": 0.6933, "lr": 5.150398585913374e-07, "epoch": 9.417634792969913, "percentage": 94.18, "elapsed_time": "4:22:36", "remaining_time": "0:16:14", "throughput": 2314.82, "total_tokens": 36473864} {"current_steps": 63235, "total_steps": 67140, "loss": 0.6637, "lr": 5.137283256666486e-07, "epoch": 9.418379505510872, "percentage": 94.18, "elapsed_time": "4:22:37", "remaining_time": "0:16:13", "throughput": 2314.84, "total_tokens": 36476840} {"current_steps": 63240, "total_steps": 67140, "loss": 0.7066, "lr": 5.12418447424648e-07, "epoch": 9.419124218051833, "percentage": 94.19, "elapsed_time": "4:22:38", "remaining_time": "0:16:11", "throughput": 2314.85, "total_tokens": 36479560} {"current_steps": 63245, "total_steps": 67140, "loss": 0.5931, "lr": 5.111102239538479e-07, "epoch": 9.419868930592791, "percentage": 94.2, "elapsed_time": "4:22:40", "remaining_time": "0:16:10", "throughput": 2314.85, "total_tokens": 36482024} {"current_steps": 63250, "total_steps": 67140, "loss": 0.6865, "lr": 5.098036553426583e-07, "epoch": 9.42061364313375, "percentage": 94.21, "elapsed_time": "4:22:41", "remaining_time": "0:16:09", "throughput": 2314.88, "total_tokens": 36485256} {"current_steps": 63255, "total_steps": 67140, "loss": 0.5651, "lr": 5.084987416793669e-07, "epoch": 9.421358355674709, "percentage": 94.21, "elapsed_time": "4:22:42", "remaining_time": "0:16:08", "throughput": 2314.88, "total_tokens": 36487912} {"current_steps": 63260, "total_steps": 67140, "loss": 0.615, "lr": 5.07195483052153e-07, "epoch": 9.42210306821567, "percentage": 94.22, "elapsed_time": "4:22:43", "remaining_time": "0:16:06", "throughput": 2314.89, "total_tokens": 36490600} {"current_steps": 63265, "total_steps": 67140, "loss": 0.5089, "lr": 5.058938795490881e-07, "epoch": 9.422847780756628, "percentage": 94.23, "elapsed_time": "4:22:44", "remaining_time": "0:16:05", "throughput": 2314.9, "total_tokens": 36493352} {"current_steps": 63270, "total_steps": 67140, "loss": 0.7278, "lr": 5.045939312581294e-07, "epoch": 9.423592493297587, "percentage": 94.24, "elapsed_time": "4:22:45", "remaining_time": "0:16:04", "throughput": 2314.92, "total_tokens": 36496296} {"current_steps": 63275, "total_steps": 67140, "loss": 0.5498, "lr": 5.032956382671206e-07, "epoch": 9.424337205838546, "percentage": 94.24, "elapsed_time": "4:22:46", "remaining_time": "0:16:03", "throughput": 2314.93, "total_tokens": 36499080} {"current_steps": 63280, "total_steps": 67140, "loss": 0.5355, "lr": 5.019990006637998e-07, "epoch": 9.425081918379506, "percentage": 94.25, "elapsed_time": "4:22:47", "remaining_time": "0:16:01", "throughput": 2314.94, "total_tokens": 36501736} {"current_steps": 63285, "total_steps": 67140, "loss": 0.749, "lr": 5.007040185357803e-07, "epoch": 9.425826630920465, "percentage": 94.26, "elapsed_time": "4:22:49", "remaining_time": "0:16:00", "throughput": 2314.96, "total_tokens": 36504680} {"current_steps": 63290, "total_steps": 67140, "loss": 0.5918, "lr": 4.99410691970581e-07, "epoch": 9.426571343461424, "percentage": 94.27, "elapsed_time": "4:22:50", "remaining_time": "0:15:59", "throughput": 2314.97, "total_tokens": 36507560} {"current_steps": 63295, "total_steps": 67140, "loss": 0.5123, "lr": 4.98119021055593e-07, "epoch": 9.427316056002383, "percentage": 94.27, "elapsed_time": "4:22:51", "remaining_time": "0:15:58", "throughput": 2314.99, "total_tokens": 36510440} {"current_steps": 63300, "total_steps": 67140, "loss": 0.3942, "lr": 4.968290058781022e-07, "epoch": 9.428060768543343, "percentage": 94.28, "elapsed_time": "4:22:52", "remaining_time": "0:15:56", "throughput": 2315.01, "total_tokens": 36513512} {"current_steps": 63305, "total_steps": 67140, "loss": 0.6626, "lr": 4.95540646525286e-07, "epoch": 9.428805481084302, "percentage": 94.29, "elapsed_time": "4:22:53", "remaining_time": "0:15:55", "throughput": 2315.03, "total_tokens": 36516328} {"current_steps": 63310, "total_steps": 67140, "loss": 0.7828, "lr": 4.942539430842052e-07, "epoch": 9.42955019362526, "percentage": 94.3, "elapsed_time": "4:22:54", "remaining_time": "0:15:54", "throughput": 2315.04, "total_tokens": 36519144} {"current_steps": 63315, "total_steps": 67140, "loss": 0.6342, "lr": 4.929688956418099e-07, "epoch": 9.43029490616622, "percentage": 94.3, "elapsed_time": "4:22:55", "remaining_time": "0:15:53", "throughput": 2315.05, "total_tokens": 36521992} {"current_steps": 63320, "total_steps": 67140, "loss": 0.5782, "lr": 4.916855042849388e-07, "epoch": 9.43103961870718, "percentage": 94.31, "elapsed_time": "4:22:57", "remaining_time": "0:15:51", "throughput": 2315.08, "total_tokens": 36525160} {"current_steps": 63325, "total_steps": 67140, "loss": 0.5517, "lr": 4.904037691003172e-07, "epoch": 9.431784331248139, "percentage": 94.32, "elapsed_time": "4:22:58", "remaining_time": "0:15:50", "throughput": 2315.1, "total_tokens": 36527944} {"current_steps": 63330, "total_steps": 67140, "loss": 0.7504, "lr": 4.891236901745616e-07, "epoch": 9.432529043789097, "percentage": 94.33, "elapsed_time": "4:22:59", "remaining_time": "0:15:49", "throughput": 2315.12, "total_tokens": 36531016} {"current_steps": 63335, "total_steps": 67140, "loss": 0.4139, "lr": 4.878452675941697e-07, "epoch": 9.433273756330056, "percentage": 94.33, "elapsed_time": "4:23:00", "remaining_time": "0:15:48", "throughput": 2315.14, "total_tokens": 36533992} {"current_steps": 63340, "total_steps": 67140, "loss": 0.709, "lr": 4.865685014455363e-07, "epoch": 9.434018468871017, "percentage": 94.34, "elapsed_time": "4:23:01", "remaining_time": "0:15:46", "throughput": 2315.15, "total_tokens": 36536616} {"current_steps": 63345, "total_steps": 67140, "loss": 0.7022, "lr": 4.852933918149394e-07, "epoch": 9.434763181411975, "percentage": 94.35, "elapsed_time": "4:23:02", "remaining_time": "0:15:45", "throughput": 2315.17, "total_tokens": 36539528} {"current_steps": 63350, "total_steps": 67140, "loss": 0.7075, "lr": 4.840199387885491e-07, "epoch": 9.435507893952934, "percentage": 94.36, "elapsed_time": "4:23:03", "remaining_time": "0:15:44", "throughput": 2315.18, "total_tokens": 36542344} {"current_steps": 63355, "total_steps": 67140, "loss": 0.8209, "lr": 4.827481424524133e-07, "epoch": 9.436252606493893, "percentage": 94.36, "elapsed_time": "4:23:04", "remaining_time": "0:15:43", "throughput": 2315.2, "total_tokens": 36545224} {"current_steps": 63360, "total_steps": 67140, "loss": 0.5537, "lr": 4.81478002892477e-07, "epoch": 9.436997319034852, "percentage": 94.37, "elapsed_time": "4:23:06", "remaining_time": "0:15:41", "throughput": 2315.22, "total_tokens": 36548264} {"current_steps": 63365, "total_steps": 67140, "loss": 0.3642, "lr": 4.802095201945745e-07, "epoch": 9.437742031575812, "percentage": 94.38, "elapsed_time": "4:23:07", "remaining_time": "0:15:40", "throughput": 2315.23, "total_tokens": 36550984} {"current_steps": 63370, "total_steps": 67140, "loss": 0.656, "lr": 4.789426944444231e-07, "epoch": 9.438486744116771, "percentage": 94.38, "elapsed_time": "4:23:08", "remaining_time": "0:15:39", "throughput": 2315.25, "total_tokens": 36554056} {"current_steps": 63375, "total_steps": 67140, "loss": 0.6046, "lr": 4.776775257276267e-07, "epoch": 9.43923145665773, "percentage": 94.39, "elapsed_time": "4:23:09", "remaining_time": "0:15:38", "throughput": 2315.27, "total_tokens": 36557032} {"current_steps": 63380, "total_steps": 67140, "loss": 0.6646, "lr": 4.7641401412968357e-07, "epoch": 9.439976169198689, "percentage": 94.4, "elapsed_time": "4:23:10", "remaining_time": "0:15:36", "throughput": 2315.29, "total_tokens": 36559912} {"current_steps": 63385, "total_steps": 67140, "loss": 0.6272, "lr": 4.7515215973597815e-07, "epoch": 9.440720881739649, "percentage": 94.41, "elapsed_time": "4:23:11", "remaining_time": "0:15:35", "throughput": 2315.31, "total_tokens": 36562952} {"current_steps": 63390, "total_steps": 67140, "loss": 0.6023, "lr": 4.738919626317756e-07, "epoch": 9.441465594280608, "percentage": 94.41, "elapsed_time": "4:23:12", "remaining_time": "0:15:34", "throughput": 2315.33, "total_tokens": 36565864} {"current_steps": 63395, "total_steps": 67140, "loss": 0.6153, "lr": 4.726334229022383e-07, "epoch": 9.442210306821567, "percentage": 94.42, "elapsed_time": "4:23:14", "remaining_time": "0:15:33", "throughput": 2315.35, "total_tokens": 36568840} {"current_steps": 63400, "total_steps": 67140, "loss": 0.5333, "lr": 4.71376540632415e-07, "epoch": 9.442955019362525, "percentage": 94.43, "elapsed_time": "4:23:15", "remaining_time": "0:15:31", "throughput": 2315.36, "total_tokens": 36571528} {"current_steps": 63405, "total_steps": 67140, "loss": 0.6789, "lr": 4.7012131590723765e-07, "epoch": 9.443699731903486, "percentage": 94.44, "elapsed_time": "4:23:16", "remaining_time": "0:15:30", "throughput": 2315.36, "total_tokens": 36574120} {"current_steps": 63410, "total_steps": 67140, "loss": 0.4733, "lr": 4.688677488115328e-07, "epoch": 9.444444444444445, "percentage": 94.44, "elapsed_time": "4:23:17", "remaining_time": "0:15:29", "throughput": 2315.39, "total_tokens": 36577288} {"current_steps": 63415, "total_steps": 67140, "loss": 0.5549, "lr": 4.676158394300051e-07, "epoch": 9.445189156985403, "percentage": 94.45, "elapsed_time": "4:23:18", "remaining_time": "0:15:28", "throughput": 2315.4, "total_tokens": 36580072} {"current_steps": 63420, "total_steps": 67140, "loss": 0.4999, "lr": 4.663655878472617e-07, "epoch": 9.445933869526362, "percentage": 94.46, "elapsed_time": "4:23:19", "remaining_time": "0:15:26", "throughput": 2315.43, "total_tokens": 36583144} {"current_steps": 63425, "total_steps": 67140, "loss": 0.5172, "lr": 4.651169941477851e-07, "epoch": 9.446678582067323, "percentage": 94.47, "elapsed_time": "4:23:20", "remaining_time": "0:15:25", "throughput": 2315.44, "total_tokens": 36585896} {"current_steps": 63430, "total_steps": 67140, "loss": 0.682, "lr": 4.6387005841594943e-07, "epoch": 9.447423294608281, "percentage": 94.47, "elapsed_time": "4:23:22", "remaining_time": "0:15:24", "throughput": 2315.46, "total_tokens": 36589032} {"current_steps": 63435, "total_steps": 67140, "loss": 0.4484, "lr": 4.626247807360151e-07, "epoch": 9.44816800714924, "percentage": 94.48, "elapsed_time": "4:23:23", "remaining_time": "0:15:23", "throughput": 2315.48, "total_tokens": 36592072} {"current_steps": 63440, "total_steps": 67140, "loss": 0.599, "lr": 4.613811611921398e-07, "epoch": 9.448912719690199, "percentage": 94.49, "elapsed_time": "4:23:24", "remaining_time": "0:15:21", "throughput": 2315.5, "total_tokens": 36595080} {"current_steps": 63445, "total_steps": 67140, "loss": 0.5096, "lr": 4.6013919986836187e-07, "epoch": 9.44965743223116, "percentage": 94.5, "elapsed_time": "4:23:25", "remaining_time": "0:15:20", "throughput": 2315.53, "total_tokens": 36598152} {"current_steps": 63450, "total_steps": 67140, "loss": 0.677, "lr": 4.588988968486002e-07, "epoch": 9.450402144772118, "percentage": 94.5, "elapsed_time": "4:23:26", "remaining_time": "0:15:19", "throughput": 2315.55, "total_tokens": 36601096} {"current_steps": 63455, "total_steps": 67140, "loss": 0.8806, "lr": 4.5766025221667674e-07, "epoch": 9.451146857313077, "percentage": 94.51, "elapsed_time": "4:23:27", "remaining_time": "0:15:17", "throughput": 2315.57, "total_tokens": 36604008} {"current_steps": 63460, "total_steps": 67140, "loss": 0.5626, "lr": 4.5642326605629116e-07, "epoch": 9.451891569854036, "percentage": 94.52, "elapsed_time": "4:23:28", "remaining_time": "0:15:16", "throughput": 2315.59, "total_tokens": 36606888} {"current_steps": 63465, "total_steps": 67140, "loss": 0.5063, "lr": 4.5518793845103215e-07, "epoch": 9.452636282394996, "percentage": 94.53, "elapsed_time": "4:23:30", "remaining_time": "0:15:15", "throughput": 2315.61, "total_tokens": 36609928} {"current_steps": 63470, "total_steps": 67140, "loss": 0.6522, "lr": 4.539542694843829e-07, "epoch": 9.453380994935955, "percentage": 94.53, "elapsed_time": "4:23:31", "remaining_time": "0:15:14", "throughput": 2315.62, "total_tokens": 36612712} {"current_steps": 63475, "total_steps": 67140, "loss": 0.4455, "lr": 4.527222592397046e-07, "epoch": 9.454125707476914, "percentage": 94.54, "elapsed_time": "4:23:32", "remaining_time": "0:15:12", "throughput": 2315.63, "total_tokens": 36615400} {"current_steps": 63480, "total_steps": 67140, "loss": 0.5834, "lr": 4.514919078002583e-07, "epoch": 9.454870420017873, "percentage": 94.55, "elapsed_time": "4:23:33", "remaining_time": "0:15:11", "throughput": 2315.65, "total_tokens": 36618344} {"current_steps": 63485, "total_steps": 67140, "loss": 0.5943, "lr": 4.502632152491776e-07, "epoch": 9.455615132558833, "percentage": 94.56, "elapsed_time": "4:23:34", "remaining_time": "0:15:10", "throughput": 2315.67, "total_tokens": 36621352} {"current_steps": 63490, "total_steps": 67140, "loss": 0.5695, "lr": 4.490361816694988e-07, "epoch": 9.456359845099792, "percentage": 94.56, "elapsed_time": "4:23:35", "remaining_time": "0:15:09", "throughput": 2315.69, "total_tokens": 36624264} {"current_steps": 63495, "total_steps": 67140, "loss": 0.7017, "lr": 4.478108071441389e-07, "epoch": 9.45710455764075, "percentage": 94.57, "elapsed_time": "4:23:36", "remaining_time": "0:15:07", "throughput": 2315.7, "total_tokens": 36626952} {"current_steps": 63500, "total_steps": 67140, "loss": 0.6136, "lr": 4.4658709175590116e-07, "epoch": 9.45784927018171, "percentage": 94.58, "elapsed_time": "4:23:37", "remaining_time": "0:15:06", "throughput": 2315.71, "total_tokens": 36629672} {"current_steps": 63505, "total_steps": 67140, "loss": 0.4713, "lr": 4.4536503558748057e-07, "epoch": 9.458593982722668, "percentage": 94.59, "elapsed_time": "4:23:39", "remaining_time": "0:15:05", "throughput": 2315.72, "total_tokens": 36632488} {"current_steps": 63510, "total_steps": 67140, "loss": 0.631, "lr": 4.441446387214582e-07, "epoch": 9.459338695263629, "percentage": 94.59, "elapsed_time": "4:23:40", "remaining_time": "0:15:04", "throughput": 2315.72, "total_tokens": 36635112} {"current_steps": 63515, "total_steps": 67140, "loss": 0.6653, "lr": 4.4292590124030697e-07, "epoch": 9.460083407804587, "percentage": 94.6, "elapsed_time": "4:23:41", "remaining_time": "0:15:02", "throughput": 2315.73, "total_tokens": 36637800} {"current_steps": 63520, "total_steps": 67140, "loss": 0.3668, "lr": 4.4170882322638053e-07, "epoch": 9.460828120345546, "percentage": 94.61, "elapsed_time": "4:23:42", "remaining_time": "0:15:01", "throughput": 2315.75, "total_tokens": 36640616} {"current_steps": 63525, "total_steps": 67140, "loss": 0.5814, "lr": 4.4049340476192414e-07, "epoch": 9.461572832886505, "percentage": 94.62, "elapsed_time": "4:23:43", "remaining_time": "0:15:00", "throughput": 2315.78, "total_tokens": 36643816} {"current_steps": 63530, "total_steps": 67140, "loss": 0.549, "lr": 4.392796459290721e-07, "epoch": 9.462317545427466, "percentage": 94.62, "elapsed_time": "4:23:44", "remaining_time": "0:14:59", "throughput": 2315.79, "total_tokens": 36646536} {"current_steps": 63535, "total_steps": 67140, "loss": 0.5184, "lr": 4.380675468098477e-07, "epoch": 9.463062257968424, "percentage": 94.63, "elapsed_time": "4:23:45", "remaining_time": "0:14:57", "throughput": 2315.79, "total_tokens": 36649128} {"current_steps": 63540, "total_steps": 67140, "loss": 0.6107, "lr": 4.3685710748615493e-07, "epoch": 9.463806970509383, "percentage": 94.64, "elapsed_time": "4:23:46", "remaining_time": "0:14:56", "throughput": 2315.81, "total_tokens": 36651976} {"current_steps": 63545, "total_steps": 67140, "loss": 0.4255, "lr": 4.356483280397894e-07, "epoch": 9.464551683050342, "percentage": 94.65, "elapsed_time": "4:23:48", "remaining_time": "0:14:55", "throughput": 2315.83, "total_tokens": 36654920} {"current_steps": 63550, "total_steps": 67140, "loss": 0.5336, "lr": 4.344412085524441e-07, "epoch": 9.465296395591302, "percentage": 94.65, "elapsed_time": "4:23:49", "remaining_time": "0:14:54", "throughput": 2315.84, "total_tokens": 36657832} {"current_steps": 63555, "total_steps": 67140, "loss": 0.7083, "lr": 4.3323574910568157e-07, "epoch": 9.466041108132261, "percentage": 94.66, "elapsed_time": "4:23:50", "remaining_time": "0:14:52", "throughput": 2315.86, "total_tokens": 36660712} {"current_steps": 63560, "total_steps": 67140, "loss": 0.6641, "lr": 4.320319497809672e-07, "epoch": 9.46678582067322, "percentage": 94.67, "elapsed_time": "4:23:51", "remaining_time": "0:14:51", "throughput": 2315.87, "total_tokens": 36663432} {"current_steps": 63565, "total_steps": 67140, "loss": 0.644, "lr": 4.30829810659647e-07, "epoch": 9.467530533214179, "percentage": 94.68, "elapsed_time": "4:23:52", "remaining_time": "0:14:50", "throughput": 2315.89, "total_tokens": 36666344} {"current_steps": 63570, "total_steps": 67140, "loss": 0.4729, "lr": 4.2962933182295606e-07, "epoch": 9.46827524575514, "percentage": 94.68, "elapsed_time": "4:23:53", "remaining_time": "0:14:49", "throughput": 2315.9, "total_tokens": 36669128} {"current_steps": 63575, "total_steps": 67140, "loss": 0.7709, "lr": 4.2843051335202386e-07, "epoch": 9.469019958296098, "percentage": 94.69, "elapsed_time": "4:23:54", "remaining_time": "0:14:47", "throughput": 2315.92, "total_tokens": 36672104} {"current_steps": 63580, "total_steps": 67140, "loss": 0.9489, "lr": 4.2723335532785235e-07, "epoch": 9.469764670837057, "percentage": 94.7, "elapsed_time": "4:23:55", "remaining_time": "0:14:46", "throughput": 2315.93, "total_tokens": 36674984} {"current_steps": 63585, "total_steps": 67140, "loss": 0.5754, "lr": 4.26037857831349e-07, "epoch": 9.470509383378015, "percentage": 94.71, "elapsed_time": "4:23:57", "remaining_time": "0:14:45", "throughput": 2315.97, "total_tokens": 36678408} {"current_steps": 63590, "total_steps": 67140, "loss": 0.5633, "lr": 4.2484402094329354e-07, "epoch": 9.471254095918976, "percentage": 94.71, "elapsed_time": "4:23:58", "remaining_time": "0:14:44", "throughput": 2315.99, "total_tokens": 36681352} {"current_steps": 63595, "total_steps": 67140, "loss": 0.7291, "lr": 4.2365184474436327e-07, "epoch": 9.471998808459935, "percentage": 94.72, "elapsed_time": "4:23:59", "remaining_time": "0:14:42", "throughput": 2316.02, "total_tokens": 36684552} {"current_steps": 63600, "total_steps": 67140, "loss": 0.3877, "lr": 4.224613293151214e-07, "epoch": 9.472743521000893, "percentage": 94.73, "elapsed_time": "4:24:00", "remaining_time": "0:14:41", "throughput": 2316.03, "total_tokens": 36687304} {"current_steps": 63605, "total_steps": 67140, "loss": 0.3459, "lr": 4.212724747360175e-07, "epoch": 9.473488233541852, "percentage": 94.73, "elapsed_time": "4:24:01", "remaining_time": "0:14:40", "throughput": 2316.05, "total_tokens": 36690344} {"current_steps": 63610, "total_steps": 67140, "loss": 0.6168, "lr": 4.2008528108739287e-07, "epoch": 9.474232946082813, "percentage": 94.74, "elapsed_time": "4:24:02", "remaining_time": "0:14:39", "throughput": 2316.05, "total_tokens": 36692936} {"current_steps": 63615, "total_steps": 67140, "loss": 0.3564, "lr": 4.1889974844946947e-07, "epoch": 9.474977658623772, "percentage": 94.75, "elapsed_time": "4:24:04", "remaining_time": "0:14:37", "throughput": 2316.07, "total_tokens": 36695816} {"current_steps": 63620, "total_steps": 67140, "loss": 0.6684, "lr": 4.177158769023609e-07, "epoch": 9.47572237116473, "percentage": 94.76, "elapsed_time": "4:24:05", "remaining_time": "0:14:36", "throughput": 2316.1, "total_tokens": 36699208} {"current_steps": 63625, "total_steps": 67140, "loss": 0.5882, "lr": 4.1653366652607e-07, "epoch": 9.476467083705689, "percentage": 94.76, "elapsed_time": "4:24:06", "remaining_time": "0:14:35", "throughput": 2316.11, "total_tokens": 36701896} {"current_steps": 63630, "total_steps": 67140, "loss": 0.5627, "lr": 4.153531174004827e-07, "epoch": 9.47721179624665, "percentage": 94.77, "elapsed_time": "4:24:07", "remaining_time": "0:14:34", "throughput": 2316.12, "total_tokens": 36704680} {"current_steps": 63635, "total_steps": 67140, "loss": 0.6184, "lr": 4.141742296053769e-07, "epoch": 9.477956508787608, "percentage": 94.78, "elapsed_time": "4:24:08", "remaining_time": "0:14:32", "throughput": 2316.14, "total_tokens": 36707528} {"current_steps": 63640, "total_steps": 67140, "loss": 0.5959, "lr": 4.1299700322041945e-07, "epoch": 9.478701221328567, "percentage": 94.79, "elapsed_time": "4:24:09", "remaining_time": "0:14:31", "throughput": 2316.16, "total_tokens": 36710600} {"current_steps": 63645, "total_steps": 67140, "loss": 0.5222, "lr": 4.118214383251634e-07, "epoch": 9.479445933869526, "percentage": 94.79, "elapsed_time": "4:24:10", "remaining_time": "0:14:30", "throughput": 2316.18, "total_tokens": 36713544} {"current_steps": 63650, "total_steps": 67140, "loss": 0.5256, "lr": 4.106475349990452e-07, "epoch": 9.480190646410486, "percentage": 94.8, "elapsed_time": "4:24:12", "remaining_time": "0:14:29", "throughput": 2316.21, "total_tokens": 36716616} {"current_steps": 63655, "total_steps": 67140, "loss": 0.6102, "lr": 4.09475293321393e-07, "epoch": 9.480935358951445, "percentage": 94.81, "elapsed_time": "4:24:13", "remaining_time": "0:14:27", "throughput": 2316.22, "total_tokens": 36719528} {"current_steps": 63660, "total_steps": 67140, "loss": 0.809, "lr": 4.0830471337142407e-07, "epoch": 9.481680071492404, "percentage": 94.82, "elapsed_time": "4:24:14", "remaining_time": "0:14:26", "throughput": 2316.24, "total_tokens": 36722440} {"current_steps": 63665, "total_steps": 67140, "loss": 0.5804, "lr": 4.071357952282362e-07, "epoch": 9.482424784033363, "percentage": 94.82, "elapsed_time": "4:24:15", "remaining_time": "0:14:25", "throughput": 2316.26, "total_tokens": 36725352} {"current_steps": 63670, "total_steps": 67140, "loss": 0.6604, "lr": 4.059685389708273e-07, "epoch": 9.483169496574323, "percentage": 94.83, "elapsed_time": "4:24:16", "remaining_time": "0:14:24", "throughput": 2316.27, "total_tokens": 36728168} {"current_steps": 63675, "total_steps": 67140, "loss": 0.6468, "lr": 4.048029446780704e-07, "epoch": 9.483914209115282, "percentage": 94.84, "elapsed_time": "4:24:17", "remaining_time": "0:14:22", "throughput": 2316.28, "total_tokens": 36730856} {"current_steps": 63680, "total_steps": 67140, "loss": 0.6771, "lr": 4.0363901242873594e-07, "epoch": 9.48465892165624, "percentage": 94.85, "elapsed_time": "4:24:18", "remaining_time": "0:14:21", "throughput": 2316.29, "total_tokens": 36733608} {"current_steps": 63685, "total_steps": 67140, "loss": 0.5796, "lr": 4.0247674230147467e-07, "epoch": 9.4854036341972, "percentage": 94.85, "elapsed_time": "4:24:19", "remaining_time": "0:14:20", "throughput": 2316.3, "total_tokens": 36736360} {"current_steps": 63690, "total_steps": 67140, "loss": 0.6611, "lr": 4.0131613437482674e-07, "epoch": 9.486148346738158, "percentage": 94.86, "elapsed_time": "4:24:21", "remaining_time": "0:14:19", "throughput": 2316.31, "total_tokens": 36739048} {"current_steps": 63695, "total_steps": 67140, "loss": 0.5064, "lr": 4.001571887272293e-07, "epoch": 9.486893059279119, "percentage": 94.87, "elapsed_time": "4:24:22", "remaining_time": "0:14:17", "throughput": 2316.32, "total_tokens": 36741864} {"current_steps": 63700, "total_steps": 67140, "loss": 0.4864, "lr": 3.989999054369864e-07, "epoch": 9.487637771820078, "percentage": 94.88, "elapsed_time": "4:24:23", "remaining_time": "0:14:16", "throughput": 2316.34, "total_tokens": 36744776} {"current_steps": 63705, "total_steps": 67140, "loss": 0.5953, "lr": 3.978442845823133e-07, "epoch": 9.488382484361036, "percentage": 94.88, "elapsed_time": "4:24:24", "remaining_time": "0:14:15", "throughput": 2316.35, "total_tokens": 36747624} {"current_steps": 63710, "total_steps": 67140, "loss": 0.5414, "lr": 3.966903262412974e-07, "epoch": 9.489127196901995, "percentage": 94.89, "elapsed_time": "4:24:25", "remaining_time": "0:14:14", "throughput": 2316.36, "total_tokens": 36750216} {"current_steps": 63715, "total_steps": 67140, "loss": 0.5941, "lr": 3.9553803049192096e-07, "epoch": 9.489871909442956, "percentage": 94.9, "elapsed_time": "4:24:26", "remaining_time": "0:14:12", "throughput": 2316.36, "total_tokens": 36752872} {"current_steps": 63720, "total_steps": 67140, "loss": 0.4957, "lr": 3.9438739741204935e-07, "epoch": 9.490616621983914, "percentage": 94.91, "elapsed_time": "4:24:27", "remaining_time": "0:14:11", "throughput": 2316.39, "total_tokens": 36755912} {"current_steps": 63725, "total_steps": 67140, "loss": 0.5062, "lr": 3.9323842707943703e-07, "epoch": 9.491361334524873, "percentage": 94.91, "elapsed_time": "4:24:28", "remaining_time": "0:14:10", "throughput": 2316.4, "total_tokens": 36758696} {"current_steps": 63730, "total_steps": 67140, "loss": 0.5313, "lr": 3.920911195717275e-07, "epoch": 9.492106047065832, "percentage": 94.92, "elapsed_time": "4:24:30", "remaining_time": "0:14:09", "throughput": 2316.41, "total_tokens": 36761416} {"current_steps": 63735, "total_steps": 67140, "loss": 0.7744, "lr": 3.909454749664532e-07, "epoch": 9.492850759606792, "percentage": 94.93, "elapsed_time": "4:24:31", "remaining_time": "0:14:07", "throughput": 2316.41, "total_tokens": 36764040} {"current_steps": 63740, "total_steps": 67140, "loss": 0.9648, "lr": 3.898014933410299e-07, "epoch": 9.493595472147751, "percentage": 94.94, "elapsed_time": "4:24:32", "remaining_time": "0:14:06", "throughput": 2316.42, "total_tokens": 36766760} {"current_steps": 63745, "total_steps": 67140, "loss": 0.6072, "lr": 3.8865917477276527e-07, "epoch": 9.49434018468871, "percentage": 94.94, "elapsed_time": "4:24:33", "remaining_time": "0:14:05", "throughput": 2316.43, "total_tokens": 36769352} {"current_steps": 63750, "total_steps": 67140, "loss": 0.6354, "lr": 3.875185193388503e-07, "epoch": 9.495084897229669, "percentage": 94.95, "elapsed_time": "4:24:34", "remaining_time": "0:14:04", "throughput": 2316.44, "total_tokens": 36772200} {"current_steps": 63755, "total_steps": 67140, "loss": 0.5453, "lr": 3.8637952711636504e-07, "epoch": 9.49582960977063, "percentage": 94.96, "elapsed_time": "4:24:35", "remaining_time": "0:14:02", "throughput": 2316.44, "total_tokens": 36774760} {"current_steps": 63760, "total_steps": 67140, "loss": 0.5702, "lr": 3.8524219818228123e-07, "epoch": 9.496574322311588, "percentage": 94.97, "elapsed_time": "4:24:36", "remaining_time": "0:14:01", "throughput": 2316.46, "total_tokens": 36777672} {"current_steps": 63765, "total_steps": 67140, "loss": 0.708, "lr": 3.8410653261345407e-07, "epoch": 9.497319034852547, "percentage": 94.97, "elapsed_time": "4:24:37", "remaining_time": "0:14:00", "throughput": 2316.48, "total_tokens": 36780712} {"current_steps": 63770, "total_steps": 67140, "loss": 0.4853, "lr": 3.8297253048662494e-07, "epoch": 9.498063747393505, "percentage": 94.98, "elapsed_time": "4:24:38", "remaining_time": "0:13:59", "throughput": 2316.5, "total_tokens": 36783464} {"current_steps": 63775, "total_steps": 67140, "loss": 0.8836, "lr": 3.818401918784298e-07, "epoch": 9.498808459934466, "percentage": 94.99, "elapsed_time": "4:24:40", "remaining_time": "0:13:57", "throughput": 2316.5, "total_tokens": 36785992} {"current_steps": 63780, "total_steps": 67140, "loss": 0.4761, "lr": 3.807095168653796e-07, "epoch": 9.499553172475425, "percentage": 95.0, "elapsed_time": "4:24:41", "remaining_time": "0:13:56", "throughput": 2316.52, "total_tokens": 36789032} {"current_steps": 63783, "total_steps": 67140, "eval_loss": 0.6832270622253418, "epoch": 9.5, "percentage": 95.0, "elapsed_time": "4:25:55", "remaining_time": "0:13:59", "throughput": 2305.79, "total_tokens": 36790952} {"current_steps": 63785, "total_steps": 67140, "loss": 0.7175, "lr": 3.7958050552389104e-07, "epoch": 9.500297885016384, "percentage": 95.0, "elapsed_time": "4:25:58", "remaining_time": "0:13:59", "throughput": 2305.43, "total_tokens": 36792136} {"current_steps": 63790, "total_steps": 67140, "loss": 0.4485, "lr": 3.784531579302475e-07, "epoch": 9.501042597557342, "percentage": 95.01, "elapsed_time": "4:26:00", "remaining_time": "0:13:58", "throughput": 2305.44, "total_tokens": 36795016} {"current_steps": 63795, "total_steps": 67140, "loss": 0.7141, "lr": 3.7732747416063805e-07, "epoch": 9.501787310098303, "percentage": 95.02, "elapsed_time": "4:26:01", "remaining_time": "0:13:56", "throughput": 2305.46, "total_tokens": 36797832} {"current_steps": 63800, "total_steps": 67140, "loss": 0.6933, "lr": 3.762034542911269e-07, "epoch": 9.502532022639262, "percentage": 95.03, "elapsed_time": "4:26:02", "remaining_time": "0:13:55", "throughput": 2305.47, "total_tokens": 36800616} {"current_steps": 63805, "total_steps": 67140, "loss": 0.6043, "lr": 3.7508109839767546e-07, "epoch": 9.50327673518022, "percentage": 95.03, "elapsed_time": "4:26:03", "remaining_time": "0:13:54", "throughput": 2305.48, "total_tokens": 36803464} {"current_steps": 63810, "total_steps": 67140, "loss": 0.5571, "lr": 3.7396040655612587e-07, "epoch": 9.504021447721179, "percentage": 95.04, "elapsed_time": "4:26:04", "remaining_time": "0:13:53", "throughput": 2305.5, "total_tokens": 36806376} {"current_steps": 63815, "total_steps": 67140, "loss": 0.3487, "lr": 3.728413788422119e-07, "epoch": 9.50476616026214, "percentage": 95.05, "elapsed_time": "4:26:05", "remaining_time": "0:13:51", "throughput": 2305.52, "total_tokens": 36809352} {"current_steps": 63820, "total_steps": 67140, "loss": 0.5427, "lr": 3.7172401533154823e-07, "epoch": 9.505510872803098, "percentage": 95.06, "elapsed_time": "4:26:06", "remaining_time": "0:13:50", "throughput": 2305.53, "total_tokens": 36812072} {"current_steps": 63825, "total_steps": 67140, "loss": 0.43, "lr": 3.706083160996437e-07, "epoch": 9.506255585344057, "percentage": 95.06, "elapsed_time": "4:26:08", "remaining_time": "0:13:49", "throughput": 2305.56, "total_tokens": 36815176} {"current_steps": 63830, "total_steps": 67140, "loss": 0.5525, "lr": 3.6949428122189375e-07, "epoch": 9.507000297885016, "percentage": 95.07, "elapsed_time": "4:26:09", "remaining_time": "0:13:48", "throughput": 2305.57, "total_tokens": 36818056} {"current_steps": 63835, "total_steps": 67140, "loss": 0.7606, "lr": 3.6838191077357975e-07, "epoch": 9.507745010425975, "percentage": 95.08, "elapsed_time": "4:26:10", "remaining_time": "0:13:46", "throughput": 2305.59, "total_tokens": 36821032} {"current_steps": 63840, "total_steps": 67140, "loss": 0.6374, "lr": 3.672712048298721e-07, "epoch": 9.508489722966935, "percentage": 95.08, "elapsed_time": "4:26:11", "remaining_time": "0:13:45", "throughput": 2305.61, "total_tokens": 36824008} {"current_steps": 63845, "total_steps": 67140, "loss": 0.6843, "lr": 3.661621634658274e-07, "epoch": 9.509234435507894, "percentage": 95.09, "elapsed_time": "4:26:12", "remaining_time": "0:13:44", "throughput": 2305.63, "total_tokens": 36826888} {"current_steps": 63850, "total_steps": 67140, "loss": 0.5857, "lr": 3.650547867563886e-07, "epoch": 9.509979148048853, "percentage": 95.1, "elapsed_time": "4:26:13", "remaining_time": "0:13:43", "throughput": 2305.66, "total_tokens": 36830056} {"current_steps": 63855, "total_steps": 67140, "loss": 0.5722, "lr": 3.6394907477639294e-07, "epoch": 9.510723860589813, "percentage": 95.11, "elapsed_time": "4:26:14", "remaining_time": "0:13:41", "throughput": 2305.68, "total_tokens": 36832968} {"current_steps": 63860, "total_steps": 67140, "loss": 0.6179, "lr": 3.628450276005502e-07, "epoch": 9.511468573130772, "percentage": 95.11, "elapsed_time": "4:26:16", "remaining_time": "0:13:40", "throughput": 2305.69, "total_tokens": 36835784} {"current_steps": 63865, "total_steps": 67140, "loss": 0.6995, "lr": 3.6174264530347557e-07, "epoch": 9.51221328567173, "percentage": 95.12, "elapsed_time": "4:26:17", "remaining_time": "0:13:39", "throughput": 2305.7, "total_tokens": 36838536} {"current_steps": 63870, "total_steps": 67140, "loss": 0.6808, "lr": 3.6064192795965956e-07, "epoch": 9.51295799821269, "percentage": 95.13, "elapsed_time": "4:26:18", "remaining_time": "0:13:38", "throughput": 2305.73, "total_tokens": 36841736} {"current_steps": 63875, "total_steps": 67140, "loss": 0.514, "lr": 3.595428756434871e-07, "epoch": 9.513702710753648, "percentage": 95.14, "elapsed_time": "4:26:19", "remaining_time": "0:13:36", "throughput": 2305.74, "total_tokens": 36844392} {"current_steps": 63880, "total_steps": 67140, "loss": 0.6306, "lr": 3.584454884292293e-07, "epoch": 9.514447423294609, "percentage": 95.14, "elapsed_time": "4:26:20", "remaining_time": "0:13:35", "throughput": 2305.76, "total_tokens": 36847272} {"current_steps": 63885, "total_steps": 67140, "loss": 0.7076, "lr": 3.5734976639103525e-07, "epoch": 9.515192135835568, "percentage": 95.15, "elapsed_time": "4:26:21", "remaining_time": "0:13:34", "throughput": 2305.77, "total_tokens": 36850056} {"current_steps": 63890, "total_steps": 67140, "loss": 0.5753, "lr": 3.5625570960295674e-07, "epoch": 9.515936848376526, "percentage": 95.16, "elapsed_time": "4:26:22", "remaining_time": "0:13:33", "throughput": 2305.79, "total_tokens": 36853128} {"current_steps": 63895, "total_steps": 67140, "loss": 0.4459, "lr": 3.5516331813892355e-07, "epoch": 9.516681560917485, "percentage": 95.17, "elapsed_time": "4:26:23", "remaining_time": "0:13:31", "throughput": 2305.81, "total_tokens": 36856104} {"current_steps": 63900, "total_steps": 67140, "loss": 0.4975, "lr": 3.5407259207275444e-07, "epoch": 9.517426273458446, "percentage": 95.17, "elapsed_time": "4:26:25", "remaining_time": "0:13:30", "throughput": 2305.84, "total_tokens": 36859112} {"current_steps": 63905, "total_steps": 67140, "loss": 0.5163, "lr": 3.529835314781543e-07, "epoch": 9.518170985999404, "percentage": 95.18, "elapsed_time": "4:26:26", "remaining_time": "0:13:29", "throughput": 2305.87, "total_tokens": 36862376} {"current_steps": 63910, "total_steps": 67140, "loss": 0.516, "lr": 3.5189613642872264e-07, "epoch": 9.518915698540363, "percentage": 95.19, "elapsed_time": "4:26:27", "remaining_time": "0:13:28", "throughput": 2305.89, "total_tokens": 36865512} {"current_steps": 63915, "total_steps": 67140, "loss": 0.4869, "lr": 3.508104069979368e-07, "epoch": 9.519660411081322, "percentage": 95.2, "elapsed_time": "4:26:28", "remaining_time": "0:13:26", "throughput": 2305.91, "total_tokens": 36868488} {"current_steps": 63920, "total_steps": 67140, "loss": 0.5994, "lr": 3.4972634325916854e-07, "epoch": 9.520405123622282, "percentage": 95.2, "elapsed_time": "4:26:29", "remaining_time": "0:13:25", "throughput": 2305.92, "total_tokens": 36871240} {"current_steps": 63925, "total_steps": 67140, "loss": 0.5477, "lr": 3.486439452856705e-07, "epoch": 9.521149836163241, "percentage": 95.21, "elapsed_time": "4:26:30", "remaining_time": "0:13:24", "throughput": 2305.94, "total_tokens": 36874120} {"current_steps": 63930, "total_steps": 67140, "loss": 0.4656, "lr": 3.4756321315058957e-07, "epoch": 9.5218945487042, "percentage": 95.22, "elapsed_time": "4:26:32", "remaining_time": "0:13:22", "throughput": 2305.96, "total_tokens": 36877128} {"current_steps": 63935, "total_steps": 67140, "loss": 0.7014, "lr": 3.4648414692696196e-07, "epoch": 9.522639261245159, "percentage": 95.23, "elapsed_time": "4:26:33", "remaining_time": "0:13:21", "throughput": 2305.98, "total_tokens": 36879976} {"current_steps": 63940, "total_steps": 67140, "loss": 0.632, "lr": 3.4540674668769866e-07, "epoch": 9.52338397378612, "percentage": 95.23, "elapsed_time": "4:26:34", "remaining_time": "0:13:20", "throughput": 2305.99, "total_tokens": 36882760} {"current_steps": 63945, "total_steps": 67140, "loss": 0.7991, "lr": 3.443310125056082e-07, "epoch": 9.524128686327078, "percentage": 95.24, "elapsed_time": "4:26:35", "remaining_time": "0:13:19", "throughput": 2306.01, "total_tokens": 36885672} {"current_steps": 63950, "total_steps": 67140, "loss": 0.7016, "lr": 3.4325694445338783e-07, "epoch": 9.524873398868037, "percentage": 95.25, "elapsed_time": "4:26:36", "remaining_time": "0:13:17", "throughput": 2306.02, "total_tokens": 36888456} {"current_steps": 63955, "total_steps": 67140, "loss": 0.5795, "lr": 3.42184542603613e-07, "epoch": 9.525618111408996, "percentage": 95.26, "elapsed_time": "4:26:37", "remaining_time": "0:13:16", "throughput": 2306.05, "total_tokens": 36891496} {"current_steps": 63960, "total_steps": 67140, "loss": 0.6575, "lr": 3.411138070287562e-07, "epoch": 9.526362823949956, "percentage": 95.26, "elapsed_time": "4:26:38", "remaining_time": "0:13:15", "throughput": 2306.06, "total_tokens": 36894376} {"current_steps": 63965, "total_steps": 67140, "loss": 0.5804, "lr": 3.400447378011734e-07, "epoch": 9.527107536490915, "percentage": 95.27, "elapsed_time": "4:26:39", "remaining_time": "0:13:14", "throughput": 2306.08, "total_tokens": 36897128} {"current_steps": 63970, "total_steps": 67140, "loss": 0.5185, "lr": 3.389773349931069e-07, "epoch": 9.527852249031874, "percentage": 95.28, "elapsed_time": "4:26:41", "remaining_time": "0:13:12", "throughput": 2306.1, "total_tokens": 36900040} {"current_steps": 63975, "total_steps": 67140, "loss": 0.5183, "lr": 3.3791159867668786e-07, "epoch": 9.528596961572832, "percentage": 95.29, "elapsed_time": "4:26:42", "remaining_time": "0:13:11", "throughput": 2306.11, "total_tokens": 36902984} {"current_steps": 63980, "total_steps": 67140, "loss": 0.594, "lr": 3.3684752892393643e-07, "epoch": 9.529341674113793, "percentage": 95.29, "elapsed_time": "4:26:43", "remaining_time": "0:13:10", "throughput": 2306.14, "total_tokens": 36906152} {"current_steps": 63985, "total_steps": 67140, "loss": 0.4083, "lr": 3.357851258067535e-07, "epoch": 9.530086386654752, "percentage": 95.3, "elapsed_time": "4:26:44", "remaining_time": "0:13:09", "throughput": 2306.16, "total_tokens": 36909000} {"current_steps": 63990, "total_steps": 67140, "loss": 0.5787, "lr": 3.347243893969343e-07, "epoch": 9.53083109919571, "percentage": 95.31, "elapsed_time": "4:26:45", "remaining_time": "0:13:07", "throughput": 2306.17, "total_tokens": 36911848} {"current_steps": 63995, "total_steps": 67140, "loss": 0.4753, "lr": 3.3366531976615767e-07, "epoch": 9.53157581173667, "percentage": 95.32, "elapsed_time": "4:26:46", "remaining_time": "0:13:06", "throughput": 2306.19, "total_tokens": 36914824} {"current_steps": 64000, "total_steps": 67140, "loss": 0.3836, "lr": 3.326079169859941e-07, "epoch": 9.53232052427763, "percentage": 95.32, "elapsed_time": "4:26:47", "remaining_time": "0:13:05", "throughput": 2306.2, "total_tokens": 36917384} {"current_steps": 64005, "total_steps": 67140, "loss": 0.5527, "lr": 3.3155218112789763e-07, "epoch": 9.533065236818588, "percentage": 95.33, "elapsed_time": "4:26:49", "remaining_time": "0:13:04", "throughput": 2306.22, "total_tokens": 36920488} {"current_steps": 64010, "total_steps": 67140, "loss": 0.5622, "lr": 3.3049811226321113e-07, "epoch": 9.533809949359547, "percentage": 95.34, "elapsed_time": "4:26:50", "remaining_time": "0:13:02", "throughput": 2306.25, "total_tokens": 36923688} {"current_steps": 64015, "total_steps": 67140, "loss": 0.5872, "lr": 3.2944571046316373e-07, "epoch": 9.534554661900506, "percentage": 95.35, "elapsed_time": "4:26:51", "remaining_time": "0:13:01", "throughput": 2306.28, "total_tokens": 36926728} {"current_steps": 64020, "total_steps": 67140, "loss": 0.5256, "lr": 3.283949757988708e-07, "epoch": 9.535299374441465, "percentage": 95.35, "elapsed_time": "4:26:52", "remaining_time": "0:13:00", "throughput": 2306.29, "total_tokens": 36929480} {"current_steps": 64025, "total_steps": 67140, "loss": 0.5816, "lr": 3.273459083413366e-07, "epoch": 9.536044086982425, "percentage": 95.36, "elapsed_time": "4:26:53", "remaining_time": "0:12:59", "throughput": 2306.32, "total_tokens": 36932680} {"current_steps": 64030, "total_steps": 67140, "loss": 0.4728, "lr": 3.2629850816145723e-07, "epoch": 9.536788799523384, "percentage": 95.37, "elapsed_time": "4:26:54", "remaining_time": "0:12:57", "throughput": 2306.34, "total_tokens": 36935688} {"current_steps": 64035, "total_steps": 67140, "loss": 0.6092, "lr": 3.2525277533000667e-07, "epoch": 9.537533512064343, "percentage": 95.38, "elapsed_time": "4:26:55", "remaining_time": "0:12:56", "throughput": 2306.36, "total_tokens": 36938664} {"current_steps": 64040, "total_steps": 67140, "loss": 0.4603, "lr": 3.242087099176533e-07, "epoch": 9.538278224605303, "percentage": 95.38, "elapsed_time": "4:26:57", "remaining_time": "0:12:55", "throughput": 2306.38, "total_tokens": 36941736} {"current_steps": 64045, "total_steps": 67140, "loss": 0.5788, "lr": 3.2316631199495186e-07, "epoch": 9.539022937146262, "percentage": 95.39, "elapsed_time": "4:26:58", "remaining_time": "0:12:54", "throughput": 2306.4, "total_tokens": 36944680} {"current_steps": 64050, "total_steps": 67140, "loss": 0.4246, "lr": 3.2212558163234043e-07, "epoch": 9.53976764968722, "percentage": 95.4, "elapsed_time": "4:26:59", "remaining_time": "0:12:52", "throughput": 2306.42, "total_tokens": 36947496} {"current_steps": 64055, "total_steps": 67140, "loss": 0.5655, "lr": 3.2108651890014884e-07, "epoch": 9.54051236222818, "percentage": 95.41, "elapsed_time": "4:27:00", "remaining_time": "0:12:51", "throughput": 2306.44, "total_tokens": 36950504} {"current_steps": 64060, "total_steps": 67140, "loss": 0.5043, "lr": 3.20049123868596e-07, "epoch": 9.541257074769138, "percentage": 95.41, "elapsed_time": "4:27:01", "remaining_time": "0:12:50", "throughput": 2306.45, "total_tokens": 36953160} {"current_steps": 64065, "total_steps": 67140, "loss": 0.4377, "lr": 3.1901339660778127e-07, "epoch": 9.542001787310099, "percentage": 95.42, "elapsed_time": "4:27:02", "remaining_time": "0:12:49", "throughput": 2306.47, "total_tokens": 36956072} {"current_steps": 64070, "total_steps": 67140, "loss": 0.5765, "lr": 3.17979337187696e-07, "epoch": 9.542746499851058, "percentage": 95.43, "elapsed_time": "4:27:03", "remaining_time": "0:12:47", "throughput": 2306.49, "total_tokens": 36959080} {"current_steps": 64075, "total_steps": 67140, "loss": 0.6395, "lr": 3.169469456782148e-07, "epoch": 9.543491212392016, "percentage": 95.43, "elapsed_time": "4:27:05", "remaining_time": "0:12:46", "throughput": 2306.51, "total_tokens": 36961960} {"current_steps": 64080, "total_steps": 67140, "loss": 0.5998, "lr": 3.1591622214910686e-07, "epoch": 9.544235924932975, "percentage": 95.44, "elapsed_time": "4:27:06", "remaining_time": "0:12:45", "throughput": 2306.52, "total_tokens": 36964680} {"current_steps": 64085, "total_steps": 67140, "loss": 0.5985, "lr": 3.1488716667002204e-07, "epoch": 9.544980637473936, "percentage": 95.45, "elapsed_time": "4:27:07", "remaining_time": "0:12:44", "throughput": 2306.54, "total_tokens": 36967720} {"current_steps": 64090, "total_steps": 67140, "loss": 0.5745, "lr": 3.138597793105019e-07, "epoch": 9.545725350014894, "percentage": 95.46, "elapsed_time": "4:27:08", "remaining_time": "0:12:42", "throughput": 2306.56, "total_tokens": 36970760} {"current_steps": 64095, "total_steps": 67140, "loss": 0.6421, "lr": 3.1283406013996874e-07, "epoch": 9.546470062555853, "percentage": 95.46, "elapsed_time": "4:27:09", "remaining_time": "0:12:41", "throughput": 2306.59, "total_tokens": 36973864} {"current_steps": 64100, "total_steps": 67140, "loss": 0.6273, "lr": 3.118100092277421e-07, "epoch": 9.547214775096812, "percentage": 95.47, "elapsed_time": "4:27:10", "remaining_time": "0:12:40", "throughput": 2306.61, "total_tokens": 36976840} {"current_steps": 64105, "total_steps": 67140, "loss": 0.5234, "lr": 3.1078762664301655e-07, "epoch": 9.547959487637772, "percentage": 95.48, "elapsed_time": "4:27:11", "remaining_time": "0:12:39", "throughput": 2306.63, "total_tokens": 36979784} {"current_steps": 64110, "total_steps": 67140, "loss": 0.6763, "lr": 3.097669124548869e-07, "epoch": 9.548704200178731, "percentage": 95.49, "elapsed_time": "4:27:13", "remaining_time": "0:12:37", "throughput": 2306.65, "total_tokens": 36982760} {"current_steps": 64115, "total_steps": 67140, "loss": 0.8655, "lr": 3.087478667323257e-07, "epoch": 9.54944891271969, "percentage": 95.49, "elapsed_time": "4:27:14", "remaining_time": "0:12:36", "throughput": 2306.66, "total_tokens": 36985544} {"current_steps": 64120, "total_steps": 67140, "loss": 0.523, "lr": 3.0773048954419457e-07, "epoch": 9.550193625260649, "percentage": 95.5, "elapsed_time": "4:27:15", "remaining_time": "0:12:35", "throughput": 2306.68, "total_tokens": 36988456} {"current_steps": 64125, "total_steps": 67140, "loss": 0.4737, "lr": 3.0671478095924687e-07, "epoch": 9.55093833780161, "percentage": 95.51, "elapsed_time": "4:27:16", "remaining_time": "0:12:33", "throughput": 2306.68, "total_tokens": 36991112} {"current_steps": 64130, "total_steps": 67140, "loss": 0.5085, "lr": 3.057007410461166e-07, "epoch": 9.551683050342568, "percentage": 95.52, "elapsed_time": "4:27:17", "remaining_time": "0:12:32", "throughput": 2306.7, "total_tokens": 36993960} {"current_steps": 64135, "total_steps": 67140, "loss": 0.6115, "lr": 3.046883698733322e-07, "epoch": 9.552427762883527, "percentage": 95.52, "elapsed_time": "4:27:18", "remaining_time": "0:12:31", "throughput": 2306.71, "total_tokens": 36996680} {"current_steps": 64140, "total_steps": 67140, "loss": 0.4275, "lr": 3.036776675093056e-07, "epoch": 9.553172475424486, "percentage": 95.53, "elapsed_time": "4:27:19", "remaining_time": "0:12:30", "throughput": 2306.73, "total_tokens": 36999624} {"current_steps": 64145, "total_steps": 67140, "loss": 0.3517, "lr": 3.02668634022335e-07, "epoch": 9.553917187965446, "percentage": 95.54, "elapsed_time": "4:27:20", "remaining_time": "0:12:28", "throughput": 2306.74, "total_tokens": 37002408} {"current_steps": 64150, "total_steps": 67140, "loss": 0.5553, "lr": 3.016612694806048e-07, "epoch": 9.554661900506405, "percentage": 95.55, "elapsed_time": "4:27:22", "remaining_time": "0:12:27", "throughput": 2306.76, "total_tokens": 37005448} {"current_steps": 64155, "total_steps": 67140, "loss": 0.6675, "lr": 3.0065557395218825e-07, "epoch": 9.555406613047364, "percentage": 95.55, "elapsed_time": "4:27:23", "remaining_time": "0:12:26", "throughput": 2306.78, "total_tokens": 37008424} {"current_steps": 64160, "total_steps": 67140, "loss": 0.6468, "lr": 2.9965154750504764e-07, "epoch": 9.556151325588322, "percentage": 95.56, "elapsed_time": "4:27:24", "remaining_time": "0:12:25", "throughput": 2306.79, "total_tokens": 37010952} {"current_steps": 64165, "total_steps": 67140, "loss": 0.7953, "lr": 2.9864919020703155e-07, "epoch": 9.556896038129283, "percentage": 95.57, "elapsed_time": "4:27:25", "remaining_time": "0:12:23", "throughput": 2306.81, "total_tokens": 37013864} {"current_steps": 64170, "total_steps": 67140, "loss": 0.5274, "lr": 2.976485021258746e-07, "epoch": 9.557640750670242, "percentage": 95.58, "elapsed_time": "4:27:26", "remaining_time": "0:12:22", "throughput": 2306.82, "total_tokens": 37016584} {"current_steps": 64175, "total_steps": 67140, "loss": 0.5111, "lr": 2.966494833292005e-07, "epoch": 9.5583854632112, "percentage": 95.58, "elapsed_time": "4:27:27", "remaining_time": "0:12:21", "throughput": 2306.83, "total_tokens": 37019528} {"current_steps": 64180, "total_steps": 67140, "loss": 0.4899, "lr": 2.9565213388451917e-07, "epoch": 9.55913017575216, "percentage": 95.59, "elapsed_time": "4:27:28", "remaining_time": "0:12:20", "throughput": 2306.86, "total_tokens": 37022600} {"current_steps": 64185, "total_steps": 67140, "loss": 0.5742, "lr": 2.9465645385922394e-07, "epoch": 9.55987488829312, "percentage": 95.6, "elapsed_time": "4:27:30", "remaining_time": "0:12:18", "throughput": 2306.89, "total_tokens": 37025736} {"current_steps": 64190, "total_steps": 67140, "loss": 0.4068, "lr": 2.9366244332060257e-07, "epoch": 9.560619600834078, "percentage": 95.61, "elapsed_time": "4:27:31", "remaining_time": "0:12:17", "throughput": 2306.91, "total_tokens": 37028776} {"current_steps": 64195, "total_steps": 67140, "loss": 0.4276, "lr": 2.926701023358208e-07, "epoch": 9.561364313375037, "percentage": 95.61, "elapsed_time": "4:27:32", "remaining_time": "0:12:16", "throughput": 2306.92, "total_tokens": 37031496} {"current_steps": 64200, "total_steps": 67140, "loss": 0.3961, "lr": 2.916794309719445e-07, "epoch": 9.562109025915996, "percentage": 95.62, "elapsed_time": "4:27:33", "remaining_time": "0:12:15", "throughput": 2306.93, "total_tokens": 37034440} {"current_steps": 64205, "total_steps": 67140, "loss": 0.3584, "lr": 2.906904292959145e-07, "epoch": 9.562853738456955, "percentage": 95.63, "elapsed_time": "4:27:34", "remaining_time": "0:12:13", "throughput": 2306.95, "total_tokens": 37037256} {"current_steps": 64210, "total_steps": 67140, "loss": 0.5458, "lr": 2.8970309737456625e-07, "epoch": 9.563598450997915, "percentage": 95.64, "elapsed_time": "4:27:35", "remaining_time": "0:12:12", "throughput": 2306.96, "total_tokens": 37040072} {"current_steps": 64215, "total_steps": 67140, "loss": 0.6591, "lr": 2.8871743527461583e-07, "epoch": 9.564343163538874, "percentage": 95.64, "elapsed_time": "4:27:36", "remaining_time": "0:12:11", "throughput": 2306.98, "total_tokens": 37042984} {"current_steps": 64220, "total_steps": 67140, "loss": 0.5998, "lr": 2.877334430626738e-07, "epoch": 9.565087876079833, "percentage": 95.65, "elapsed_time": "4:27:38", "remaining_time": "0:12:10", "throughput": 2306.99, "total_tokens": 37045768} {"current_steps": 64225, "total_steps": 67140, "loss": 0.4549, "lr": 2.867511208052315e-07, "epoch": 9.565832588620792, "percentage": 95.66, "elapsed_time": "4:27:39", "remaining_time": "0:12:08", "throughput": 2307.0, "total_tokens": 37048456} {"current_steps": 64230, "total_steps": 67140, "loss": 0.6853, "lr": 2.857704685686718e-07, "epoch": 9.566577301161752, "percentage": 95.67, "elapsed_time": "4:27:40", "remaining_time": "0:12:07", "throughput": 2307.01, "total_tokens": 37051208} {"current_steps": 64235, "total_steps": 67140, "loss": 0.4332, "lr": 2.8479148641926134e-07, "epoch": 9.56732201370271, "percentage": 95.67, "elapsed_time": "4:27:41", "remaining_time": "0:12:06", "throughput": 2307.02, "total_tokens": 37053992} {"current_steps": 64240, "total_steps": 67140, "loss": 0.4388, "lr": 2.8381417442316093e-07, "epoch": 9.56806672624367, "percentage": 95.68, "elapsed_time": "4:27:42", "remaining_time": "0:12:05", "throughput": 2307.04, "total_tokens": 37056840} {"current_steps": 64245, "total_steps": 67140, "loss": 0.7394, "lr": 2.8283853264640947e-07, "epoch": 9.568811438784628, "percentage": 95.69, "elapsed_time": "4:27:43", "remaining_time": "0:12:03", "throughput": 2307.06, "total_tokens": 37059944} {"current_steps": 64250, "total_steps": 67140, "loss": 0.5635, "lr": 2.8186456115493475e-07, "epoch": 9.569556151325589, "percentage": 95.7, "elapsed_time": "4:27:44", "remaining_time": "0:12:02", "throughput": 2307.09, "total_tokens": 37063112} {"current_steps": 64255, "total_steps": 67140, "loss": 0.753, "lr": 2.8089226001455913e-07, "epoch": 9.570300863866548, "percentage": 95.7, "elapsed_time": "4:27:46", "remaining_time": "0:12:01", "throughput": 2307.11, "total_tokens": 37066216} {"current_steps": 64260, "total_steps": 67140, "loss": 0.5211, "lr": 2.799216292909829e-07, "epoch": 9.571045576407506, "percentage": 95.71, "elapsed_time": "4:27:47", "remaining_time": "0:12:00", "throughput": 2307.12, "total_tokens": 37068904} {"current_steps": 64265, "total_steps": 67140, "loss": 0.5399, "lr": 2.789526690497979e-07, "epoch": 9.571790288948465, "percentage": 95.72, "elapsed_time": "4:27:48", "remaining_time": "0:11:58", "throughput": 2307.13, "total_tokens": 37071656} {"current_steps": 64270, "total_steps": 67140, "loss": 0.5143, "lr": 2.779853793564852e-07, "epoch": 9.572535001489426, "percentage": 95.73, "elapsed_time": "4:27:49", "remaining_time": "0:11:57", "throughput": 2307.15, "total_tokens": 37074600} {"current_steps": 64275, "total_steps": 67140, "loss": 0.3624, "lr": 2.7701976027640353e-07, "epoch": 9.573279714030384, "percentage": 95.73, "elapsed_time": "4:27:50", "remaining_time": "0:11:56", "throughput": 2307.17, "total_tokens": 37077384} {"current_steps": 64280, "total_steps": 67140, "loss": 0.5466, "lr": 2.7605581187481467e-07, "epoch": 9.574024426571343, "percentage": 95.74, "elapsed_time": "4:27:51", "remaining_time": "0:11:55", "throughput": 2307.2, "total_tokens": 37080584} {"current_steps": 64285, "total_steps": 67140, "loss": 0.5785, "lr": 2.750935342168526e-07, "epoch": 9.574769139112302, "percentage": 95.75, "elapsed_time": "4:27:52", "remaining_time": "0:11:53", "throughput": 2307.21, "total_tokens": 37083400} {"current_steps": 64290, "total_steps": 67140, "loss": 0.7834, "lr": 2.741329273675458e-07, "epoch": 9.575513851653263, "percentage": 95.76, "elapsed_time": "4:27:53", "remaining_time": "0:11:52", "throughput": 2307.24, "total_tokens": 37086600} {"current_steps": 64295, "total_steps": 67140, "loss": 0.4762, "lr": 2.7317399139180634e-07, "epoch": 9.576258564194221, "percentage": 95.76, "elapsed_time": "4:27:55", "remaining_time": "0:11:51", "throughput": 2307.25, "total_tokens": 37089288} {"current_steps": 64300, "total_steps": 67140, "loss": 0.7314, "lr": 2.7221672635443783e-07, "epoch": 9.57700327673518, "percentage": 95.77, "elapsed_time": "4:27:56", "remaining_time": "0:11:50", "throughput": 2307.27, "total_tokens": 37092136} {"current_steps": 64305, "total_steps": 67140, "loss": 0.5038, "lr": 2.712611323201275e-07, "epoch": 9.577747989276139, "percentage": 95.78, "elapsed_time": "4:27:57", "remaining_time": "0:11:48", "throughput": 2307.29, "total_tokens": 37095208} {"current_steps": 64310, "total_steps": 67140, "loss": 0.4916, "lr": 2.7030720935344867e-07, "epoch": 9.5784927018171, "percentage": 95.78, "elapsed_time": "4:27:58", "remaining_time": "0:11:47", "throughput": 2307.3, "total_tokens": 37097928} {"current_steps": 64315, "total_steps": 67140, "loss": 0.4959, "lr": 2.6935495751886644e-07, "epoch": 9.579237414358058, "percentage": 95.79, "elapsed_time": "4:27:59", "remaining_time": "0:11:46", "throughput": 2307.31, "total_tokens": 37100712} {"current_steps": 64320, "total_steps": 67140, "loss": 0.6956, "lr": 2.6840437688072653e-07, "epoch": 9.579982126899017, "percentage": 95.8, "elapsed_time": "4:28:00", "remaining_time": "0:11:45", "throughput": 2307.33, "total_tokens": 37103656} {"current_steps": 64325, "total_steps": 67140, "loss": 0.626, "lr": 2.6745546750326924e-07, "epoch": 9.580726839439976, "percentage": 95.81, "elapsed_time": "4:28:01", "remaining_time": "0:11:43", "throughput": 2307.35, "total_tokens": 37106568} {"current_steps": 64330, "total_steps": 67140, "loss": 0.509, "lr": 2.665082294506155e-07, "epoch": 9.581471551980936, "percentage": 95.81, "elapsed_time": "4:28:02", "remaining_time": "0:11:42", "throughput": 2307.35, "total_tokens": 37109128} {"current_steps": 64335, "total_steps": 67140, "loss": 0.5224, "lr": 2.655626627867752e-07, "epoch": 9.582216264521895, "percentage": 95.82, "elapsed_time": "4:28:04", "remaining_time": "0:11:41", "throughput": 2307.38, "total_tokens": 37112168} {"current_steps": 64340, "total_steps": 67140, "loss": 0.6531, "lr": 2.6461876757565007e-07, "epoch": 9.582960977062854, "percentage": 95.83, "elapsed_time": "4:28:05", "remaining_time": "0:11:40", "throughput": 2307.39, "total_tokens": 37114952} {"current_steps": 64345, "total_steps": 67140, "loss": 0.2998, "lr": 2.6367654388102236e-07, "epoch": 9.583705689603812, "percentage": 95.84, "elapsed_time": "4:28:06", "remaining_time": "0:11:38", "throughput": 2307.42, "total_tokens": 37118248} {"current_steps": 64350, "total_steps": 67140, "loss": 0.4964, "lr": 2.6273599176656063e-07, "epoch": 9.584450402144771, "percentage": 95.84, "elapsed_time": "4:28:07", "remaining_time": "0:11:37", "throughput": 2307.44, "total_tokens": 37121160} {"current_steps": 64355, "total_steps": 67140, "loss": 0.5219, "lr": 2.617971112958278e-07, "epoch": 9.585195114685732, "percentage": 95.85, "elapsed_time": "4:28:08", "remaining_time": "0:11:36", "throughput": 2307.46, "total_tokens": 37124264} {"current_steps": 64360, "total_steps": 67140, "loss": 0.5559, "lr": 2.6085990253226776e-07, "epoch": 9.58593982722669, "percentage": 95.86, "elapsed_time": "4:28:09", "remaining_time": "0:11:34", "throughput": 2307.47, "total_tokens": 37126888} {"current_steps": 64365, "total_steps": 67140, "loss": 0.5602, "lr": 2.5992436553921304e-07, "epoch": 9.58668453976765, "percentage": 95.87, "elapsed_time": "4:28:11", "remaining_time": "0:11:33", "throughput": 2307.5, "total_tokens": 37130056} {"current_steps": 64370, "total_steps": 67140, "loss": 0.5478, "lr": 2.589905003798826e-07, "epoch": 9.58742925230861, "percentage": 95.87, "elapsed_time": "4:28:12", "remaining_time": "0:11:32", "throughput": 2307.51, "total_tokens": 37132840} {"current_steps": 64375, "total_steps": 67140, "loss": 0.7384, "lr": 2.58058307117387e-07, "epoch": 9.588173964849569, "percentage": 95.88, "elapsed_time": "4:28:13", "remaining_time": "0:11:31", "throughput": 2307.53, "total_tokens": 37135976} {"current_steps": 64380, "total_steps": 67140, "loss": 0.5953, "lr": 2.571277858147175e-07, "epoch": 9.588918677390527, "percentage": 95.89, "elapsed_time": "4:28:14", "remaining_time": "0:11:29", "throughput": 2307.56, "total_tokens": 37139112} {"current_steps": 64385, "total_steps": 67140, "loss": 0.7857, "lr": 2.561989365347545e-07, "epoch": 9.589663389931486, "percentage": 95.9, "elapsed_time": "4:28:15", "remaining_time": "0:11:28", "throughput": 2307.56, "total_tokens": 37141704} {"current_steps": 64390, "total_steps": 67140, "loss": 0.5345, "lr": 2.5527175934026426e-07, "epoch": 9.590408102472445, "percentage": 95.9, "elapsed_time": "4:28:16", "remaining_time": "0:11:27", "throughput": 2307.58, "total_tokens": 37144424} {"current_steps": 64395, "total_steps": 67140, "loss": 0.5142, "lr": 2.5434625429390515e-07, "epoch": 9.591152815013405, "percentage": 95.91, "elapsed_time": "4:28:17", "remaining_time": "0:11:26", "throughput": 2307.59, "total_tokens": 37147368} {"current_steps": 64400, "total_steps": 67140, "loss": 0.5172, "lr": 2.534224214582187e-07, "epoch": 9.591897527554364, "percentage": 95.92, "elapsed_time": "4:28:18", "remaining_time": "0:11:24", "throughput": 2307.6, "total_tokens": 37149992} {"current_steps": 64405, "total_steps": 67140, "loss": 0.4283, "lr": 2.5250026089563004e-07, "epoch": 9.592642240095323, "percentage": 95.93, "elapsed_time": "4:28:20", "remaining_time": "0:11:23", "throughput": 2307.62, "total_tokens": 37152904} {"current_steps": 64410, "total_steps": 67140, "loss": 0.517, "lr": 2.5157977266846157e-07, "epoch": 9.593386952636282, "percentage": 95.93, "elapsed_time": "4:28:21", "remaining_time": "0:11:22", "throughput": 2307.63, "total_tokens": 37155784} {"current_steps": 64415, "total_steps": 67140, "loss": 0.5525, "lr": 2.5066095683891067e-07, "epoch": 9.594131665177242, "percentage": 95.94, "elapsed_time": "4:28:22", "remaining_time": "0:11:21", "throughput": 2307.65, "total_tokens": 37158632} {"current_steps": 64420, "total_steps": 67140, "loss": 0.7836, "lr": 2.497438134690694e-07, "epoch": 9.594876377718201, "percentage": 95.95, "elapsed_time": "4:28:23", "remaining_time": "0:11:19", "throughput": 2307.66, "total_tokens": 37161416} {"current_steps": 64425, "total_steps": 67140, "loss": 0.7056, "lr": 2.4882834262091317e-07, "epoch": 9.59562109025916, "percentage": 95.96, "elapsed_time": "4:28:24", "remaining_time": "0:11:18", "throughput": 2307.67, "total_tokens": 37164232} {"current_steps": 64430, "total_steps": 67140, "loss": 0.6802, "lr": 2.4791454435630634e-07, "epoch": 9.596365802800118, "percentage": 95.96, "elapsed_time": "4:28:25", "remaining_time": "0:11:17", "throughput": 2307.7, "total_tokens": 37167272} {"current_steps": 64435, "total_steps": 67140, "loss": 0.478, "lr": 2.4700241873699957e-07, "epoch": 9.597110515341079, "percentage": 95.97, "elapsed_time": "4:28:26", "remaining_time": "0:11:16", "throughput": 2307.71, "total_tokens": 37169992} {"current_steps": 64440, "total_steps": 67140, "loss": 0.5415, "lr": 2.460919658246297e-07, "epoch": 9.597855227882038, "percentage": 95.98, "elapsed_time": "4:28:28", "remaining_time": "0:11:14", "throughput": 2307.72, "total_tokens": 37172840} {"current_steps": 64445, "total_steps": 67140, "loss": 0.526, "lr": 2.4518318568072797e-07, "epoch": 9.598599940422996, "percentage": 95.99, "elapsed_time": "4:28:29", "remaining_time": "0:11:13", "throughput": 2307.74, "total_tokens": 37175848} {"current_steps": 64450, "total_steps": 67140, "loss": 0.5846, "lr": 2.442760783666953e-07, "epoch": 9.599344652963955, "percentage": 95.99, "elapsed_time": "4:28:30", "remaining_time": "0:11:12", "throughput": 2307.75, "total_tokens": 37178632} {"current_steps": 64455, "total_steps": 67140, "loss": 0.6623, "lr": 2.433706439438382e-07, "epoch": 9.600089365504916, "percentage": 96.0, "elapsed_time": "4:28:31", "remaining_time": "0:11:11", "throughput": 2307.78, "total_tokens": 37181736} {"current_steps": 64460, "total_steps": 67140, "loss": 0.6489, "lr": 2.4246688247334117e-07, "epoch": 9.600834078045875, "percentage": 96.01, "elapsed_time": "4:28:32", "remaining_time": "0:11:09", "throughput": 2307.79, "total_tokens": 37184552} {"current_steps": 64465, "total_steps": 67140, "loss": 0.5062, "lr": 2.4156479401627465e-07, "epoch": 9.601578790586833, "percentage": 96.02, "elapsed_time": "4:28:33", "remaining_time": "0:11:08", "throughput": 2307.82, "total_tokens": 37187592} {"current_steps": 64470, "total_steps": 67140, "loss": 0.4381, "lr": 2.4066437863359545e-07, "epoch": 9.602323503127792, "percentage": 96.02, "elapsed_time": "4:28:34", "remaining_time": "0:11:07", "throughput": 2307.83, "total_tokens": 37190248} {"current_steps": 64475, "total_steps": 67140, "loss": 0.542, "lr": 2.397656363861578e-07, "epoch": 9.603068215668753, "percentage": 96.03, "elapsed_time": "4:28:35", "remaining_time": "0:11:06", "throughput": 2307.84, "total_tokens": 37193096} {"current_steps": 64480, "total_steps": 67140, "loss": 0.5842, "lr": 2.388685673346908e-07, "epoch": 9.603812928209711, "percentage": 96.04, "elapsed_time": "4:28:37", "remaining_time": "0:11:04", "throughput": 2307.85, "total_tokens": 37195784} {"current_steps": 64485, "total_steps": 67140, "loss": 0.5692, "lr": 2.379731715398098e-07, "epoch": 9.60455764075067, "percentage": 96.05, "elapsed_time": "4:28:38", "remaining_time": "0:11:03", "throughput": 2307.86, "total_tokens": 37198536} {"current_steps": 64490, "total_steps": 67140, "loss": 0.4392, "lr": 2.3707944906203038e-07, "epoch": 9.605302353291629, "percentage": 96.05, "elapsed_time": "4:28:39", "remaining_time": "0:11:02", "throughput": 2307.87, "total_tokens": 37201256} {"current_steps": 64495, "total_steps": 67140, "loss": 0.6846, "lr": 2.361873999617431e-07, "epoch": 9.60604706583259, "percentage": 96.06, "elapsed_time": "4:28:40", "remaining_time": "0:11:01", "throughput": 2307.88, "total_tokens": 37203912} {"current_steps": 64500, "total_steps": 67140, "loss": 0.4465, "lr": 2.352970242992303e-07, "epoch": 9.606791778373548, "percentage": 96.07, "elapsed_time": "4:28:41", "remaining_time": "0:10:59", "throughput": 2307.89, "total_tokens": 37206664} {"current_steps": 64505, "total_steps": 67140, "loss": 0.4978, "lr": 2.344083221346549e-07, "epoch": 9.607536490914507, "percentage": 96.08, "elapsed_time": "4:28:42", "remaining_time": "0:10:58", "throughput": 2307.92, "total_tokens": 37209800} {"current_steps": 64510, "total_steps": 67140, "loss": 0.4822, "lr": 2.3352129352808007e-07, "epoch": 9.608281203455466, "percentage": 96.08, "elapsed_time": "4:28:43", "remaining_time": "0:10:57", "throughput": 2307.93, "total_tokens": 37212712} {"current_steps": 64515, "total_steps": 67140, "loss": 0.4961, "lr": 2.326359385394383e-07, "epoch": 9.609025915996426, "percentage": 96.09, "elapsed_time": "4:28:44", "remaining_time": "0:10:56", "throughput": 2307.95, "total_tokens": 37215656} {"current_steps": 64520, "total_steps": 67140, "loss": 0.673, "lr": 2.317522572285652e-07, "epoch": 9.609770628537385, "percentage": 96.1, "elapsed_time": "4:28:46", "remaining_time": "0:10:54", "throughput": 2307.97, "total_tokens": 37218472} {"current_steps": 64525, "total_steps": 67140, "loss": 0.8316, "lr": 2.30870249655174e-07, "epoch": 9.610515341078344, "percentage": 96.11, "elapsed_time": "4:28:47", "remaining_time": "0:10:53", "throughput": 2307.97, "total_tokens": 37221064} {"current_steps": 64530, "total_steps": 67140, "loss": 0.6464, "lr": 2.2998991587886709e-07, "epoch": 9.611260053619302, "percentage": 96.11, "elapsed_time": "4:28:48", "remaining_time": "0:10:52", "throughput": 2307.98, "total_tokens": 37223816} {"current_steps": 64535, "total_steps": 67140, "loss": 0.4905, "lr": 2.2911125595913296e-07, "epoch": 9.612004766160261, "percentage": 96.12, "elapsed_time": "4:28:49", "remaining_time": "0:10:51", "throughput": 2307.99, "total_tokens": 37226600} {"current_steps": 64540, "total_steps": 67140, "loss": 0.5535, "lr": 2.2823426995535192e-07, "epoch": 9.612749478701222, "percentage": 96.13, "elapsed_time": "4:28:50", "remaining_time": "0:10:49", "throughput": 2308.01, "total_tokens": 37229512} {"current_steps": 64545, "total_steps": 67140, "loss": 0.4405, "lr": 2.2735895792678485e-07, "epoch": 9.61349419124218, "percentage": 96.13, "elapsed_time": "4:28:51", "remaining_time": "0:10:48", "throughput": 2308.03, "total_tokens": 37232360} {"current_steps": 64550, "total_steps": 67140, "loss": 0.592, "lr": 2.2648531993257893e-07, "epoch": 9.61423890378314, "percentage": 96.14, "elapsed_time": "4:28:52", "remaining_time": "0:10:47", "throughput": 2308.04, "total_tokens": 37235304} {"current_steps": 64555, "total_steps": 67140, "loss": 0.6399, "lr": 2.2561335603177302e-07, "epoch": 9.6149836163241, "percentage": 96.15, "elapsed_time": "4:28:53", "remaining_time": "0:10:46", "throughput": 2308.06, "total_tokens": 37238216} {"current_steps": 64560, "total_steps": 67140, "loss": 0.536, "lr": 2.2474306628329222e-07, "epoch": 9.615728328865059, "percentage": 96.16, "elapsed_time": "4:28:55", "remaining_time": "0:10:44", "throughput": 2308.07, "total_tokens": 37240904} {"current_steps": 64565, "total_steps": 67140, "loss": 0.616, "lr": 2.2387445074594505e-07, "epoch": 9.616473041406017, "percentage": 96.16, "elapsed_time": "4:28:56", "remaining_time": "0:10:43", "throughput": 2308.09, "total_tokens": 37243976} {"current_steps": 64570, "total_steps": 67140, "loss": 0.532, "lr": 2.2300750947843174e-07, "epoch": 9.617217753946976, "percentage": 96.17, "elapsed_time": "4:28:57", "remaining_time": "0:10:42", "throughput": 2308.1, "total_tokens": 37246728} {"current_steps": 64575, "total_steps": 67140, "loss": 0.5989, "lr": 2.2214224253933326e-07, "epoch": 9.617962466487935, "percentage": 96.18, "elapsed_time": "4:28:58", "remaining_time": "0:10:41", "throughput": 2308.12, "total_tokens": 37249512} {"current_steps": 64580, "total_steps": 67140, "loss": 0.5566, "lr": 2.21278649987125e-07, "epoch": 9.618707179028895, "percentage": 96.19, "elapsed_time": "4:28:59", "remaining_time": "0:10:39", "throughput": 2308.14, "total_tokens": 37252552} {"current_steps": 64585, "total_steps": 67140, "loss": 0.4614, "lr": 2.204167318801603e-07, "epoch": 9.619451891569854, "percentage": 96.19, "elapsed_time": "4:29:00", "remaining_time": "0:10:38", "throughput": 2308.16, "total_tokens": 37255560} {"current_steps": 64590, "total_steps": 67140, "loss": 0.5828, "lr": 2.1955648827668708e-07, "epoch": 9.620196604110813, "percentage": 96.2, "elapsed_time": "4:29:01", "remaining_time": "0:10:37", "throughput": 2308.17, "total_tokens": 37258280} {"current_steps": 64595, "total_steps": 67140, "loss": 0.4826, "lr": 2.186979192348365e-07, "epoch": 9.620941316651772, "percentage": 96.21, "elapsed_time": "4:29:03", "remaining_time": "0:10:36", "throughput": 2308.18, "total_tokens": 37261064} {"current_steps": 64600, "total_steps": 67140, "loss": 0.5713, "lr": 2.178410248126289e-07, "epoch": 9.621686029192732, "percentage": 96.22, "elapsed_time": "4:29:04", "remaining_time": "0:10:34", "throughput": 2308.2, "total_tokens": 37263880} {"current_steps": 64605, "total_steps": 67140, "loss": 0.643, "lr": 2.1698580506796517e-07, "epoch": 9.622430741733691, "percentage": 96.22, "elapsed_time": "4:29:05", "remaining_time": "0:10:33", "throughput": 2308.2, "total_tokens": 37266504} {"current_steps": 64610, "total_steps": 67140, "loss": 0.4831, "lr": 2.1613226005864074e-07, "epoch": 9.62317545427465, "percentage": 96.23, "elapsed_time": "4:29:06", "remaining_time": "0:10:32", "throughput": 2308.22, "total_tokens": 37269320} {"current_steps": 64615, "total_steps": 67140, "loss": 0.5841, "lr": 2.1528038984233722e-07, "epoch": 9.623920166815608, "percentage": 96.24, "elapsed_time": "4:29:07", "remaining_time": "0:10:31", "throughput": 2308.23, "total_tokens": 37272200} {"current_steps": 64620, "total_steps": 67140, "loss": 0.582, "lr": 2.1443019447661417e-07, "epoch": 9.624664879356569, "percentage": 96.25, "elapsed_time": "4:29:08", "remaining_time": "0:10:29", "throughput": 2308.26, "total_tokens": 37275208} {"current_steps": 64625, "total_steps": 67140, "loss": 0.7142, "lr": 2.1358167401892838e-07, "epoch": 9.625409591897528, "percentage": 96.25, "elapsed_time": "4:29:09", "remaining_time": "0:10:28", "throughput": 2308.27, "total_tokens": 37278088} {"current_steps": 64630, "total_steps": 67140, "loss": 0.652, "lr": 2.1273482852662007e-07, "epoch": 9.626154304438487, "percentage": 96.26, "elapsed_time": "4:29:10", "remaining_time": "0:10:27", "throughput": 2308.29, "total_tokens": 37280872} {"current_steps": 64635, "total_steps": 67140, "loss": 0.6991, "lr": 2.1188965805691297e-07, "epoch": 9.626899016979445, "percentage": 96.27, "elapsed_time": "4:29:12", "remaining_time": "0:10:25", "throughput": 2308.31, "total_tokens": 37283848} {"current_steps": 64640, "total_steps": 67140, "loss": 0.3679, "lr": 2.1104616266692524e-07, "epoch": 9.627643729520406, "percentage": 96.28, "elapsed_time": "4:29:13", "remaining_time": "0:10:24", "throughput": 2308.33, "total_tokens": 37286760} {"current_steps": 64645, "total_steps": 67140, "loss": 0.455, "lr": 2.1020434241365017e-07, "epoch": 9.628388442061365, "percentage": 96.28, "elapsed_time": "4:29:14", "remaining_time": "0:10:23", "throughput": 2308.33, "total_tokens": 37289448} {"current_steps": 64650, "total_steps": 67140, "loss": 0.5633, "lr": 2.0936419735397562e-07, "epoch": 9.629133154602323, "percentage": 96.29, "elapsed_time": "4:29:15", "remaining_time": "0:10:22", "throughput": 2308.34, "total_tokens": 37292168} {"current_steps": 64655, "total_steps": 67140, "loss": 0.6376, "lr": 2.0852572754468113e-07, "epoch": 9.629877867143282, "percentage": 96.3, "elapsed_time": "4:29:16", "remaining_time": "0:10:20", "throughput": 2308.37, "total_tokens": 37295432} {"current_steps": 64660, "total_steps": 67140, "loss": 0.5785, "lr": 2.0768893304242142e-07, "epoch": 9.630622579684243, "percentage": 96.31, "elapsed_time": "4:29:17", "remaining_time": "0:10:19", "throughput": 2308.38, "total_tokens": 37298088} {"current_steps": 64665, "total_steps": 67140, "loss": 0.7293, "lr": 2.0685381390374568e-07, "epoch": 9.631367292225201, "percentage": 96.31, "elapsed_time": "4:29:18", "remaining_time": "0:10:18", "throughput": 2308.39, "total_tokens": 37300904} {"current_steps": 64670, "total_steps": 67140, "loss": 0.5017, "lr": 2.0602037018508658e-07, "epoch": 9.63211200476616, "percentage": 96.32, "elapsed_time": "4:29:19", "remaining_time": "0:10:17", "throughput": 2308.41, "total_tokens": 37303912} {"current_steps": 64675, "total_steps": 67140, "loss": 0.625, "lr": 2.0518860194276846e-07, "epoch": 9.632856717307119, "percentage": 96.33, "elapsed_time": "4:29:21", "remaining_time": "0:10:15", "throughput": 2308.42, "total_tokens": 37306728} {"current_steps": 64680, "total_steps": 67140, "loss": 0.6707, "lr": 2.043585092329936e-07, "epoch": 9.63360142984808, "percentage": 96.34, "elapsed_time": "4:29:22", "remaining_time": "0:10:14", "throughput": 2308.43, "total_tokens": 37309256} {"current_steps": 64685, "total_steps": 67140, "loss": 0.5681, "lr": 2.035300921118616e-07, "epoch": 9.634346142389038, "percentage": 96.34, "elapsed_time": "4:29:23", "remaining_time": "0:10:13", "throughput": 2308.44, "total_tokens": 37311976} {"current_steps": 64690, "total_steps": 67140, "loss": 0.7116, "lr": 2.0270335063534706e-07, "epoch": 9.635090854929997, "percentage": 96.35, "elapsed_time": "4:29:24", "remaining_time": "0:10:12", "throughput": 2308.45, "total_tokens": 37314728} {"current_steps": 64695, "total_steps": 67140, "loss": 0.5958, "lr": 2.018782848593248e-07, "epoch": 9.635835567470956, "percentage": 96.36, "elapsed_time": "4:29:25", "remaining_time": "0:10:10", "throughput": 2308.47, "total_tokens": 37317768} {"current_steps": 64700, "total_steps": 67140, "loss": 0.618, "lr": 2.0105489483954466e-07, "epoch": 9.636580280011916, "percentage": 96.37, "elapsed_time": "4:29:26", "remaining_time": "0:10:09", "throughput": 2308.49, "total_tokens": 37320776} {"current_steps": 64705, "total_steps": 67140, "loss": 0.6903, "lr": 2.0023318063165098e-07, "epoch": 9.637324992552875, "percentage": 96.37, "elapsed_time": "4:29:27", "remaining_time": "0:10:08", "throughput": 2308.51, "total_tokens": 37323656} {"current_steps": 64710, "total_steps": 67140, "loss": 0.6191, "lr": 1.9941314229117157e-07, "epoch": 9.638069705093834, "percentage": 96.38, "elapsed_time": "4:29:29", "remaining_time": "0:10:07", "throughput": 2308.54, "total_tokens": 37326792} {"current_steps": 64715, "total_steps": 67140, "loss": 0.4541, "lr": 1.9859477987351771e-07, "epoch": 9.638814417634793, "percentage": 96.39, "elapsed_time": "4:29:30", "remaining_time": "0:10:05", "throughput": 2308.55, "total_tokens": 37329736} {"current_steps": 64720, "total_steps": 67140, "loss": 0.5233, "lr": 1.9777809343399234e-07, "epoch": 9.639559130175751, "percentage": 96.4, "elapsed_time": "4:29:31", "remaining_time": "0:10:04", "throughput": 2308.57, "total_tokens": 37332648} {"current_steps": 64725, "total_steps": 67140, "loss": 0.5302, "lr": 1.9696308302778744e-07, "epoch": 9.640303842716712, "percentage": 96.4, "elapsed_time": "4:29:32", "remaining_time": "0:10:03", "throughput": 2308.6, "total_tokens": 37335752} {"current_steps": 64730, "total_steps": 67140, "loss": 0.564, "lr": 1.961497487099756e-07, "epoch": 9.64104855525767, "percentage": 96.41, "elapsed_time": "4:29:33", "remaining_time": "0:10:02", "throughput": 2308.61, "total_tokens": 37338472} {"current_steps": 64735, "total_steps": 67140, "loss": 0.5656, "lr": 1.9533809053551565e-07, "epoch": 9.64179326779863, "percentage": 96.42, "elapsed_time": "4:29:34", "remaining_time": "0:10:00", "throughput": 2308.63, "total_tokens": 37341448} {"current_steps": 64740, "total_steps": 67140, "loss": 0.4542, "lr": 1.9452810855926372e-07, "epoch": 9.642537980339588, "percentage": 96.43, "elapsed_time": "4:29:35", "remaining_time": "0:09:59", "throughput": 2308.65, "total_tokens": 37344392} {"current_steps": 64745, "total_steps": 67140, "loss": 0.5345, "lr": 1.9371980283594826e-07, "epoch": 9.643282692880549, "percentage": 96.43, "elapsed_time": "4:29:36", "remaining_time": "0:09:58", "throughput": 2308.65, "total_tokens": 37347080} {"current_steps": 64750, "total_steps": 67140, "loss": 0.5156, "lr": 1.929131734201922e-07, "epoch": 9.644027405421507, "percentage": 96.44, "elapsed_time": "4:29:38", "remaining_time": "0:09:57", "throughput": 2308.67, "total_tokens": 37349896} {"current_steps": 64755, "total_steps": 67140, "loss": 0.7253, "lr": 1.9210822036650755e-07, "epoch": 9.644772117962466, "percentage": 96.45, "elapsed_time": "4:29:39", "remaining_time": "0:09:55", "throughput": 2308.68, "total_tokens": 37352712} {"current_steps": 64760, "total_steps": 67140, "loss": 0.584, "lr": 1.9130494372928688e-07, "epoch": 9.645516830503425, "percentage": 96.46, "elapsed_time": "4:29:40", "remaining_time": "0:09:54", "throughput": 2308.7, "total_tokens": 37355720} {"current_steps": 64765, "total_steps": 67140, "loss": 0.4348, "lr": 1.9050334356281175e-07, "epoch": 9.646261543044385, "percentage": 96.46, "elapsed_time": "4:29:41", "remaining_time": "0:09:53", "throughput": 2308.71, "total_tokens": 37358408} {"current_steps": 64770, "total_steps": 67140, "loss": 0.4173, "lr": 1.897034199212555e-07, "epoch": 9.647006255585344, "percentage": 96.47, "elapsed_time": "4:29:42", "remaining_time": "0:09:52", "throughput": 2308.74, "total_tokens": 37361544} {"current_steps": 64775, "total_steps": 67140, "loss": 0.5596, "lr": 1.8890517285866938e-07, "epoch": 9.647750968126303, "percentage": 96.48, "elapsed_time": "4:29:43", "remaining_time": "0:09:50", "throughput": 2308.75, "total_tokens": 37364328} {"current_steps": 64780, "total_steps": 67140, "loss": 0.4575, "lr": 1.881086024289963e-07, "epoch": 9.648495680667262, "percentage": 96.48, "elapsed_time": "4:29:44", "remaining_time": "0:09:49", "throughput": 2308.78, "total_tokens": 37367464} {"current_steps": 64785, "total_steps": 67140, "loss": 0.8725, "lr": 1.8731370868606824e-07, "epoch": 9.649240393208222, "percentage": 96.49, "elapsed_time": "4:29:46", "remaining_time": "0:09:48", "throughput": 2308.79, "total_tokens": 37370216} {"current_steps": 64790, "total_steps": 67140, "loss": 0.507, "lr": 1.8652049168359774e-07, "epoch": 9.649985105749181, "percentage": 96.5, "elapsed_time": "4:29:47", "remaining_time": "0:09:47", "throughput": 2308.79, "total_tokens": 37372840} {"current_steps": 64795, "total_steps": 67140, "loss": 0.6047, "lr": 1.857289514751892e-07, "epoch": 9.65072981829014, "percentage": 96.51, "elapsed_time": "4:29:48", "remaining_time": "0:09:45", "throughput": 2308.81, "total_tokens": 37375816} {"current_steps": 64800, "total_steps": 67140, "loss": 0.4805, "lr": 1.849390881143276e-07, "epoch": 9.651474530831099, "percentage": 96.51, "elapsed_time": "4:29:49", "remaining_time": "0:09:44", "throughput": 2308.83, "total_tokens": 37378664} {"current_steps": 64805, "total_steps": 67140, "loss": 0.5228, "lr": 1.8415090165439519e-07, "epoch": 9.652219243372059, "percentage": 96.52, "elapsed_time": "4:29:50", "remaining_time": "0:09:43", "throughput": 2308.84, "total_tokens": 37381384} {"current_steps": 64810, "total_steps": 67140, "loss": 0.7236, "lr": 1.8336439214864943e-07, "epoch": 9.652963955913018, "percentage": 96.53, "elapsed_time": "4:29:51", "remaining_time": "0:09:42", "throughput": 2308.85, "total_tokens": 37384072} {"current_steps": 64815, "total_steps": 67140, "loss": 0.6372, "lr": 1.8257955965023943e-07, "epoch": 9.653708668453977, "percentage": 96.54, "elapsed_time": "4:29:52", "remaining_time": "0:09:40", "throughput": 2308.86, "total_tokens": 37386856} {"current_steps": 64820, "total_steps": 67140, "loss": 0.2705, "lr": 1.8179640421220333e-07, "epoch": 9.654453380994935, "percentage": 96.54, "elapsed_time": "4:29:53", "remaining_time": "0:09:39", "throughput": 2308.87, "total_tokens": 37389480} {"current_steps": 64825, "total_steps": 67140, "loss": 0.7577, "lr": 1.8101492588746549e-07, "epoch": 9.655198093535896, "percentage": 96.55, "elapsed_time": "4:29:54", "remaining_time": "0:09:38", "throughput": 2308.88, "total_tokens": 37392200} {"current_steps": 64830, "total_steps": 67140, "loss": 0.6343, "lr": 1.8023512472883087e-07, "epoch": 9.655942806076855, "percentage": 96.56, "elapsed_time": "4:29:56", "remaining_time": "0:09:37", "throughput": 2308.89, "total_tokens": 37395016} {"current_steps": 64835, "total_steps": 67140, "loss": 0.6426, "lr": 1.794570007889962e-07, "epoch": 9.656687518617813, "percentage": 96.57, "elapsed_time": "4:29:57", "remaining_time": "0:09:35", "throughput": 2308.9, "total_tokens": 37397704} {"current_steps": 64840, "total_steps": 67140, "loss": 0.5828, "lr": 1.7868055412054442e-07, "epoch": 9.657432231158772, "percentage": 96.57, "elapsed_time": "4:29:58", "remaining_time": "0:09:34", "throughput": 2308.91, "total_tokens": 37400424} {"current_steps": 64845, "total_steps": 67140, "loss": 0.4309, "lr": 1.7790578477594466e-07, "epoch": 9.658176943699733, "percentage": 96.58, "elapsed_time": "4:29:59", "remaining_time": "0:09:33", "throughput": 2308.97, "total_tokens": 37404648} {"current_steps": 64850, "total_steps": 67140, "loss": 0.5393, "lr": 1.771326928075523e-07, "epoch": 9.658921656240691, "percentage": 96.59, "elapsed_time": "4:30:00", "remaining_time": "0:09:32", "throughput": 2308.99, "total_tokens": 37407656} {"current_steps": 64855, "total_steps": 67140, "loss": 0.5174, "lr": 1.7636127826760884e-07, "epoch": 9.65966636878165, "percentage": 96.6, "elapsed_time": "4:30:01", "remaining_time": "0:09:30", "throughput": 2309.0, "total_tokens": 37410408} {"current_steps": 64860, "total_steps": 67140, "loss": 0.3296, "lr": 1.7559154120824483e-07, "epoch": 9.660411081322609, "percentage": 96.6, "elapsed_time": "4:30:03", "remaining_time": "0:09:29", "throughput": 2309.01, "total_tokens": 37413064} {"current_steps": 64865, "total_steps": 67140, "loss": 0.5769, "lr": 1.7482348168147978e-07, "epoch": 9.66115579386357, "percentage": 96.61, "elapsed_time": "4:30:04", "remaining_time": "0:09:28", "throughput": 2309.03, "total_tokens": 37416040} {"current_steps": 64870, "total_steps": 67140, "loss": 0.5517, "lr": 1.7405709973920824e-07, "epoch": 9.661900506404528, "percentage": 96.62, "elapsed_time": "4:30:05", "remaining_time": "0:09:27", "throughput": 2309.05, "total_tokens": 37419176} {"current_steps": 64875, "total_steps": 67140, "loss": 0.4678, "lr": 1.7329239543322494e-07, "epoch": 9.662645218945487, "percentage": 96.63, "elapsed_time": "4:30:06", "remaining_time": "0:09:25", "throughput": 2309.07, "total_tokens": 37421992} {"current_steps": 64880, "total_steps": 67140, "loss": 0.6845, "lr": 1.7252936881520244e-07, "epoch": 9.663389931486446, "percentage": 96.63, "elapsed_time": "4:30:07", "remaining_time": "0:09:24", "throughput": 2309.1, "total_tokens": 37425128} {"current_steps": 64885, "total_steps": 67140, "loss": 0.5467, "lr": 1.7176801993670499e-07, "epoch": 9.664134644027406, "percentage": 96.64, "elapsed_time": "4:30:08", "remaining_time": "0:09:23", "throughput": 2309.11, "total_tokens": 37427976} {"current_steps": 64890, "total_steps": 67140, "loss": 0.676, "lr": 1.7100834884918037e-07, "epoch": 9.664879356568365, "percentage": 96.65, "elapsed_time": "4:30:09", "remaining_time": "0:09:22", "throughput": 2309.13, "total_tokens": 37430952} {"current_steps": 64895, "total_steps": 67140, "loss": 0.6928, "lr": 1.7025035560396252e-07, "epoch": 9.665624069109324, "percentage": 96.66, "elapsed_time": "4:30:11", "remaining_time": "0:09:20", "throughput": 2309.14, "total_tokens": 37433576} {"current_steps": 64900, "total_steps": 67140, "loss": 0.5414, "lr": 1.6949404025227435e-07, "epoch": 9.666368781650283, "percentage": 96.66, "elapsed_time": "4:30:12", "remaining_time": "0:09:19", "throughput": 2309.17, "total_tokens": 37436904} {"current_steps": 64905, "total_steps": 67140, "loss": 0.4824, "lr": 1.6873940284523048e-07, "epoch": 9.667113494191241, "percentage": 96.67, "elapsed_time": "4:30:13", "remaining_time": "0:09:18", "throughput": 2309.19, "total_tokens": 37439880} {"current_steps": 64910, "total_steps": 67140, "loss": 0.658, "lr": 1.6798644343381798e-07, "epoch": 9.667858206732202, "percentage": 96.68, "elapsed_time": "4:30:14", "remaining_time": "0:09:17", "throughput": 2309.21, "total_tokens": 37442760} {"current_steps": 64915, "total_steps": 67140, "loss": 0.5023, "lr": 1.672351620689211e-07, "epoch": 9.66860291927316, "percentage": 96.69, "elapsed_time": "4:30:15", "remaining_time": "0:09:15", "throughput": 2309.23, "total_tokens": 37445736} {"current_steps": 64920, "total_steps": 67140, "loss": 0.5163, "lr": 1.6648555880131033e-07, "epoch": 9.66934763181412, "percentage": 96.69, "elapsed_time": "4:30:16", "remaining_time": "0:09:14", "throughput": 2309.25, "total_tokens": 37448904} {"current_steps": 64925, "total_steps": 67140, "loss": 0.6329, "lr": 1.6573763368163964e-07, "epoch": 9.670092344355078, "percentage": 96.7, "elapsed_time": "4:30:18", "remaining_time": "0:09:13", "throughput": 2309.27, "total_tokens": 37451752} {"current_steps": 64930, "total_steps": 67140, "loss": 0.3721, "lr": 1.6499138676045188e-07, "epoch": 9.670837056896039, "percentage": 96.71, "elapsed_time": "4:30:19", "remaining_time": "0:09:12", "throughput": 2309.29, "total_tokens": 37454728} {"current_steps": 64935, "total_steps": 67140, "loss": 0.6193, "lr": 1.6424681808817343e-07, "epoch": 9.671581769436997, "percentage": 96.72, "elapsed_time": "4:30:20", "remaining_time": "0:09:10", "throughput": 2309.3, "total_tokens": 37457416} {"current_steps": 64940, "total_steps": 67140, "loss": 0.4722, "lr": 1.6350392771512234e-07, "epoch": 9.672326481977956, "percentage": 96.72, "elapsed_time": "4:30:21", "remaining_time": "0:09:09", "throughput": 2309.32, "total_tokens": 37460424} {"current_steps": 64945, "total_steps": 67140, "loss": 0.4787, "lr": 1.6276271569149738e-07, "epoch": 9.673071194518915, "percentage": 96.73, "elapsed_time": "4:30:22", "remaining_time": "0:09:08", "throughput": 2309.34, "total_tokens": 37463560} {"current_steps": 64950, "total_steps": 67140, "loss": 0.6606, "lr": 1.6202318206738342e-07, "epoch": 9.673815907059875, "percentage": 96.74, "elapsed_time": "4:30:23", "remaining_time": "0:09:07", "throughput": 2309.36, "total_tokens": 37466376} {"current_steps": 64955, "total_steps": 67140, "loss": 0.7093, "lr": 1.6128532689276277e-07, "epoch": 9.674560619600834, "percentage": 96.75, "elapsed_time": "4:30:24", "remaining_time": "0:09:05", "throughput": 2309.37, "total_tokens": 37469256} {"current_steps": 64960, "total_steps": 67140, "loss": 0.6794, "lr": 1.6054915021748996e-07, "epoch": 9.675305332141793, "percentage": 96.75, "elapsed_time": "4:30:26", "remaining_time": "0:09:04", "throughput": 2309.39, "total_tokens": 37472264} {"current_steps": 64965, "total_steps": 67140, "loss": 0.692, "lr": 1.5981465209131686e-07, "epoch": 9.676050044682752, "percentage": 96.76, "elapsed_time": "4:30:27", "remaining_time": "0:09:03", "throughput": 2309.41, "total_tokens": 37475272} {"current_steps": 64970, "total_steps": 67140, "loss": 0.6427, "lr": 1.5908183256387877e-07, "epoch": 9.676794757223712, "percentage": 96.77, "elapsed_time": "4:30:28", "remaining_time": "0:09:02", "throughput": 2309.43, "total_tokens": 37478024} {"current_steps": 64975, "total_steps": 67140, "loss": 0.5052, "lr": 1.583506916846944e-07, "epoch": 9.677539469764671, "percentage": 96.78, "elapsed_time": "4:30:29", "remaining_time": "0:09:00", "throughput": 2309.44, "total_tokens": 37480808} {"current_steps": 64980, "total_steps": 67140, "loss": 0.5647, "lr": 1.5762122950316871e-07, "epoch": 9.67828418230563, "percentage": 96.78, "elapsed_time": "4:30:30", "remaining_time": "0:08:59", "throughput": 2309.45, "total_tokens": 37483624} {"current_steps": 64985, "total_steps": 67140, "loss": 0.6449, "lr": 1.5689344606860112e-07, "epoch": 9.679028894846589, "percentage": 96.79, "elapsed_time": "4:30:31", "remaining_time": "0:08:58", "throughput": 2309.48, "total_tokens": 37486696} {"current_steps": 64990, "total_steps": 67140, "loss": 0.6747, "lr": 1.5616734143016898e-07, "epoch": 9.679773607387549, "percentage": 96.8, "elapsed_time": "4:30:32", "remaining_time": "0:08:57", "throughput": 2309.48, "total_tokens": 37489384} {"current_steps": 64995, "total_steps": 67140, "loss": 0.5152, "lr": 1.5544291563693858e-07, "epoch": 9.680518319928508, "percentage": 96.81, "elapsed_time": "4:30:33", "remaining_time": "0:08:55", "throughput": 2309.49, "total_tokens": 37492104} {"current_steps": 65000, "total_steps": 67140, "loss": 0.5336, "lr": 1.5472016873786798e-07, "epoch": 9.681263032469467, "percentage": 96.81, "elapsed_time": "4:30:35", "remaining_time": "0:08:54", "throughput": 2309.52, "total_tokens": 37495336} {"current_steps": 65005, "total_steps": 67140, "loss": 0.5841, "lr": 1.5399910078179314e-07, "epoch": 9.682007745010425, "percentage": 96.82, "elapsed_time": "4:30:36", "remaining_time": "0:08:53", "throughput": 2309.54, "total_tokens": 37498120} {"current_steps": 65010, "total_steps": 67140, "loss": 0.5389, "lr": 1.532797118174417e-07, "epoch": 9.682752457551386, "percentage": 96.83, "elapsed_time": "4:30:37", "remaining_time": "0:08:52", "throughput": 2309.55, "total_tokens": 37500936} {"current_steps": 65015, "total_steps": 67140, "loss": 0.4969, "lr": 1.5256200189343038e-07, "epoch": 9.683497170092345, "percentage": 96.83, "elapsed_time": "4:30:38", "remaining_time": "0:08:50", "throughput": 2309.55, "total_tokens": 37503464} {"current_steps": 65020, "total_steps": 67140, "loss": 0.5795, "lr": 1.518459710582565e-07, "epoch": 9.684241882633303, "percentage": 96.84, "elapsed_time": "4:30:39", "remaining_time": "0:08:49", "throughput": 2309.57, "total_tokens": 37506312} {"current_steps": 65025, "total_steps": 67140, "loss": 0.5774, "lr": 1.511316193603063e-07, "epoch": 9.684986595174262, "percentage": 96.85, "elapsed_time": "4:30:40", "remaining_time": "0:08:48", "throughput": 2309.58, "total_tokens": 37509128} {"current_steps": 65030, "total_steps": 67140, "loss": 0.5755, "lr": 1.504189468478523e-07, "epoch": 9.685731307715223, "percentage": 96.86, "elapsed_time": "4:30:41", "remaining_time": "0:08:46", "throughput": 2309.6, "total_tokens": 37511976} {"current_steps": 65035, "total_steps": 67140, "loss": 0.4497, "lr": 1.497079535690532e-07, "epoch": 9.686476020256181, "percentage": 96.86, "elapsed_time": "4:30:42", "remaining_time": "0:08:45", "throughput": 2309.62, "total_tokens": 37514952} {"current_steps": 65040, "total_steps": 67140, "loss": 0.3607, "lr": 1.4899863957195948e-07, "epoch": 9.68722073279714, "percentage": 96.87, "elapsed_time": "4:30:44", "remaining_time": "0:08:44", "throughput": 2309.63, "total_tokens": 37517704} {"current_steps": 65045, "total_steps": 67140, "loss": 0.5758, "lr": 1.4829100490449942e-07, "epoch": 9.687965445338099, "percentage": 96.88, "elapsed_time": "4:30:45", "remaining_time": "0:08:43", "throughput": 2309.64, "total_tokens": 37520488} {"current_steps": 65050, "total_steps": 67140, "loss": 0.4932, "lr": 1.4758504961449315e-07, "epoch": 9.688710157879058, "percentage": 96.89, "elapsed_time": "4:30:46", "remaining_time": "0:08:41", "throughput": 2309.67, "total_tokens": 37523624} {"current_steps": 65055, "total_steps": 67140, "loss": 0.6046, "lr": 1.468807737496497e-07, "epoch": 9.689454870420018, "percentage": 96.89, "elapsed_time": "4:30:47", "remaining_time": "0:08:40", "throughput": 2309.68, "total_tokens": 37526344} {"current_steps": 65060, "total_steps": 67140, "loss": 0.5608, "lr": 1.4617817735755323e-07, "epoch": 9.690199582960977, "percentage": 96.9, "elapsed_time": "4:30:48", "remaining_time": "0:08:39", "throughput": 2309.69, "total_tokens": 37529032} {"current_steps": 65065, "total_steps": 67140, "loss": 0.5105, "lr": 1.4547726048569077e-07, "epoch": 9.690944295501936, "percentage": 96.91, "elapsed_time": "4:30:49", "remaining_time": "0:08:38", "throughput": 2309.71, "total_tokens": 37531976} {"current_steps": 65070, "total_steps": 67140, "loss": 0.7003, "lr": 1.447780231814244e-07, "epoch": 9.691689008042896, "percentage": 96.92, "elapsed_time": "4:30:50", "remaining_time": "0:08:36", "throughput": 2309.73, "total_tokens": 37535016} {"current_steps": 65075, "total_steps": 67140, "loss": 0.6672, "lr": 1.4408046549200528e-07, "epoch": 9.692433720583855, "percentage": 96.92, "elapsed_time": "4:30:51", "remaining_time": "0:08:35", "throughput": 2309.74, "total_tokens": 37537800} {"current_steps": 65080, "total_steps": 67140, "loss": 0.3572, "lr": 1.4338458746457062e-07, "epoch": 9.693178433124814, "percentage": 96.93, "elapsed_time": "4:30:53", "remaining_time": "0:08:34", "throughput": 2309.78, "total_tokens": 37541192} {"current_steps": 65085, "total_steps": 67140, "loss": 0.4754, "lr": 1.4269038914614397e-07, "epoch": 9.693923145665773, "percentage": 96.94, "elapsed_time": "4:30:54", "remaining_time": "0:08:33", "throughput": 2309.79, "total_tokens": 37543976} {"current_steps": 65090, "total_steps": 67140, "loss": 0.4569, "lr": 1.4199787058364056e-07, "epoch": 9.694667858206731, "percentage": 96.95, "elapsed_time": "4:30:55", "remaining_time": "0:08:31", "throughput": 2309.81, "total_tokens": 37547080} {"current_steps": 65095, "total_steps": 67140, "loss": 0.4788, "lr": 1.413070318238535e-07, "epoch": 9.695412570747692, "percentage": 96.95, "elapsed_time": "4:30:56", "remaining_time": "0:08:30", "throughput": 2309.83, "total_tokens": 37550120} {"current_steps": 65100, "total_steps": 67140, "loss": 0.5622, "lr": 1.4061787291347051e-07, "epoch": 9.69615728328865, "percentage": 96.96, "elapsed_time": "4:30:57", "remaining_time": "0:08:29", "throughput": 2309.85, "total_tokens": 37553032} {"current_steps": 65105, "total_steps": 67140, "loss": 0.5059, "lr": 1.399303938990626e-07, "epoch": 9.69690199582961, "percentage": 96.97, "elapsed_time": "4:30:58", "remaining_time": "0:08:28", "throughput": 2309.88, "total_tokens": 37556232} {"current_steps": 65110, "total_steps": 67140, "loss": 0.7961, "lr": 1.392445948270843e-07, "epoch": 9.697646708370568, "percentage": 96.98, "elapsed_time": "4:31:00", "remaining_time": "0:08:26", "throughput": 2309.9, "total_tokens": 37559144} {"current_steps": 65115, "total_steps": 67140, "loss": 0.4049, "lr": 1.385604757438791e-07, "epoch": 9.698391420911529, "percentage": 96.98, "elapsed_time": "4:31:01", "remaining_time": "0:08:25", "throughput": 2309.91, "total_tokens": 37561992} {"current_steps": 65120, "total_steps": 67140, "loss": 0.6254, "lr": 1.3787803669567667e-07, "epoch": 9.699136133452487, "percentage": 96.99, "elapsed_time": "4:31:02", "remaining_time": "0:08:24", "throughput": 2309.92, "total_tokens": 37564616} {"current_steps": 65125, "total_steps": 67140, "loss": 0.6991, "lr": 1.371972777285957e-07, "epoch": 9.699880845993446, "percentage": 97.0, "elapsed_time": "4:31:03", "remaining_time": "0:08:23", "throughput": 2309.95, "total_tokens": 37567816} {"current_steps": 65130, "total_steps": 67140, "loss": 0.5241, "lr": 1.3651819888863548e-07, "epoch": 9.700625558534405, "percentage": 97.01, "elapsed_time": "4:31:04", "remaining_time": "0:08:21", "throughput": 2309.96, "total_tokens": 37570696} {"current_steps": 65135, "total_steps": 67140, "loss": 0.554, "lr": 1.3584080022169266e-07, "epoch": 9.701370271075366, "percentage": 97.01, "elapsed_time": "4:31:05", "remaining_time": "0:08:20", "throughput": 2310.0, "total_tokens": 37574024} {"current_steps": 65140, "total_steps": 67140, "loss": 0.4765, "lr": 1.3516508177353337e-07, "epoch": 9.702114983616324, "percentage": 97.02, "elapsed_time": "4:31:06", "remaining_time": "0:08:19", "throughput": 2310.01, "total_tokens": 37576904} {"current_steps": 65145, "total_steps": 67140, "loss": 0.5119, "lr": 1.3449104358982944e-07, "epoch": 9.702859696157283, "percentage": 97.03, "elapsed_time": "4:31:08", "remaining_time": "0:08:18", "throughput": 2310.03, "total_tokens": 37579720} {"current_steps": 65150, "total_steps": 67140, "loss": 0.5765, "lr": 1.3381868571612222e-07, "epoch": 9.703604408698242, "percentage": 97.04, "elapsed_time": "4:31:09", "remaining_time": "0:08:16", "throughput": 2310.03, "total_tokens": 37582280} {"current_steps": 65155, "total_steps": 67140, "loss": 0.6146, "lr": 1.3314800819785035e-07, "epoch": 9.704349121239202, "percentage": 97.04, "elapsed_time": "4:31:10", "remaining_time": "0:08:15", "throughput": 2310.03, "total_tokens": 37584808} {"current_steps": 65160, "total_steps": 67140, "loss": 0.4891, "lr": 1.3247901108033313e-07, "epoch": 9.705093833780161, "percentage": 97.05, "elapsed_time": "4:31:11", "remaining_time": "0:08:14", "throughput": 2310.06, "total_tokens": 37587848} {"current_steps": 65165, "total_steps": 67140, "loss": 0.456, "lr": 1.318116944087816e-07, "epoch": 9.70583854632112, "percentage": 97.06, "elapsed_time": "4:31:12", "remaining_time": "0:08:13", "throughput": 2310.08, "total_tokens": 37590888} {"current_steps": 65170, "total_steps": 67140, "loss": 0.439, "lr": 1.3114605822829028e-07, "epoch": 9.706583258862079, "percentage": 97.07, "elapsed_time": "4:31:13", "remaining_time": "0:08:11", "throughput": 2310.08, "total_tokens": 37593416} {"current_steps": 65175, "total_steps": 67140, "loss": 0.57, "lr": 1.304821025838371e-07, "epoch": 9.70732797140304, "percentage": 97.07, "elapsed_time": "4:31:14", "remaining_time": "0:08:10", "throughput": 2310.1, "total_tokens": 37596552} {"current_steps": 65180, "total_steps": 67140, "loss": 0.5763, "lr": 1.2981982752029164e-07, "epoch": 9.708072683943998, "percentage": 97.08, "elapsed_time": "4:31:15", "remaining_time": "0:08:09", "throughput": 2310.12, "total_tokens": 37599464} {"current_steps": 65185, "total_steps": 67140, "loss": 0.5279, "lr": 1.2915923308240984e-07, "epoch": 9.708817396484957, "percentage": 97.09, "elapsed_time": "4:31:17", "remaining_time": "0:08:08", "throughput": 2310.13, "total_tokens": 37602248} {"current_steps": 65190, "total_steps": 67140, "loss": 0.6054, "lr": 1.2850031931482543e-07, "epoch": 9.709562109025915, "percentage": 97.1, "elapsed_time": "4:31:18", "remaining_time": "0:08:06", "throughput": 2310.15, "total_tokens": 37605288} {"current_steps": 65195, "total_steps": 67140, "loss": 0.4207, "lr": 1.278430862620722e-07, "epoch": 9.710306821566876, "percentage": 97.1, "elapsed_time": "4:31:19", "remaining_time": "0:08:05", "throughput": 2310.16, "total_tokens": 37607976} {"current_steps": 65200, "total_steps": 67140, "loss": 0.7239, "lr": 1.2718753396855908e-07, "epoch": 9.711051534107835, "percentage": 97.11, "elapsed_time": "4:31:20", "remaining_time": "0:08:04", "throughput": 2310.18, "total_tokens": 37610888} {"current_steps": 65205, "total_steps": 67140, "loss": 0.5086, "lr": 1.2653366247858955e-07, "epoch": 9.711796246648793, "percentage": 97.12, "elapsed_time": "4:31:21", "remaining_time": "0:08:03", "throughput": 2310.19, "total_tokens": 37613704} {"current_steps": 65210, "total_steps": 67140, "loss": 0.5984, "lr": 1.258814718363449e-07, "epoch": 9.712540959189752, "percentage": 97.13, "elapsed_time": "4:31:22", "remaining_time": "0:08:01", "throughput": 2310.2, "total_tokens": 37616520} {"current_steps": 65215, "total_steps": 67140, "loss": 0.6378, "lr": 1.2523096208589823e-07, "epoch": 9.713285671730713, "percentage": 97.13, "elapsed_time": "4:31:23", "remaining_time": "0:08:00", "throughput": 2310.22, "total_tokens": 37619432} {"current_steps": 65220, "total_steps": 67140, "loss": 0.7606, "lr": 1.245821332712116e-07, "epoch": 9.714030384271672, "percentage": 97.14, "elapsed_time": "4:31:25", "remaining_time": "0:07:59", "throughput": 2310.24, "total_tokens": 37622344} {"current_steps": 65225, "total_steps": 67140, "loss": 0.5424, "lr": 1.2393498543612769e-07, "epoch": 9.71477509681263, "percentage": 97.15, "elapsed_time": "4:31:26", "remaining_time": "0:07:58", "throughput": 2310.25, "total_tokens": 37625000} {"current_steps": 65230, "total_steps": 67140, "loss": 0.509, "lr": 1.232895186243782e-07, "epoch": 9.715519809353589, "percentage": 97.16, "elapsed_time": "4:31:27", "remaining_time": "0:07:56", "throughput": 2310.27, "total_tokens": 37627944} {"current_steps": 65235, "total_steps": 67140, "loss": 0.655, "lr": 1.2264573287958382e-07, "epoch": 9.716264521894548, "percentage": 97.16, "elapsed_time": "4:31:28", "remaining_time": "0:07:55", "throughput": 2310.28, "total_tokens": 37630696} {"current_steps": 65240, "total_steps": 67140, "loss": 0.6052, "lr": 1.220036282452458e-07, "epoch": 9.717009234435508, "percentage": 97.17, "elapsed_time": "4:31:29", "remaining_time": "0:07:54", "throughput": 2310.3, "total_tokens": 37633608} {"current_steps": 65245, "total_steps": 67140, "loss": 0.4327, "lr": 1.213632047647545e-07, "epoch": 9.717753946976467, "percentage": 97.18, "elapsed_time": "4:31:30", "remaining_time": "0:07:53", "throughput": 2310.31, "total_tokens": 37636488} {"current_steps": 65250, "total_steps": 67140, "loss": 0.4562, "lr": 1.2072446248138912e-07, "epoch": 9.718498659517426, "percentage": 97.18, "elapsed_time": "4:31:31", "remaining_time": "0:07:51", "throughput": 2310.33, "total_tokens": 37639560} {"current_steps": 65255, "total_steps": 67140, "loss": 0.6713, "lr": 1.200874014383152e-07, "epoch": 9.719243372058386, "percentage": 97.19, "elapsed_time": "4:31:32", "remaining_time": "0:07:50", "throughput": 2310.35, "total_tokens": 37642568} {"current_steps": 65260, "total_steps": 67140, "loss": 0.4902, "lr": 1.1945202167857882e-07, "epoch": 9.719988084599345, "percentage": 97.2, "elapsed_time": "4:31:34", "remaining_time": "0:07:49", "throughput": 2310.37, "total_tokens": 37645576} {"current_steps": 65265, "total_steps": 67140, "loss": 0.519, "lr": 1.188183232451151e-07, "epoch": 9.720732797140304, "percentage": 97.21, "elapsed_time": "4:31:35", "remaining_time": "0:07:48", "throughput": 2310.39, "total_tokens": 37648488} {"current_steps": 65270, "total_steps": 67140, "loss": 0.6285, "lr": 1.1818630618075366e-07, "epoch": 9.721477509681263, "percentage": 97.21, "elapsed_time": "4:31:36", "remaining_time": "0:07:46", "throughput": 2310.41, "total_tokens": 37651464} {"current_steps": 65275, "total_steps": 67140, "loss": 0.6441, "lr": 1.1755597052819922e-07, "epoch": 9.722222222222221, "percentage": 97.22, "elapsed_time": "4:31:37", "remaining_time": "0:07:45", "throughput": 2310.42, "total_tokens": 37654280} {"current_steps": 65280, "total_steps": 67140, "loss": 0.4966, "lr": 1.169273163300455e-07, "epoch": 9.722966934763182, "percentage": 97.23, "elapsed_time": "4:31:38", "remaining_time": "0:07:44", "throughput": 2310.42, "total_tokens": 37656840} {"current_steps": 65285, "total_steps": 67140, "loss": 0.5075, "lr": 1.1630034362877796e-07, "epoch": 9.72371164730414, "percentage": 97.24, "elapsed_time": "4:31:39", "remaining_time": "0:07:43", "throughput": 2310.44, "total_tokens": 37659752} {"current_steps": 65290, "total_steps": 67140, "loss": 0.6065, "lr": 1.1567505246676269e-07, "epoch": 9.7244563598451, "percentage": 97.24, "elapsed_time": "4:31:40", "remaining_time": "0:07:41", "throughput": 2310.47, "total_tokens": 37662888} {"current_steps": 65295, "total_steps": 67140, "loss": 0.511, "lr": 1.150514428862548e-07, "epoch": 9.725201072386058, "percentage": 97.25, "elapsed_time": "4:31:42", "remaining_time": "0:07:40", "throughput": 2310.49, "total_tokens": 37665896} {"current_steps": 65300, "total_steps": 67140, "loss": 0.6261, "lr": 1.1442951492939835e-07, "epoch": 9.725945784927019, "percentage": 97.26, "elapsed_time": "4:31:43", "remaining_time": "0:07:39", "throughput": 2310.51, "total_tokens": 37668904} {"current_steps": 65305, "total_steps": 67140, "loss": 0.5404, "lr": 1.1380926863821528e-07, "epoch": 9.726690497467978, "percentage": 97.27, "elapsed_time": "4:31:44", "remaining_time": "0:07:38", "throughput": 2310.51, "total_tokens": 37671592} {"current_steps": 65310, "total_steps": 67140, "loss": 0.8849, "lr": 1.1319070405462207e-07, "epoch": 9.727435210008936, "percentage": 97.27, "elapsed_time": "4:31:45", "remaining_time": "0:07:36", "throughput": 2310.54, "total_tokens": 37674824} {"current_steps": 65315, "total_steps": 67140, "loss": 0.7818, "lr": 1.1257382122041859e-07, "epoch": 9.728179922549895, "percentage": 97.28, "elapsed_time": "4:31:46", "remaining_time": "0:07:35", "throughput": 2310.56, "total_tokens": 37677640} {"current_steps": 65320, "total_steps": 67140, "loss": 0.4933, "lr": 1.1195862017729097e-07, "epoch": 9.728924635090856, "percentage": 97.29, "elapsed_time": "4:31:47", "remaining_time": "0:07:34", "throughput": 2310.57, "total_tokens": 37680520} {"current_steps": 65325, "total_steps": 67140, "loss": 0.4365, "lr": 1.1134510096681427e-07, "epoch": 9.729669347631814, "percentage": 97.3, "elapsed_time": "4:31:48", "remaining_time": "0:07:33", "throughput": 2310.59, "total_tokens": 37683368} {"current_steps": 65330, "total_steps": 67140, "loss": 0.52, "lr": 1.1073326363044423e-07, "epoch": 9.730414060172773, "percentage": 97.3, "elapsed_time": "4:31:50", "remaining_time": "0:07:31", "throughput": 2310.6, "total_tokens": 37686056} {"current_steps": 65335, "total_steps": 67140, "loss": 0.7101, "lr": 1.1012310820952831e-07, "epoch": 9.731158772713732, "percentage": 97.31, "elapsed_time": "4:31:51", "remaining_time": "0:07:30", "throughput": 2310.61, "total_tokens": 37688936} {"current_steps": 65340, "total_steps": 67140, "loss": 0.5534, "lr": 1.0951463474529744e-07, "epoch": 9.731903485254692, "percentage": 97.32, "elapsed_time": "4:31:52", "remaining_time": "0:07:29", "throughput": 2310.62, "total_tokens": 37691720} {"current_steps": 65345, "total_steps": 67140, "loss": 0.5766, "lr": 1.0890784327887149e-07, "epoch": 9.732648197795651, "percentage": 97.33, "elapsed_time": "4:31:53", "remaining_time": "0:07:28", "throughput": 2310.63, "total_tokens": 37694376} {"current_steps": 65350, "total_steps": 67140, "loss": 0.7535, "lr": 1.0830273385125378e-07, "epoch": 9.73339291033661, "percentage": 97.33, "elapsed_time": "4:31:54", "remaining_time": "0:07:26", "throughput": 2310.66, "total_tokens": 37697480} {"current_steps": 65355, "total_steps": 67140, "loss": 0.7571, "lr": 1.0769930650333382e-07, "epoch": 9.734137622877569, "percentage": 97.34, "elapsed_time": "4:31:55", "remaining_time": "0:07:25", "throughput": 2310.67, "total_tokens": 37700360} {"current_steps": 65360, "total_steps": 67140, "loss": 0.6205, "lr": 1.070975612758901e-07, "epoch": 9.73488233541853, "percentage": 97.35, "elapsed_time": "4:31:56", "remaining_time": "0:07:24", "throughput": 2310.67, "total_tokens": 37702888} {"current_steps": 65365, "total_steps": 67140, "loss": 0.5276, "lr": 1.0649749820958732e-07, "epoch": 9.735627047959488, "percentage": 97.36, "elapsed_time": "4:31:57", "remaining_time": "0:07:23", "throughput": 2310.68, "total_tokens": 37705512} {"current_steps": 65370, "total_steps": 67140, "loss": 0.4639, "lr": 1.058991173449736e-07, "epoch": 9.736371760500447, "percentage": 97.36, "elapsed_time": "4:31:59", "remaining_time": "0:07:21", "throughput": 2310.68, "total_tokens": 37708136} {"current_steps": 65375, "total_steps": 67140, "loss": 0.6132, "lr": 1.0530241872248326e-07, "epoch": 9.737116473041405, "percentage": 97.37, "elapsed_time": "4:32:00", "remaining_time": "0:07:20", "throughput": 2310.7, "total_tokens": 37710984} {"current_steps": 65380, "total_steps": 67140, "loss": 0.5358, "lr": 1.0470740238244237e-07, "epoch": 9.737861185582366, "percentage": 97.38, "elapsed_time": "4:32:01", "remaining_time": "0:07:19", "throughput": 2310.72, "total_tokens": 37714024} {"current_steps": 65385, "total_steps": 67140, "loss": 0.6323, "lr": 1.0411406836505766e-07, "epoch": 9.738605898123325, "percentage": 97.39, "elapsed_time": "4:32:02", "remaining_time": "0:07:18", "throughput": 2310.73, "total_tokens": 37716840} {"current_steps": 65390, "total_steps": 67140, "loss": 0.5748, "lr": 1.0352241671042762e-07, "epoch": 9.739350610664284, "percentage": 97.39, "elapsed_time": "4:32:03", "remaining_time": "0:07:16", "throughput": 2310.75, "total_tokens": 37719688} {"current_steps": 65395, "total_steps": 67140, "loss": 0.6633, "lr": 1.0293244745852859e-07, "epoch": 9.740095323205242, "percentage": 97.4, "elapsed_time": "4:32:04", "remaining_time": "0:07:15", "throughput": 2310.75, "total_tokens": 37722248} {"current_steps": 65400, "total_steps": 67140, "loss": 0.6711, "lr": 1.0234416064923146e-07, "epoch": 9.740840035746203, "percentage": 97.41, "elapsed_time": "4:32:05", "remaining_time": "0:07:14", "throughput": 2310.76, "total_tokens": 37724840} {"current_steps": 65405, "total_steps": 67140, "loss": 0.4913, "lr": 1.0175755632228779e-07, "epoch": 9.741584748287162, "percentage": 97.42, "elapsed_time": "4:32:06", "remaining_time": "0:07:13", "throughput": 2310.77, "total_tokens": 37727528} {"current_steps": 65410, "total_steps": 67140, "loss": 0.6797, "lr": 1.0117263451734083e-07, "epoch": 9.74232946082812, "percentage": 97.42, "elapsed_time": "4:32:07", "remaining_time": "0:07:11", "throughput": 2310.78, "total_tokens": 37730440} {"current_steps": 65415, "total_steps": 67140, "loss": 0.4555, "lr": 1.005893952739173e-07, "epoch": 9.743074173369079, "percentage": 97.43, "elapsed_time": "4:32:09", "remaining_time": "0:07:10", "throughput": 2310.8, "total_tokens": 37733320} {"current_steps": 65420, "total_steps": 67140, "loss": 0.4927, "lr": 1.0000783863142738e-07, "epoch": 9.743818885910038, "percentage": 97.44, "elapsed_time": "4:32:10", "remaining_time": "0:07:09", "throughput": 2310.83, "total_tokens": 37736456} {"current_steps": 65425, "total_steps": 67140, "loss": 0.6304, "lr": 9.942796462917014e-08, "epoch": 9.744563598450998, "percentage": 97.45, "elapsed_time": "4:32:11", "remaining_time": "0:07:08", "throughput": 2310.84, "total_tokens": 37739304} {"current_steps": 65430, "total_steps": 67140, "loss": 0.4897, "lr": 9.884977330633649e-08, "epoch": 9.745308310991957, "percentage": 97.45, "elapsed_time": "4:32:12", "remaining_time": "0:07:06", "throughput": 2310.85, "total_tokens": 37742024} {"current_steps": 65435, "total_steps": 67140, "loss": 0.7139, "lr": 9.827326470199239e-08, "epoch": 9.746053023532916, "percentage": 97.46, "elapsed_time": "4:32:13", "remaining_time": "0:07:05", "throughput": 2310.87, "total_tokens": 37745000} {"current_steps": 65440, "total_steps": 67140, "loss": 0.4703, "lr": 9.769843885509834e-08, "epoch": 9.746797736073875, "percentage": 97.47, "elapsed_time": "4:32:14", "remaining_time": "0:07:04", "throughput": 2310.88, "total_tokens": 37747848} {"current_steps": 65445, "total_steps": 67140, "loss": 0.5776, "lr": 9.712529580449825e-08, "epoch": 9.747542448614835, "percentage": 97.48, "elapsed_time": "4:32:15", "remaining_time": "0:07:03", "throughput": 2310.91, "total_tokens": 37751016} {"current_steps": 65450, "total_steps": 67140, "loss": 0.6234, "lr": 9.655383558892228e-08, "epoch": 9.748287161155794, "percentage": 97.48, "elapsed_time": "4:32:17", "remaining_time": "0:07:01", "throughput": 2310.93, "total_tokens": 37753896} {"current_steps": 65455, "total_steps": 67140, "loss": 0.5001, "lr": 9.598405824698953e-08, "epoch": 9.749031873696753, "percentage": 97.49, "elapsed_time": "4:32:18", "remaining_time": "0:07:00", "throughput": 2310.95, "total_tokens": 37756968} {"current_steps": 65460, "total_steps": 67140, "loss": 0.7189, "lr": 9.541596381719976e-08, "epoch": 9.749776586237711, "percentage": 97.5, "elapsed_time": "4:32:19", "remaining_time": "0:06:59", "throughput": 2310.97, "total_tokens": 37759880} {"current_steps": 65465, "total_steps": 67140, "loss": 0.3855, "lr": 9.484955233794723e-08, "epoch": 9.750521298778672, "percentage": 97.51, "elapsed_time": "4:32:20", "remaining_time": "0:06:58", "throughput": 2310.99, "total_tokens": 37762888} {"current_steps": 65470, "total_steps": 67140, "loss": 0.4854, "lr": 9.428482384750136e-08, "epoch": 9.75126601131963, "percentage": 97.51, "elapsed_time": "4:32:21", "remaining_time": "0:06:56", "throughput": 2310.99, "total_tokens": 37765544} {"current_steps": 65475, "total_steps": 67140, "loss": 0.685, "lr": 9.372177838403162e-08, "epoch": 9.75201072386059, "percentage": 97.52, "elapsed_time": "4:32:22", "remaining_time": "0:06:55", "throughput": 2311.01, "total_tokens": 37768520} {"current_steps": 65480, "total_steps": 67140, "loss": 0.5597, "lr": 9.316041598557979e-08, "epoch": 9.752755436401548, "percentage": 97.53, "elapsed_time": "4:32:23", "remaining_time": "0:06:54", "throughput": 2311.02, "total_tokens": 37771144} {"current_steps": 65485, "total_steps": 67140, "loss": 0.6972, "lr": 9.260073669008496e-08, "epoch": 9.753500148942509, "percentage": 97.54, "elapsed_time": "4:32:25", "remaining_time": "0:06:53", "throughput": 2311.03, "total_tokens": 37773928} {"current_steps": 65490, "total_steps": 67140, "loss": 0.5158, "lr": 9.20427405353641e-08, "epoch": 9.754244861483468, "percentage": 97.54, "elapsed_time": "4:32:26", "remaining_time": "0:06:51", "throughput": 2311.05, "total_tokens": 37776840} {"current_steps": 65495, "total_steps": 67140, "loss": 0.3668, "lr": 9.148642755912873e-08, "epoch": 9.754989574024426, "percentage": 97.55, "elapsed_time": "4:32:27", "remaining_time": "0:06:50", "throughput": 2311.07, "total_tokens": 37779784} {"current_steps": 65500, "total_steps": 67140, "loss": 0.5489, "lr": 9.093179779897099e-08, "epoch": 9.755734286565385, "percentage": 97.56, "elapsed_time": "4:32:28", "remaining_time": "0:06:49", "throughput": 2311.08, "total_tokens": 37782600} {"current_steps": 65505, "total_steps": 67140, "loss": 0.543, "lr": 9.037885129236645e-08, "epoch": 9.756478999106346, "percentage": 97.56, "elapsed_time": "4:32:29", "remaining_time": "0:06:48", "throughput": 2311.1, "total_tokens": 37785480} {"current_steps": 65510, "total_steps": 67140, "loss": 0.5628, "lr": 8.982758807668523e-08, "epoch": 9.757223711647304, "percentage": 97.57, "elapsed_time": "4:32:30", "remaining_time": "0:06:46", "throughput": 2311.12, "total_tokens": 37788456} {"current_steps": 65515, "total_steps": 67140, "loss": 0.5327, "lr": 8.927800818917809e-08, "epoch": 9.757968424188263, "percentage": 97.58, "elapsed_time": "4:32:31", "remaining_time": "0:06:45", "throughput": 2311.14, "total_tokens": 37791336} {"current_steps": 65520, "total_steps": 67140, "loss": 0.6102, "lr": 8.873011166698475e-08, "epoch": 9.758713136729222, "percentage": 97.59, "elapsed_time": "4:32:32", "remaining_time": "0:06:44", "throughput": 2311.16, "total_tokens": 37794344} {"current_steps": 65525, "total_steps": 67140, "loss": 0.5331, "lr": 8.818389854712561e-08, "epoch": 9.759457849270182, "percentage": 97.59, "elapsed_time": "4:32:34", "remaining_time": "0:06:43", "throughput": 2311.19, "total_tokens": 37797608} {"current_steps": 65530, "total_steps": 67140, "loss": 0.5679, "lr": 8.763936886651558e-08, "epoch": 9.760202561811141, "percentage": 97.6, "elapsed_time": "4:32:35", "remaining_time": "0:06:41", "throughput": 2311.2, "total_tokens": 37800296} {"current_steps": 65535, "total_steps": 67140, "loss": 0.5536, "lr": 8.709652266195301e-08, "epoch": 9.7609472743521, "percentage": 97.61, "elapsed_time": "4:32:36", "remaining_time": "0:06:40", "throughput": 2311.23, "total_tokens": 37803464} {"current_steps": 65540, "total_steps": 67140, "loss": 0.5046, "lr": 8.655535997011688e-08, "epoch": 9.761691986893059, "percentage": 97.62, "elapsed_time": "4:32:37", "remaining_time": "0:06:39", "throughput": 2311.25, "total_tokens": 37806632} {"current_steps": 65545, "total_steps": 67140, "loss": 0.4877, "lr": 8.601588082758073e-08, "epoch": 9.76243669943402, "percentage": 97.62, "elapsed_time": "4:32:38", "remaining_time": "0:06:38", "throughput": 2311.26, "total_tokens": 37809384} {"current_steps": 65550, "total_steps": 67140, "loss": 0.5278, "lr": 8.547808527079593e-08, "epoch": 9.763181411974978, "percentage": 97.63, "elapsed_time": "4:32:39", "remaining_time": "0:06:36", "throughput": 2311.28, "total_tokens": 37812168} {"current_steps": 65555, "total_steps": 67140, "loss": 0.4406, "lr": 8.494197333610843e-08, "epoch": 9.763926124515937, "percentage": 97.64, "elapsed_time": "4:32:40", "remaining_time": "0:06:35", "throughput": 2311.29, "total_tokens": 37814920} {"current_steps": 65560, "total_steps": 67140, "loss": 0.5451, "lr": 8.44075450597448e-08, "epoch": 9.764670837056896, "percentage": 97.65, "elapsed_time": "4:32:42", "remaining_time": "0:06:34", "throughput": 2311.29, "total_tokens": 37817480} {"current_steps": 65565, "total_steps": 67140, "loss": 0.6081, "lr": 8.38748004778206e-08, "epoch": 9.765415549597854, "percentage": 97.65, "elapsed_time": "4:32:43", "remaining_time": "0:06:33", "throughput": 2311.3, "total_tokens": 37820296} {"current_steps": 65570, "total_steps": 67140, "loss": 0.7329, "lr": 8.33437396263348e-08, "epoch": 9.766160262138815, "percentage": 97.66, "elapsed_time": "4:32:44", "remaining_time": "0:06:31", "throughput": 2311.32, "total_tokens": 37823144} {"current_steps": 65575, "total_steps": 67140, "loss": 0.5954, "lr": 8.281436254117536e-08, "epoch": 9.766904974679774, "percentage": 97.67, "elapsed_time": "4:32:45", "remaining_time": "0:06:30", "throughput": 2311.34, "total_tokens": 37826248} {"current_steps": 65580, "total_steps": 67140, "loss": 0.7887, "lr": 8.228666925811646e-08, "epoch": 9.767649687220732, "percentage": 97.68, "elapsed_time": "4:32:46", "remaining_time": "0:06:29", "throughput": 2311.36, "total_tokens": 37829128} {"current_steps": 65585, "total_steps": 67140, "loss": 0.6556, "lr": 8.176065981281567e-08, "epoch": 9.768394399761693, "percentage": 97.68, "elapsed_time": "4:32:47", "remaining_time": "0:06:28", "throughput": 2311.36, "total_tokens": 37831720} {"current_steps": 65590, "total_steps": 67140, "loss": 0.4897, "lr": 8.123633424081956e-08, "epoch": 9.769139112302652, "percentage": 97.69, "elapsed_time": "4:32:48", "remaining_time": "0:06:26", "throughput": 2311.38, "total_tokens": 37834664} {"current_steps": 65595, "total_steps": 67140, "loss": 0.574, "lr": 8.07136925775609e-08, "epoch": 9.76988382484361, "percentage": 97.7, "elapsed_time": "4:32:50", "remaining_time": "0:06:25", "throughput": 2311.41, "total_tokens": 37837832} {"current_steps": 65600, "total_steps": 67140, "loss": 0.5779, "lr": 8.01927348583531e-08, "epoch": 9.77062853738457, "percentage": 97.71, "elapsed_time": "4:32:51", "remaining_time": "0:06:24", "throughput": 2311.45, "total_tokens": 37841192} {"current_steps": 65605, "total_steps": 67140, "loss": 0.5631, "lr": 7.96734611184069e-08, "epoch": 9.771373249925528, "percentage": 97.71, "elapsed_time": "4:32:52", "remaining_time": "0:06:23", "throughput": 2311.46, "total_tokens": 37843880} {"current_steps": 65610, "total_steps": 67140, "loss": 0.4471, "lr": 7.915587139280811e-08, "epoch": 9.772117962466488, "percentage": 97.72, "elapsed_time": "4:32:53", "remaining_time": "0:06:21", "throughput": 2311.47, "total_tokens": 37846760} {"current_steps": 65615, "total_steps": 67140, "loss": 0.612, "lr": 7.863996571653431e-08, "epoch": 9.772862675007447, "percentage": 97.73, "elapsed_time": "4:32:54", "remaining_time": "0:06:20", "throughput": 2311.47, "total_tokens": 37849320} {"current_steps": 65620, "total_steps": 67140, "loss": 0.6776, "lr": 7.812574412444929e-08, "epoch": 9.773607387548406, "percentage": 97.74, "elapsed_time": "4:32:55", "remaining_time": "0:06:19", "throughput": 2311.47, "total_tokens": 37851816} {"current_steps": 65625, "total_steps": 67140, "loss": 0.472, "lr": 7.761320665130301e-08, "epoch": 9.774352100089365, "percentage": 97.74, "elapsed_time": "4:32:56", "remaining_time": "0:06:18", "throughput": 2311.49, "total_tokens": 37854600} {"current_steps": 65630, "total_steps": 67140, "loss": 0.8315, "lr": 7.71023533317261e-08, "epoch": 9.775096812630325, "percentage": 97.75, "elapsed_time": "4:32:57", "remaining_time": "0:06:16", "throughput": 2311.5, "total_tokens": 37857448} {"current_steps": 65635, "total_steps": 67140, "loss": 0.5427, "lr": 7.659318420024653e-08, "epoch": 9.775841525171284, "percentage": 97.76, "elapsed_time": "4:32:59", "remaining_time": "0:06:15", "throughput": 2311.52, "total_tokens": 37860392} {"current_steps": 65640, "total_steps": 67140, "loss": 0.499, "lr": 7.60856992912673e-08, "epoch": 9.776586237712243, "percentage": 97.77, "elapsed_time": "4:33:00", "remaining_time": "0:06:14", "throughput": 2311.55, "total_tokens": 37863752} {"current_steps": 65645, "total_steps": 67140, "loss": 0.4258, "lr": 7.557989863908044e-08, "epoch": 9.777330950253202, "percentage": 97.77, "elapsed_time": "4:33:01", "remaining_time": "0:06:13", "throughput": 2311.56, "total_tokens": 37866504} {"current_steps": 65650, "total_steps": 67140, "loss": 0.6804, "lr": 7.507578227787249e-08, "epoch": 9.778075662794162, "percentage": 97.78, "elapsed_time": "4:33:02", "remaining_time": "0:06:11", "throughput": 2311.59, "total_tokens": 37869640} {"current_steps": 65655, "total_steps": 67140, "loss": 0.5176, "lr": 7.457335024170231e-08, "epoch": 9.77882037533512, "percentage": 97.79, "elapsed_time": "4:33:03", "remaining_time": "0:06:10", "throughput": 2311.61, "total_tokens": 37872584} {"current_steps": 65660, "total_steps": 67140, "loss": 0.6334, "lr": 7.407260256452885e-08, "epoch": 9.77956508787608, "percentage": 97.8, "elapsed_time": "4:33:04", "remaining_time": "0:06:09", "throughput": 2311.63, "total_tokens": 37875592} {"current_steps": 65665, "total_steps": 67140, "loss": 0.6233, "lr": 7.357353928018618e-08, "epoch": 9.780309800417038, "percentage": 97.8, "elapsed_time": "4:33:05", "remaining_time": "0:06:08", "throughput": 2311.65, "total_tokens": 37878536} {"current_steps": 65670, "total_steps": 67140, "loss": 0.5903, "lr": 7.307616042240007e-08, "epoch": 9.781054512957999, "percentage": 97.81, "elapsed_time": "4:33:07", "remaining_time": "0:06:06", "throughput": 2311.66, "total_tokens": 37881288} {"current_steps": 65675, "total_steps": 67140, "loss": 0.4546, "lr": 7.258046602478252e-08, "epoch": 9.781799225498958, "percentage": 97.82, "elapsed_time": "4:33:08", "remaining_time": "0:06:05", "throughput": 2311.67, "total_tokens": 37884008} {"current_steps": 65680, "total_steps": 67140, "loss": 0.704, "lr": 7.208645612082899e-08, "epoch": 9.782543938039916, "percentage": 97.83, "elapsed_time": "4:33:09", "remaining_time": "0:06:04", "throughput": 2311.69, "total_tokens": 37886888} {"current_steps": 65685, "total_steps": 67140, "loss": 0.8513, "lr": 7.159413074392107e-08, "epoch": 9.783288650580875, "percentage": 97.83, "elapsed_time": "4:33:10", "remaining_time": "0:06:03", "throughput": 2311.71, "total_tokens": 37889896} {"current_steps": 65690, "total_steps": 67140, "loss": 0.6046, "lr": 7.110348992733217e-08, "epoch": 9.784033363121836, "percentage": 97.84, "elapsed_time": "4:33:11", "remaining_time": "0:06:01", "throughput": 2311.73, "total_tokens": 37892840} {"current_steps": 65695, "total_steps": 67140, "loss": 0.4809, "lr": 7.061453370421634e-08, "epoch": 9.784778075662794, "percentage": 97.85, "elapsed_time": "4:33:12", "remaining_time": "0:06:00", "throughput": 2311.74, "total_tokens": 37895560} {"current_steps": 65700, "total_steps": 67140, "loss": 0.518, "lr": 7.012726210761656e-08, "epoch": 9.785522788203753, "percentage": 97.86, "elapsed_time": "4:33:13", "remaining_time": "0:05:59", "throughput": 2311.74, "total_tokens": 37898120} {"current_steps": 65705, "total_steps": 67140, "loss": 0.3767, "lr": 6.96416751704565e-08, "epoch": 9.786267500744712, "percentage": 97.86, "elapsed_time": "4:33:14", "remaining_time": "0:05:58", "throughput": 2311.75, "total_tokens": 37900968} {"current_steps": 65710, "total_steps": 67140, "loss": 0.5597, "lr": 6.915777292555159e-08, "epoch": 9.787012213285673, "percentage": 97.87, "elapsed_time": "4:33:16", "remaining_time": "0:05:56", "throughput": 2311.77, "total_tokens": 37903912} {"current_steps": 65715, "total_steps": 67140, "loss": 0.6346, "lr": 6.867555540560621e-08, "epoch": 9.787756925826631, "percentage": 97.88, "elapsed_time": "4:33:17", "remaining_time": "0:05:55", "throughput": 2311.79, "total_tokens": 37906920} {"current_steps": 65720, "total_steps": 67140, "loss": 0.4291, "lr": 6.819502264319988e-08, "epoch": 9.78850163836759, "percentage": 97.89, "elapsed_time": "4:33:18", "remaining_time": "0:05:54", "throughput": 2311.81, "total_tokens": 37909768} {"current_steps": 65725, "total_steps": 67140, "loss": 0.4573, "lr": 6.771617467080938e-08, "epoch": 9.789246350908549, "percentage": 97.89, "elapsed_time": "4:33:19", "remaining_time": "0:05:53", "throughput": 2311.82, "total_tokens": 37912648} {"current_steps": 65730, "total_steps": 67140, "loss": 0.5444, "lr": 6.723901152079492e-08, "epoch": 9.78999106344951, "percentage": 97.9, "elapsed_time": "4:33:20", "remaining_time": "0:05:51", "throughput": 2311.83, "total_tokens": 37915240} {"current_steps": 65735, "total_steps": 67140, "loss": 0.3697, "lr": 6.676353322539741e-08, "epoch": 9.790735775990468, "percentage": 97.91, "elapsed_time": "4:33:21", "remaining_time": "0:05:50", "throughput": 2311.83, "total_tokens": 37917928} {"current_steps": 65740, "total_steps": 67140, "loss": 0.6885, "lr": 6.628973981674947e-08, "epoch": 9.791480488531427, "percentage": 97.91, "elapsed_time": "4:33:22", "remaining_time": "0:05:49", "throughput": 2311.88, "total_tokens": 37921704} {"current_steps": 65745, "total_steps": 67140, "loss": 0.5548, "lr": 6.581763132686714e-08, "epoch": 9.792225201072386, "percentage": 97.92, "elapsed_time": "4:33:24", "remaining_time": "0:05:48", "throughput": 2311.89, "total_tokens": 37924424} {"current_steps": 65750, "total_steps": 67140, "loss": 0.4161, "lr": 6.534720778765547e-08, "epoch": 9.792969913613344, "percentage": 97.93, "elapsed_time": "4:33:25", "remaining_time": "0:05:46", "throughput": 2311.9, "total_tokens": 37927144} {"current_steps": 65755, "total_steps": 67140, "loss": 0.4158, "lr": 6.487846923090012e-08, "epoch": 9.793714626154305, "percentage": 97.94, "elapsed_time": "4:33:26", "remaining_time": "0:05:45", "throughput": 2311.91, "total_tokens": 37929800} {"current_steps": 65760, "total_steps": 67140, "loss": 0.6195, "lr": 6.441141568828135e-08, "epoch": 9.794459338695264, "percentage": 97.94, "elapsed_time": "4:33:27", "remaining_time": "0:05:44", "throughput": 2311.92, "total_tokens": 37932616} {"current_steps": 65765, "total_steps": 67140, "loss": 0.5003, "lr": 6.394604719135722e-08, "epoch": 9.795204051236222, "percentage": 97.95, "elapsed_time": "4:33:28", "remaining_time": "0:05:43", "throughput": 2311.94, "total_tokens": 37935432} {"current_steps": 65770, "total_steps": 67140, "loss": 0.7786, "lr": 6.348236377157756e-08, "epoch": 9.795948763777183, "percentage": 97.96, "elapsed_time": "4:33:29", "remaining_time": "0:05:41", "throughput": 2311.96, "total_tokens": 37938440} {"current_steps": 65775, "total_steps": 67140, "loss": 0.7462, "lr": 6.30203654602729e-08, "epoch": 9.796693476318142, "percentage": 97.97, "elapsed_time": "4:33:30", "remaining_time": "0:05:40", "throughput": 2311.97, "total_tokens": 37941384} {"current_steps": 65780, "total_steps": 67140, "loss": 0.5663, "lr": 6.256005228866824e-08, "epoch": 9.7974381888591, "percentage": 97.97, "elapsed_time": "4:33:31", "remaining_time": "0:05:39", "throughput": 2311.99, "total_tokens": 37944296} {"current_steps": 65785, "total_steps": 67140, "loss": 0.5587, "lr": 6.210142428786647e-08, "epoch": 9.79818290140006, "percentage": 97.98, "elapsed_time": "4:33:33", "remaining_time": "0:05:38", "throughput": 2312.01, "total_tokens": 37947240} {"current_steps": 65790, "total_steps": 67140, "loss": 0.4268, "lr": 6.164448148885948e-08, "epoch": 9.798927613941018, "percentage": 97.99, "elapsed_time": "4:33:34", "remaining_time": "0:05:36", "throughput": 2312.03, "total_tokens": 37950376} {"current_steps": 65795, "total_steps": 67140, "loss": 0.5476, "lr": 6.118922392252813e-08, "epoch": 9.799672326481979, "percentage": 98.0, "elapsed_time": "4:33:35", "remaining_time": "0:05:35", "throughput": 2312.05, "total_tokens": 37953416} {"current_steps": 65800, "total_steps": 67140, "loss": 0.532, "lr": 6.07356516196339e-08, "epoch": 9.800417039022937, "percentage": 98.0, "elapsed_time": "4:33:36", "remaining_time": "0:05:34", "throughput": 2312.08, "total_tokens": 37956520} {"current_steps": 65805, "total_steps": 67140, "loss": 0.6366, "lr": 6.028376461082729e-08, "epoch": 9.801161751563896, "percentage": 98.01, "elapsed_time": "4:33:37", "remaining_time": "0:05:33", "throughput": 2312.09, "total_tokens": 37959272} {"current_steps": 65810, "total_steps": 67140, "loss": 0.4293, "lr": 5.983356292664776e-08, "epoch": 9.801906464104855, "percentage": 98.02, "elapsed_time": "4:33:38", "remaining_time": "0:05:31", "throughput": 2312.1, "total_tokens": 37962088} {"current_steps": 65815, "total_steps": 67140, "loss": 0.452, "lr": 5.9385046597518204e-08, "epoch": 9.802651176645815, "percentage": 98.03, "elapsed_time": "4:33:39", "remaining_time": "0:05:30", "throughput": 2312.11, "total_tokens": 37964680} {"current_steps": 65820, "total_steps": 67140, "loss": 0.5746, "lr": 5.893821565374491e-08, "epoch": 9.803395889186774, "percentage": 98.03, "elapsed_time": "4:33:41", "remaining_time": "0:05:29", "throughput": 2312.12, "total_tokens": 37967496} {"current_steps": 65825, "total_steps": 67140, "loss": 0.6436, "lr": 5.8493070125523184e-08, "epoch": 9.804140601727733, "percentage": 98.04, "elapsed_time": "4:33:42", "remaining_time": "0:05:28", "throughput": 2312.14, "total_tokens": 37970504} {"current_steps": 65830, "total_steps": 67140, "loss": 0.5039, "lr": 5.804961004293452e-08, "epoch": 9.804885314268692, "percentage": 98.05, "elapsed_time": "4:33:43", "remaining_time": "0:05:26", "throughput": 2312.16, "total_tokens": 37973288} {"current_steps": 65835, "total_steps": 67140, "loss": 0.7609, "lr": 5.760783543594939e-08, "epoch": 9.805630026809652, "percentage": 98.06, "elapsed_time": "4:33:44", "remaining_time": "0:05:25", "throughput": 2312.18, "total_tokens": 37976328} {"current_steps": 65840, "total_steps": 67140, "loss": 0.4474, "lr": 5.716774633441613e-08, "epoch": 9.80637473935061, "percentage": 98.06, "elapsed_time": "4:33:45", "remaining_time": "0:05:24", "throughput": 2312.2, "total_tokens": 37979304} {"current_steps": 65845, "total_steps": 67140, "loss": 0.4875, "lr": 5.672934276807762e-08, "epoch": 9.80711945189157, "percentage": 98.07, "elapsed_time": "4:33:46", "remaining_time": "0:05:23", "throughput": 2312.22, "total_tokens": 37982312} {"current_steps": 65850, "total_steps": 67140, "loss": 0.5851, "lr": 5.629262476655739e-08, "epoch": 9.807864164432528, "percentage": 98.08, "elapsed_time": "4:33:47", "remaining_time": "0:05:21", "throughput": 2312.26, "total_tokens": 37985768} {"current_steps": 65855, "total_steps": 67140, "loss": 0.6468, "lr": 5.585759235936794e-08, "epoch": 9.808608876973489, "percentage": 98.09, "elapsed_time": "4:33:49", "remaining_time": "0:05:20", "throughput": 2312.27, "total_tokens": 37988680} {"current_steps": 65860, "total_steps": 67140, "loss": 0.5323, "lr": 5.54242455759052e-08, "epoch": 9.809353589514448, "percentage": 98.09, "elapsed_time": "4:33:50", "remaining_time": "0:05:19", "throughput": 2312.3, "total_tokens": 37991784} {"current_steps": 65865, "total_steps": 67140, "loss": 0.5385, "lr": 5.499258444545685e-08, "epoch": 9.810098302055406, "percentage": 98.1, "elapsed_time": "4:33:51", "remaining_time": "0:05:18", "throughput": 2312.31, "total_tokens": 37994472} {"current_steps": 65870, "total_steps": 67140, "loss": 0.5359, "lr": 5.4562608997191234e-08, "epoch": 9.810843014596365, "percentage": 98.11, "elapsed_time": "4:33:52", "remaining_time": "0:05:16", "throughput": 2312.32, "total_tokens": 37997320} {"current_steps": 65875, "total_steps": 67140, "loss": 0.51, "lr": 5.413431926016288e-08, "epoch": 9.811587727137326, "percentage": 98.12, "elapsed_time": "4:33:53", "remaining_time": "0:05:15", "throughput": 2312.33, "total_tokens": 38000104} {"current_steps": 65880, "total_steps": 67140, "loss": 0.503, "lr": 5.3707715263315305e-08, "epoch": 9.812332439678285, "percentage": 98.12, "elapsed_time": "4:33:54", "remaining_time": "0:05:14", "throughput": 2312.34, "total_tokens": 38002856} {"current_steps": 65885, "total_steps": 67140, "loss": 0.4112, "lr": 5.328279703547545e-08, "epoch": 9.813077152219243, "percentage": 98.13, "elapsed_time": "4:33:55", "remaining_time": "0:05:13", "throughput": 2312.37, "total_tokens": 38005928} {"current_steps": 65890, "total_steps": 67140, "loss": 0.5482, "lr": 5.285956460535646e-08, "epoch": 9.813821864760202, "percentage": 98.14, "elapsed_time": "4:33:57", "remaining_time": "0:05:11", "throughput": 2312.38, "total_tokens": 38008744} {"current_steps": 65895, "total_steps": 67140, "loss": 0.5271, "lr": 5.243801800156323e-08, "epoch": 9.814566577301163, "percentage": 98.15, "elapsed_time": "4:33:58", "remaining_time": "0:05:10", "throughput": 2312.39, "total_tokens": 38011624} {"current_steps": 65900, "total_steps": 67140, "loss": 0.5905, "lr": 5.2018157252578525e-08, "epoch": 9.815311289842121, "percentage": 98.15, "elapsed_time": "4:33:59", "remaining_time": "0:05:09", "throughput": 2312.4, "total_tokens": 38014408} {"current_steps": 65905, "total_steps": 67140, "loss": 0.5455, "lr": 5.15999823867741e-08, "epoch": 9.81605600238308, "percentage": 98.16, "elapsed_time": "4:34:00", "remaining_time": "0:05:08", "throughput": 2312.42, "total_tokens": 38017256} {"current_steps": 65910, "total_steps": 67140, "loss": 0.5653, "lr": 5.118349343241069e-08, "epoch": 9.816800714924039, "percentage": 98.17, "elapsed_time": "4:34:01", "remaining_time": "0:05:06", "throughput": 2312.44, "total_tokens": 38020200} {"current_steps": 65915, "total_steps": 67140, "loss": 0.4749, "lr": 5.076869041763521e-08, "epoch": 9.817545427465, "percentage": 98.18, "elapsed_time": "4:34:02", "remaining_time": "0:05:05", "throughput": 2312.47, "total_tokens": 38023400} {"current_steps": 65920, "total_steps": 67140, "loss": 0.3981, "lr": 5.0355573370472475e-08, "epoch": 9.818290140005958, "percentage": 98.18, "elapsed_time": "4:34:03", "remaining_time": "0:05:04", "throughput": 2312.48, "total_tokens": 38026312} {"current_steps": 65925, "total_steps": 67140, "loss": 0.4578, "lr": 4.9944142318841816e-08, "epoch": 9.819034852546917, "percentage": 98.19, "elapsed_time": "4:34:05", "remaining_time": "0:05:03", "throughput": 2312.51, "total_tokens": 38029448} {"current_steps": 65930, "total_steps": 67140, "loss": 0.7293, "lr": 4.953439729054876e-08, "epoch": 9.819779565087876, "percentage": 98.2, "elapsed_time": "4:34:06", "remaining_time": "0:05:01", "throughput": 2312.52, "total_tokens": 38032200} {"current_steps": 65935, "total_steps": 67140, "loss": 0.6568, "lr": 4.9126338313279504e-08, "epoch": 9.820524277628834, "percentage": 98.21, "elapsed_time": "4:34:07", "remaining_time": "0:05:00", "throughput": 2312.54, "total_tokens": 38035208} {"current_steps": 65940, "total_steps": 67140, "loss": 0.5826, "lr": 4.8719965414606436e-08, "epoch": 9.821268990169795, "percentage": 98.21, "elapsed_time": "4:34:08", "remaining_time": "0:04:59", "throughput": 2312.55, "total_tokens": 38038088} {"current_steps": 65945, "total_steps": 67140, "loss": 0.7809, "lr": 4.831527862199647e-08, "epoch": 9.822013702710754, "percentage": 98.22, "elapsed_time": "4:34:09", "remaining_time": "0:04:58", "throughput": 2312.55, "total_tokens": 38040616} {"current_steps": 65950, "total_steps": 67140, "loss": 0.658, "lr": 4.791227796279163e-08, "epoch": 9.822758415251712, "percentage": 98.23, "elapsed_time": "4:34:10", "remaining_time": "0:04:56", "throughput": 2312.57, "total_tokens": 38043464} {"current_steps": 65955, "total_steps": 67140, "loss": 0.5429, "lr": 4.751096346423123e-08, "epoch": 9.823503127792671, "percentage": 98.24, "elapsed_time": "4:34:11", "remaining_time": "0:04:55", "throughput": 2312.59, "total_tokens": 38046376} {"current_steps": 65960, "total_steps": 67140, "loss": 0.4774, "lr": 4.711133515342692e-08, "epoch": 9.824247840333632, "percentage": 98.24, "elapsed_time": "4:34:13", "remaining_time": "0:04:54", "throughput": 2312.61, "total_tokens": 38049320} {"current_steps": 65965, "total_steps": 67140, "loss": 0.5356, "lr": 4.6713393057387646e-08, "epoch": 9.82499255287459, "percentage": 98.25, "elapsed_time": "4:34:14", "remaining_time": "0:04:53", "throughput": 2312.62, "total_tokens": 38052072} {"current_steps": 65970, "total_steps": 67140, "loss": 0.541, "lr": 4.631713720300856e-08, "epoch": 9.82573726541555, "percentage": 98.26, "elapsed_time": "4:34:15", "remaining_time": "0:04:51", "throughput": 2312.63, "total_tokens": 38054952} {"current_steps": 65975, "total_steps": 67140, "loss": 0.3824, "lr": 4.592256761705993e-08, "epoch": 9.826481977956508, "percentage": 98.26, "elapsed_time": "4:34:16", "remaining_time": "0:04:50", "throughput": 2312.65, "total_tokens": 38057832} {"current_steps": 65980, "total_steps": 67140, "loss": 0.4462, "lr": 4.5529684326206526e-08, "epoch": 9.827226690497469, "percentage": 98.27, "elapsed_time": "4:34:17", "remaining_time": "0:04:49", "throughput": 2312.66, "total_tokens": 38060744} {"current_steps": 65985, "total_steps": 67140, "loss": 0.5249, "lr": 4.51384873570021e-08, "epoch": 9.827971403038427, "percentage": 98.28, "elapsed_time": "4:34:18", "remaining_time": "0:04:48", "throughput": 2312.67, "total_tokens": 38063432} {"current_steps": 65990, "total_steps": 67140, "loss": 0.5583, "lr": 4.47489767358783e-08, "epoch": 9.828716115579386, "percentage": 98.29, "elapsed_time": "4:34:19", "remaining_time": "0:04:46", "throughput": 2312.68, "total_tokens": 38066120} {"current_steps": 65995, "total_steps": 67140, "loss": 0.5172, "lr": 4.436115248915851e-08, "epoch": 9.829460828120345, "percentage": 98.29, "elapsed_time": "4:34:20", "remaining_time": "0:04:45", "throughput": 2312.69, "total_tokens": 38068776} {"current_steps": 66000, "total_steps": 67140, "loss": 0.4651, "lr": 4.397501464304954e-08, "epoch": 9.830205540661305, "percentage": 98.3, "elapsed_time": "4:34:21", "remaining_time": "0:04:44", "throughput": 2312.71, "total_tokens": 38071816} {"current_steps": 66005, "total_steps": 67140, "loss": 0.4628, "lr": 4.3590563223647184e-08, "epoch": 9.830950253202264, "percentage": 98.31, "elapsed_time": "4:34:23", "remaining_time": "0:04:43", "throughput": 2312.72, "total_tokens": 38074536} {"current_steps": 66010, "total_steps": 67140, "loss": 0.5411, "lr": 4.320779825692789e-08, "epoch": 9.831694965743223, "percentage": 98.32, "elapsed_time": "4:34:24", "remaining_time": "0:04:41", "throughput": 2312.73, "total_tokens": 38077224} {"current_steps": 66015, "total_steps": 67140, "loss": 0.5839, "lr": 4.2826719768757074e-08, "epoch": 9.832439678284182, "percentage": 98.32, "elapsed_time": "4:34:25", "remaining_time": "0:04:40", "throughput": 2312.75, "total_tokens": 38080168} {"current_steps": 66020, "total_steps": 67140, "loss": 0.5794, "lr": 4.244732778489191e-08, "epoch": 9.833184390825142, "percentage": 98.33, "elapsed_time": "4:34:26", "remaining_time": "0:04:39", "throughput": 2312.77, "total_tokens": 38083176} {"current_steps": 66025, "total_steps": 67140, "loss": 0.5379, "lr": 4.20696223309619e-08, "epoch": 9.833929103366101, "percentage": 98.34, "elapsed_time": "4:34:27", "remaining_time": "0:04:38", "throughput": 2312.78, "total_tokens": 38086120} {"current_steps": 66030, "total_steps": 67140, "loss": 0.6161, "lr": 4.1693603432499396e-08, "epoch": 9.83467381590706, "percentage": 98.35, "elapsed_time": "4:34:28", "remaining_time": "0:04:36", "throughput": 2312.8, "total_tokens": 38089128} {"current_steps": 66035, "total_steps": 67140, "loss": 0.6207, "lr": 4.13192711149063e-08, "epoch": 9.835418528448018, "percentage": 98.35, "elapsed_time": "4:34:29", "remaining_time": "0:04:35", "throughput": 2312.82, "total_tokens": 38092040} {"current_steps": 66040, "total_steps": 67140, "loss": 0.59, "lr": 4.0946625403484593e-08, "epoch": 9.836163240988979, "percentage": 98.36, "elapsed_time": "4:34:31", "remaining_time": "0:04:34", "throughput": 2312.83, "total_tokens": 38094856} {"current_steps": 66045, "total_steps": 67140, "loss": 0.6007, "lr": 4.057566632341414e-08, "epoch": 9.836907953529938, "percentage": 98.37, "elapsed_time": "4:34:32", "remaining_time": "0:04:33", "throughput": 2312.85, "total_tokens": 38097800} {"current_steps": 66050, "total_steps": 67140, "loss": 0.5677, "lr": 4.0206393899761e-08, "epoch": 9.837652666070897, "percentage": 98.38, "elapsed_time": "4:34:33", "remaining_time": "0:04:31", "throughput": 2312.87, "total_tokens": 38100808} {"current_steps": 66055, "total_steps": 67140, "loss": 0.6779, "lr": 3.98388081574802e-08, "epoch": 9.838397378611855, "percentage": 98.38, "elapsed_time": "4:34:34", "remaining_time": "0:04:30", "throughput": 2312.89, "total_tokens": 38103784} {"current_steps": 66060, "total_steps": 67140, "loss": 0.5196, "lr": 3.9472909121412994e-08, "epoch": 9.839142091152816, "percentage": 98.39, "elapsed_time": "4:34:35", "remaining_time": "0:04:29", "throughput": 2312.9, "total_tokens": 38106664} {"current_steps": 66065, "total_steps": 67140, "loss": 0.565, "lr": 3.910869681628404e-08, "epoch": 9.839886803693775, "percentage": 98.4, "elapsed_time": "4:34:36", "remaining_time": "0:04:28", "throughput": 2312.92, "total_tokens": 38109672} {"current_steps": 66070, "total_steps": 67140, "loss": 0.3917, "lr": 3.8746171266706985e-08, "epoch": 9.840631516234733, "percentage": 98.41, "elapsed_time": "4:34:37", "remaining_time": "0:04:26", "throughput": 2312.93, "total_tokens": 38112392} {"current_steps": 66075, "total_steps": 67140, "loss": 0.3954, "lr": 3.838533249717891e-08, "epoch": 9.841376228775692, "percentage": 98.41, "elapsed_time": "4:34:39", "remaining_time": "0:04:25", "throughput": 2312.95, "total_tokens": 38115400} {"current_steps": 66080, "total_steps": 67140, "loss": 0.7201, "lr": 3.8026180532083066e-08, "epoch": 9.842120941316653, "percentage": 98.42, "elapsed_time": "4:34:40", "remaining_time": "0:04:24", "throughput": 2312.98, "total_tokens": 38118504} {"current_steps": 66085, "total_steps": 67140, "loss": 0.5566, "lr": 3.766871539568895e-08, "epoch": 9.842865653857611, "percentage": 98.43, "elapsed_time": "4:34:41", "remaining_time": "0:04:23", "throughput": 2312.99, "total_tokens": 38121352} {"current_steps": 66090, "total_steps": 67140, "loss": 0.3021, "lr": 3.7312937112152226e-08, "epoch": 9.84361036639857, "percentage": 98.44, "elapsed_time": "4:34:42", "remaining_time": "0:04:21", "throughput": 2313.01, "total_tokens": 38124200} {"current_steps": 66095, "total_steps": 67140, "loss": 0.6921, "lr": 3.695884570552033e-08, "epoch": 9.844355078939529, "percentage": 98.44, "elapsed_time": "4:34:43", "remaining_time": "0:04:20", "throughput": 2313.03, "total_tokens": 38127112} {"current_steps": 66100, "total_steps": 67140, "loss": 0.7024, "lr": 3.660644119971579e-08, "epoch": 9.84509979148049, "percentage": 98.45, "elapsed_time": "4:34:44", "remaining_time": "0:04:19", "throughput": 2313.04, "total_tokens": 38130088} {"current_steps": 66105, "total_steps": 67140, "loss": 0.623, "lr": 3.6255723618552895e-08, "epoch": 9.845844504021448, "percentage": 98.46, "elapsed_time": "4:34:45", "remaining_time": "0:04:18", "throughput": 2313.06, "total_tokens": 38132872} {"current_steps": 66110, "total_steps": 67140, "loss": 0.4497, "lr": 3.5906692985732124e-08, "epoch": 9.846589216562407, "percentage": 98.47, "elapsed_time": "4:34:47", "remaining_time": "0:04:16", "throughput": 2313.07, "total_tokens": 38135752} {"current_steps": 66115, "total_steps": 67140, "loss": 0.3476, "lr": 3.555934932484295e-08, "epoch": 9.847333929103366, "percentage": 98.47, "elapsed_time": "4:34:48", "remaining_time": "0:04:15", "throughput": 2313.09, "total_tokens": 38138728} {"current_steps": 66120, "total_steps": 67140, "loss": 0.5855, "lr": 3.521369265935548e-08, "epoch": 9.848078641644324, "percentage": 98.48, "elapsed_time": "4:34:49", "remaining_time": "0:04:14", "throughput": 2313.11, "total_tokens": 38141672} {"current_steps": 66125, "total_steps": 67140, "loss": 0.5584, "lr": 3.4869723012623254e-08, "epoch": 9.848823354185285, "percentage": 98.49, "elapsed_time": "4:34:50", "remaining_time": "0:04:13", "throughput": 2313.13, "total_tokens": 38144712} {"current_steps": 66130, "total_steps": 67140, "loss": 0.4571, "lr": 3.452744040789713e-08, "epoch": 9.849568066726244, "percentage": 98.5, "elapsed_time": "4:34:51", "remaining_time": "0:04:11", "throughput": 2313.16, "total_tokens": 38147816} {"current_steps": 66135, "total_steps": 67140, "loss": 0.5414, "lr": 3.418684486830581e-08, "epoch": 9.850312779267203, "percentage": 98.5, "elapsed_time": "4:34:52", "remaining_time": "0:04:10", "throughput": 2313.16, "total_tokens": 38150504} {"current_steps": 66140, "total_steps": 67140, "loss": 0.6478, "lr": 3.384793641686146e-08, "epoch": 9.851057491808161, "percentage": 98.51, "elapsed_time": "4:34:53", "remaining_time": "0:04:09", "throughput": 2313.18, "total_tokens": 38153288} {"current_steps": 66145, "total_steps": 67140, "loss": 0.7607, "lr": 3.351071507646797e-08, "epoch": 9.851802204349122, "percentage": 98.52, "elapsed_time": "4:34:55", "remaining_time": "0:04:08", "throughput": 2313.2, "total_tokens": 38156296} {"current_steps": 66150, "total_steps": 67140, "loss": 0.418, "lr": 3.3175180869915445e-08, "epoch": 9.85254691689008, "percentage": 98.53, "elapsed_time": "4:34:56", "remaining_time": "0:04:06", "throughput": 2313.22, "total_tokens": 38159240} {"current_steps": 66155, "total_steps": 67140, "loss": 0.7915, "lr": 3.2841333819877415e-08, "epoch": 9.85329162943104, "percentage": 98.53, "elapsed_time": "4:34:57", "remaining_time": "0:04:05", "throughput": 2313.24, "total_tokens": 38162440} {"current_steps": 66160, "total_steps": 67140, "loss": 0.4557, "lr": 3.250917394891084e-08, "epoch": 9.854036341971998, "percentage": 98.54, "elapsed_time": "4:34:58", "remaining_time": "0:04:04", "throughput": 2313.27, "total_tokens": 38165448} {"current_steps": 66165, "total_steps": 67140, "loss": 0.4017, "lr": 3.2178701279464426e-08, "epoch": 9.854781054512959, "percentage": 98.55, "elapsed_time": "4:34:59", "remaining_time": "0:04:03", "throughput": 2313.29, "total_tokens": 38168552} {"current_steps": 66170, "total_steps": 67140, "loss": 0.6406, "lr": 3.1849915833870313e-08, "epoch": 9.855525767053917, "percentage": 98.56, "elapsed_time": "4:35:00", "remaining_time": "0:04:01", "throughput": 2313.31, "total_tokens": 38171496} {"current_steps": 66175, "total_steps": 67140, "loss": 0.5519, "lr": 3.1522817634346834e-08, "epoch": 9.856270479594876, "percentage": 98.56, "elapsed_time": "4:35:01", "remaining_time": "0:04:00", "throughput": 2313.32, "total_tokens": 38174248} {"current_steps": 66180, "total_steps": 67140, "loss": 0.4975, "lr": 3.119740670299576e-08, "epoch": 9.857015192135835, "percentage": 98.57, "elapsed_time": "4:35:03", "remaining_time": "0:03:59", "throughput": 2313.33, "total_tokens": 38177000} {"current_steps": 66185, "total_steps": 67140, "loss": 0.5767, "lr": 3.0873683061807826e-08, "epoch": 9.857759904676795, "percentage": 98.58, "elapsed_time": "4:35:04", "remaining_time": "0:03:58", "throughput": 2313.36, "total_tokens": 38180104} {"current_steps": 66190, "total_steps": 67140, "loss": 0.6073, "lr": 3.0551646732659975e-08, "epoch": 9.858504617217754, "percentage": 98.59, "elapsed_time": "4:35:05", "remaining_time": "0:03:56", "throughput": 2313.38, "total_tokens": 38183144} {"current_steps": 66195, "total_steps": 67140, "loss": 0.5733, "lr": 3.0231297737312594e-08, "epoch": 9.859249329758713, "percentage": 98.59, "elapsed_time": "4:35:06", "remaining_time": "0:03:55", "throughput": 2313.39, "total_tokens": 38185864} {"current_steps": 66200, "total_steps": 67140, "loss": 0.6555, "lr": 2.991263609741502e-08, "epoch": 9.859994042299672, "percentage": 98.6, "elapsed_time": "4:35:07", "remaining_time": "0:03:54", "throughput": 2313.41, "total_tokens": 38189032} {"current_steps": 66205, "total_steps": 67140, "loss": 0.4951, "lr": 2.9595661834500023e-08, "epoch": 9.860738754840632, "percentage": 98.61, "elapsed_time": "4:35:08", "remaining_time": "0:03:53", "throughput": 2313.43, "total_tokens": 38191944} {"current_steps": 66210, "total_steps": 67140, "loss": 0.6144, "lr": 2.9280374969989366e-08, "epoch": 9.861483467381591, "percentage": 98.61, "elapsed_time": "4:35:09", "remaining_time": "0:03:51", "throughput": 2313.44, "total_tokens": 38194632} {"current_steps": 66215, "total_steps": 67140, "loss": 0.5729, "lr": 2.8966775525185453e-08, "epoch": 9.86222817992255, "percentage": 98.62, "elapsed_time": "4:35:11", "remaining_time": "0:03:50", "throughput": 2313.46, "total_tokens": 38197576} {"current_steps": 66220, "total_steps": 67140, "loss": 0.4637, "lr": 2.865486352128244e-08, "epoch": 9.862972892463509, "percentage": 98.63, "elapsed_time": "4:35:12", "remaining_time": "0:03:49", "throughput": 2313.48, "total_tokens": 38200520} {"current_steps": 66225, "total_steps": 67140, "loss": 0.5648, "lr": 2.8344638979357907e-08, "epoch": 9.863717605004469, "percentage": 98.64, "elapsed_time": "4:35:13", "remaining_time": "0:03:48", "throughput": 2313.5, "total_tokens": 38203496} {"current_steps": 66230, "total_steps": 67140, "loss": 0.6904, "lr": 2.8036101920375647e-08, "epoch": 9.864462317545428, "percentage": 98.64, "elapsed_time": "4:35:14", "remaining_time": "0:03:46", "throughput": 2313.51, "total_tokens": 38206312} {"current_steps": 66235, "total_steps": 67140, "loss": 0.6284, "lr": 2.7729252365185643e-08, "epoch": 9.865207030086387, "percentage": 98.65, "elapsed_time": "4:35:15", "remaining_time": "0:03:45", "throughput": 2313.52, "total_tokens": 38209064} {"current_steps": 66240, "total_steps": 67140, "loss": 0.5015, "lr": 2.7424090334521313e-08, "epoch": 9.865951742627345, "percentage": 98.66, "elapsed_time": "4:35:16", "remaining_time": "0:03:44", "throughput": 2313.53, "total_tokens": 38211848} {"current_steps": 66245, "total_steps": 67140, "loss": 0.9004, "lr": 2.7120615849007826e-08, "epoch": 9.866696455168306, "percentage": 98.67, "elapsed_time": "4:35:17", "remaining_time": "0:03:43", "throughput": 2313.54, "total_tokens": 38214536} {"current_steps": 66250, "total_steps": 67140, "loss": 0.6178, "lr": 2.681882892914822e-08, "epoch": 9.867441167709265, "percentage": 98.67, "elapsed_time": "4:35:18", "remaining_time": "0:03:41", "throughput": 2313.56, "total_tokens": 38217608} {"current_steps": 66255, "total_steps": 67140, "loss": 0.5273, "lr": 2.6518729595340075e-08, "epoch": 9.868185880250223, "percentage": 98.68, "elapsed_time": "4:35:20", "remaining_time": "0:03:40", "throughput": 2313.58, "total_tokens": 38220520} {"current_steps": 66260, "total_steps": 67140, "loss": 0.5383, "lr": 2.622031786786161e-08, "epoch": 9.868930592791182, "percentage": 98.69, "elapsed_time": "4:35:21", "remaining_time": "0:03:39", "throughput": 2313.6, "total_tokens": 38223368} {"current_steps": 66265, "total_steps": 67140, "loss": 0.3991, "lr": 2.5923593766880026e-08, "epoch": 9.86967530533214, "percentage": 98.7, "elapsed_time": "4:35:22", "remaining_time": "0:03:38", "throughput": 2313.6, "total_tokens": 38226024} {"current_steps": 66270, "total_steps": 67140, "loss": 0.4326, "lr": 2.5628557312440403e-08, "epoch": 9.870420017873101, "percentage": 98.7, "elapsed_time": "4:35:23", "remaining_time": "0:03:36", "throughput": 2313.62, "total_tokens": 38229032} {"current_steps": 66275, "total_steps": 67140, "loss": 0.4299, "lr": 2.5335208524487898e-08, "epoch": 9.87116473041406, "percentage": 98.71, "elapsed_time": "4:35:24", "remaining_time": "0:03:35", "throughput": 2313.64, "total_tokens": 38231880} {"current_steps": 66280, "total_steps": 67140, "loss": 0.5618, "lr": 2.5043547422839986e-08, "epoch": 9.871909442955019, "percentage": 98.72, "elapsed_time": "4:35:25", "remaining_time": "0:03:34", "throughput": 2313.65, "total_tokens": 38234760} {"current_steps": 66285, "total_steps": 67140, "loss": 0.6281, "lr": 2.4753574027211457e-08, "epoch": 9.87265415549598, "percentage": 98.73, "elapsed_time": "4:35:26", "remaining_time": "0:03:33", "throughput": 2313.66, "total_tokens": 38237448} {"current_steps": 66290, "total_steps": 67140, "loss": 0.4924, "lr": 2.4465288357192196e-08, "epoch": 9.873398868036938, "percentage": 98.73, "elapsed_time": "4:35:27", "remaining_time": "0:03:31", "throughput": 2313.67, "total_tokens": 38240104} {"current_steps": 66295, "total_steps": 67140, "loss": 0.6009, "lr": 2.4178690432266617e-08, "epoch": 9.874143580577897, "percentage": 98.74, "elapsed_time": "4:35:29", "remaining_time": "0:03:30", "throughput": 2313.69, "total_tokens": 38243048} {"current_steps": 66300, "total_steps": 67140, "loss": 0.6991, "lr": 2.389378027179978e-08, "epoch": 9.874888293118856, "percentage": 98.75, "elapsed_time": "4:35:30", "remaining_time": "0:03:29", "throughput": 2313.7, "total_tokens": 38245960} {"current_steps": 66305, "total_steps": 67140, "loss": 0.4699, "lr": 2.3610557895045736e-08, "epoch": 9.875633005659815, "percentage": 98.76, "elapsed_time": "4:35:31", "remaining_time": "0:03:28", "throughput": 2313.71, "total_tokens": 38248776} {"current_steps": 66310, "total_steps": 67140, "loss": 0.5829, "lr": 2.3329023321144727e-08, "epoch": 9.876377718200775, "percentage": 98.76, "elapsed_time": "4:35:32", "remaining_time": "0:03:26", "throughput": 2313.74, "total_tokens": 38251880} {"current_steps": 66315, "total_steps": 67140, "loss": 0.588, "lr": 2.304917656912042e-08, "epoch": 9.877122430741734, "percentage": 98.77, "elapsed_time": "4:35:33", "remaining_time": "0:03:25", "throughput": 2313.75, "total_tokens": 38254696} {"current_steps": 66320, "total_steps": 67140, "loss": 0.4962, "lr": 2.27710176578827e-08, "epoch": 9.877867143282693, "percentage": 98.78, "elapsed_time": "4:35:34", "remaining_time": "0:03:24", "throughput": 2313.77, "total_tokens": 38257640} {"current_steps": 66325, "total_steps": 67140, "loss": 0.7025, "lr": 2.2494546606230405e-08, "epoch": 9.878611855823651, "percentage": 98.79, "elapsed_time": "4:35:35", "remaining_time": "0:03:23", "throughput": 2313.79, "total_tokens": 38260680} {"current_steps": 66330, "total_steps": 67140, "loss": 0.4763, "lr": 2.221976343284582e-08, "epoch": 9.879356568364612, "percentage": 98.79, "elapsed_time": "4:35:37", "remaining_time": "0:03:21", "throughput": 2313.8, "total_tokens": 38263464} {"current_steps": 66335, "total_steps": 67140, "loss": 0.6409, "lr": 2.1946668156297422e-08, "epoch": 9.88010128090557, "percentage": 98.8, "elapsed_time": "4:35:38", "remaining_time": "0:03:20", "throughput": 2313.82, "total_tokens": 38266408} {"current_steps": 66340, "total_steps": 67140, "loss": 0.6434, "lr": 2.1675260795037122e-08, "epoch": 9.88084599344653, "percentage": 98.81, "elapsed_time": "4:35:39", "remaining_time": "0:03:19", "throughput": 2313.85, "total_tokens": 38269480} {"current_steps": 66345, "total_steps": 67140, "loss": 0.8816, "lr": 2.1405541367411353e-08, "epoch": 9.881590705987488, "percentage": 98.82, "elapsed_time": "4:35:40", "remaining_time": "0:03:18", "throughput": 2313.85, "total_tokens": 38272168} {"current_steps": 66350, "total_steps": 67140, "loss": 0.4713, "lr": 2.113750989164165e-08, "epoch": 9.882335418528449, "percentage": 98.82, "elapsed_time": "4:35:41", "remaining_time": "0:03:16", "throughput": 2313.88, "total_tokens": 38275304} {"current_steps": 66355, "total_steps": 67140, "loss": 0.6692, "lr": 2.0871166385844077e-08, "epoch": 9.883080131069407, "percentage": 98.83, "elapsed_time": "4:35:42", "remaining_time": "0:03:15", "throughput": 2313.9, "total_tokens": 38278344} {"current_steps": 66360, "total_steps": 67140, "loss": 0.5302, "lr": 2.060651086801535e-08, "epoch": 9.883824843610366, "percentage": 98.84, "elapsed_time": "4:35:43", "remaining_time": "0:03:14", "throughput": 2313.91, "total_tokens": 38281160} {"current_steps": 66365, "total_steps": 67140, "loss": 0.5236, "lr": 2.0343543356038385e-08, "epoch": 9.884569556151325, "percentage": 98.85, "elapsed_time": "4:35:45", "remaining_time": "0:03:13", "throughput": 2313.94, "total_tokens": 38284264} {"current_steps": 66370, "total_steps": 67140, "loss": 0.6002, "lr": 2.008226386768508e-08, "epoch": 9.885314268692285, "percentage": 98.85, "elapsed_time": "4:35:46", "remaining_time": "0:03:11", "throughput": 2313.96, "total_tokens": 38287272} {"current_steps": 66375, "total_steps": 67140, "loss": 0.5711, "lr": 1.982267242061353e-08, "epoch": 9.886058981233244, "percentage": 98.86, "elapsed_time": "4:35:47", "remaining_time": "0:03:10", "throughput": 2313.97, "total_tokens": 38290248} {"current_steps": 66380, "total_steps": 67140, "loss": 0.6859, "lr": 1.9564769032362485e-08, "epoch": 9.886803693774203, "percentage": 98.87, "elapsed_time": "4:35:48", "remaining_time": "0:03:09", "throughput": 2313.98, "total_tokens": 38292936} {"current_steps": 66385, "total_steps": 67140, "loss": 0.4625, "lr": 1.9308553720359667e-08, "epoch": 9.887548406315162, "percentage": 98.88, "elapsed_time": "4:35:49", "remaining_time": "0:03:08", "throughput": 2314.01, "total_tokens": 38296008} {"current_steps": 66390, "total_steps": 67140, "loss": 0.5549, "lr": 1.9054026501921785e-08, "epoch": 9.888293118856122, "percentage": 98.88, "elapsed_time": "4:35:50", "remaining_time": "0:03:06", "throughput": 2314.02, "total_tokens": 38298888} {"current_steps": 66395, "total_steps": 67140, "loss": 0.4309, "lr": 1.8801187394248965e-08, "epoch": 9.889037831397081, "percentage": 98.89, "elapsed_time": "4:35:51", "remaining_time": "0:03:05", "throughput": 2314.03, "total_tokens": 38301640} {"current_steps": 66400, "total_steps": 67140, "loss": 0.6297, "lr": 1.8550036414424765e-08, "epoch": 9.88978254393804, "percentage": 98.9, "elapsed_time": "4:35:53", "remaining_time": "0:03:04", "throughput": 2314.05, "total_tokens": 38304488} {"current_steps": 66405, "total_steps": 67140, "loss": 0.5524, "lr": 1.830057357942172e-08, "epoch": 9.890527256478999, "percentage": 98.91, "elapsed_time": "4:35:54", "remaining_time": "0:03:03", "throughput": 2314.06, "total_tokens": 38307272} {"current_steps": 66410, "total_steps": 67140, "loss": 0.6517, "lr": 1.8052798906098568e-08, "epoch": 9.891271969019959, "percentage": 98.91, "elapsed_time": "4:35:55", "remaining_time": "0:03:01", "throughput": 2314.06, "total_tokens": 38309896} {"current_steps": 66415, "total_steps": 67140, "loss": 0.3629, "lr": 1.780671241119469e-08, "epoch": 9.892016681560918, "percentage": 98.92, "elapsed_time": "4:35:56", "remaining_time": "0:03:00", "throughput": 2314.07, "total_tokens": 38312584} {"current_steps": 66420, "total_steps": 67140, "loss": 0.562, "lr": 1.756231411134679e-08, "epoch": 9.892761394101877, "percentage": 98.93, "elapsed_time": "4:35:57", "remaining_time": "0:02:59", "throughput": 2314.1, "total_tokens": 38315656} {"current_steps": 66425, "total_steps": 67140, "loss": 0.5753, "lr": 1.7319604023066648e-08, "epoch": 9.893506106642835, "percentage": 98.94, "elapsed_time": "4:35:58", "remaining_time": "0:02:58", "throughput": 2314.12, "total_tokens": 38318664} {"current_steps": 66430, "total_steps": 67140, "loss": 0.679, "lr": 1.7078582162752265e-08, "epoch": 9.894250819183796, "percentage": 98.94, "elapsed_time": "4:35:59", "remaining_time": "0:02:56", "throughput": 2314.13, "total_tokens": 38321544} {"current_steps": 66435, "total_steps": 67140, "loss": 0.4299, "lr": 1.6839248546696163e-08, "epoch": 9.894995531724755, "percentage": 98.95, "elapsed_time": "4:36:00", "remaining_time": "0:02:55", "throughput": 2314.15, "total_tokens": 38324456} {"current_steps": 66440, "total_steps": 67140, "loss": 0.6426, "lr": 1.6601603191071513e-08, "epoch": 9.895740244265713, "percentage": 98.96, "elapsed_time": "4:36:02", "remaining_time": "0:02:54", "throughput": 2314.17, "total_tokens": 38327464} {"current_steps": 66445, "total_steps": 67140, "loss": 0.6174, "lr": 1.6365646111932144e-08, "epoch": 9.896484956806672, "percentage": 98.96, "elapsed_time": "4:36:03", "remaining_time": "0:02:53", "throughput": 2314.18, "total_tokens": 38330312} {"current_steps": 66450, "total_steps": 67140, "loss": 0.4361, "lr": 1.6131377325226405e-08, "epoch": 9.897229669347631, "percentage": 98.97, "elapsed_time": "4:36:04", "remaining_time": "0:02:51", "throughput": 2314.2, "total_tokens": 38333160} {"current_steps": 66455, "total_steps": 67140, "loss": 0.6406, "lr": 1.589879684678608e-08, "epoch": 9.897974381888591, "percentage": 98.98, "elapsed_time": "4:36:05", "remaining_time": "0:02:50", "throughput": 2314.21, "total_tokens": 38335944} {"current_steps": 66460, "total_steps": 67140, "loss": 0.7698, "lr": 1.566790469232915e-08, "epoch": 9.89871909442955, "percentage": 98.99, "elapsed_time": "4:36:06", "remaining_time": "0:02:49", "throughput": 2314.24, "total_tokens": 38339016} {"current_steps": 66465, "total_steps": 67140, "loss": 0.6235, "lr": 1.543870087745425e-08, "epoch": 9.899463806970509, "percentage": 98.99, "elapsed_time": "4:36:07", "remaining_time": "0:02:48", "throughput": 2314.26, "total_tokens": 38341992} {"current_steps": 66470, "total_steps": 67140, "loss": 0.6032, "lr": 1.5211185417651762e-08, "epoch": 9.900208519511468, "percentage": 99.0, "elapsed_time": "4:36:08", "remaining_time": "0:02:47", "throughput": 2314.27, "total_tokens": 38344712} {"current_steps": 66475, "total_steps": 67140, "loss": 0.4832, "lr": 1.4985358328298284e-08, "epoch": 9.900953232052428, "percentage": 99.01, "elapsed_time": "4:36:09", "remaining_time": "0:02:45", "throughput": 2314.28, "total_tokens": 38347464} {"current_steps": 66480, "total_steps": 67140, "loss": 0.535, "lr": 1.4761219624651045e-08, "epoch": 9.901697944593387, "percentage": 99.02, "elapsed_time": "4:36:11", "remaining_time": "0:02:44", "throughput": 2314.3, "total_tokens": 38350632} {"current_steps": 66485, "total_steps": 67140, "loss": 0.6853, "lr": 1.4538769321859046e-08, "epoch": 9.902442657134346, "percentage": 99.02, "elapsed_time": "4:36:12", "remaining_time": "0:02:43", "throughput": 2314.31, "total_tokens": 38353448} {"current_steps": 66490, "total_steps": 67140, "loss": 0.5578, "lr": 1.431800743495193e-08, "epoch": 9.903187369675305, "percentage": 99.03, "elapsed_time": "4:36:13", "remaining_time": "0:02:42", "throughput": 2314.32, "total_tokens": 38356072} {"current_steps": 66495, "total_steps": 67140, "loss": 0.508, "lr": 1.4098933978851093e-08, "epoch": 9.903932082216265, "percentage": 99.04, "elapsed_time": "4:36:14", "remaining_time": "0:02:40", "throughput": 2314.33, "total_tokens": 38358984} {"current_steps": 66500, "total_steps": 67140, "loss": 0.6551, "lr": 1.3881548968358581e-08, "epoch": 9.904676794757224, "percentage": 99.05, "elapsed_time": "4:36:15", "remaining_time": "0:02:39", "throughput": 2314.34, "total_tokens": 38361736} {"current_steps": 66505, "total_steps": 67140, "loss": 0.563, "lr": 1.3665852418165426e-08, "epoch": 9.905421507298183, "percentage": 99.05, "elapsed_time": "4:36:16", "remaining_time": "0:02:38", "throughput": 2314.36, "total_tokens": 38364584} {"current_steps": 66510, "total_steps": 67140, "loss": 0.522, "lr": 1.3451844342846077e-08, "epoch": 9.906166219839141, "percentage": 99.06, "elapsed_time": "4:36:17", "remaining_time": "0:02:37", "throughput": 2314.37, "total_tokens": 38367496} {"current_steps": 66515, "total_steps": 67140, "loss": 0.4397, "lr": 1.3239524756863964e-08, "epoch": 9.906910932380102, "percentage": 99.07, "elapsed_time": "4:36:19", "remaining_time": "0:02:35", "throughput": 2314.4, "total_tokens": 38370536} {"current_steps": 66520, "total_steps": 67140, "loss": 0.5988, "lr": 1.302889367456317e-08, "epoch": 9.90765564492106, "percentage": 99.08, "elapsed_time": "4:36:20", "remaining_time": "0:02:34", "throughput": 2314.4, "total_tokens": 38373224} {"current_steps": 66525, "total_steps": 67140, "loss": 0.6691, "lr": 1.2819951110182305e-08, "epoch": 9.90840035746202, "percentage": 99.08, "elapsed_time": "4:36:21", "remaining_time": "0:02:33", "throughput": 2314.42, "total_tokens": 38376104} {"current_steps": 66530, "total_steps": 67140, "loss": 0.4688, "lr": 1.261269707784063e-08, "epoch": 9.909145070002978, "percentage": 99.09, "elapsed_time": "4:36:22", "remaining_time": "0:02:32", "throughput": 2314.43, "total_tokens": 38378888} {"current_steps": 66535, "total_steps": 67140, "loss": 0.5665, "lr": 1.2407131591538057e-08, "epoch": 9.909889782543939, "percentage": 99.1, "elapsed_time": "4:36:23", "remaining_time": "0:02:30", "throughput": 2314.45, "total_tokens": 38381832} {"current_steps": 66540, "total_steps": 67140, "loss": 0.5009, "lr": 1.2203254665171804e-08, "epoch": 9.910634495084897, "percentage": 99.11, "elapsed_time": "4:36:24", "remaining_time": "0:02:29", "throughput": 2314.46, "total_tokens": 38384744} {"current_steps": 66545, "total_steps": 67140, "loss": 0.6156, "lr": 1.2001066312516962e-08, "epoch": 9.911379207625856, "percentage": 99.11, "elapsed_time": "4:36:25", "remaining_time": "0:02:28", "throughput": 2314.49, "total_tokens": 38387816} {"current_steps": 66550, "total_steps": 67140, "loss": 0.4446, "lr": 1.1800566547234825e-08, "epoch": 9.912123920166815, "percentage": 99.12, "elapsed_time": "4:36:27", "remaining_time": "0:02:27", "throughput": 2314.5, "total_tokens": 38390696} {"current_steps": 66555, "total_steps": 67140, "loss": 0.5936, "lr": 1.1601755382875667e-08, "epoch": 9.912868632707776, "percentage": 99.13, "elapsed_time": "4:36:28", "remaining_time": "0:02:25", "throughput": 2314.5, "total_tokens": 38393224} {"current_steps": 66560, "total_steps": 67140, "loss": 0.532, "lr": 1.1404632832873186e-08, "epoch": 9.913613345248734, "percentage": 99.14, "elapsed_time": "4:36:29", "remaining_time": "0:02:24", "throughput": 2314.51, "total_tokens": 38395944} {"current_steps": 66565, "total_steps": 67140, "loss": 0.5573, "lr": 1.1209198910552831e-08, "epoch": 9.914358057789693, "percentage": 99.14, "elapsed_time": "4:36:30", "remaining_time": "0:02:23", "throughput": 2314.53, "total_tokens": 38398792} {"current_steps": 66570, "total_steps": 67140, "loss": 0.5217, "lr": 1.1015453629115158e-08, "epoch": 9.915102770330652, "percentage": 99.15, "elapsed_time": "4:36:31", "remaining_time": "0:02:22", "throughput": 2314.54, "total_tokens": 38401736} {"current_steps": 66575, "total_steps": 67140, "loss": 0.3517, "lr": 1.0823397001655244e-08, "epoch": 9.915847482871612, "percentage": 99.16, "elapsed_time": "4:36:32", "remaining_time": "0:02:20", "throughput": 2314.56, "total_tokens": 38404584} {"current_steps": 66580, "total_steps": 67140, "loss": 0.6516, "lr": 1.0633029041154374e-08, "epoch": 9.916592195412571, "percentage": 99.17, "elapsed_time": "4:36:33", "remaining_time": "0:02:19", "throughput": 2314.58, "total_tokens": 38407496} {"current_steps": 66585, "total_steps": 67140, "loss": 0.6476, "lr": 1.0444349760471705e-08, "epoch": 9.91733690795353, "percentage": 99.17, "elapsed_time": "4:36:34", "remaining_time": "0:02:18", "throughput": 2314.58, "total_tokens": 38410152} {"current_steps": 66590, "total_steps": 67140, "loss": 0.6072, "lr": 1.0257359172360925e-08, "epoch": 9.918081620494489, "percentage": 99.18, "elapsed_time": "4:36:35", "remaining_time": "0:02:17", "throughput": 2314.59, "total_tokens": 38412904} {"current_steps": 66595, "total_steps": 67140, "loss": 0.5355, "lr": 1.0072057289456371e-08, "epoch": 9.91882633303545, "percentage": 99.19, "elapsed_time": "4:36:37", "remaining_time": "0:02:15", "throughput": 2314.62, "total_tokens": 38416008} {"current_steps": 66600, "total_steps": 67140, "loss": 0.4863, "lr": 9.888444124278585e-09, "epoch": 9.919571045576408, "percentage": 99.2, "elapsed_time": "4:36:38", "remaining_time": "0:02:14", "throughput": 2314.64, "total_tokens": 38418952} {"current_steps": 66605, "total_steps": 67140, "loss": 0.7341, "lr": 9.706519689239857e-09, "epoch": 9.920315758117367, "percentage": 99.2, "elapsed_time": "4:36:39", "remaining_time": "0:02:13", "throughput": 2314.65, "total_tokens": 38421672} {"current_steps": 66610, "total_steps": 67140, "loss": 0.647, "lr": 9.526283996630359e-09, "epoch": 9.921060470658325, "percentage": 99.21, "elapsed_time": "4:36:40", "remaining_time": "0:02:12", "throughput": 2314.68, "total_tokens": 38425000} {"current_steps": 66615, "total_steps": 67140, "loss": 0.6145, "lr": 9.347737058632012e-09, "epoch": 9.921805183199286, "percentage": 99.22, "elapsed_time": "4:36:41", "remaining_time": "0:02:10", "throughput": 2314.69, "total_tokens": 38427688} {"current_steps": 66620, "total_steps": 67140, "loss": 0.5235, "lr": 9.170878887307388e-09, "epoch": 9.922549895740245, "percentage": 99.23, "elapsed_time": "4:36:42", "remaining_time": "0:02:09", "throughput": 2314.7, "total_tokens": 38430600} {"current_steps": 66625, "total_steps": 67140, "loss": 0.6301, "lr": 8.995709494610816e-09, "epoch": 9.923294608281203, "percentage": 99.23, "elapsed_time": "4:36:43", "remaining_time": "0:02:08", "throughput": 2314.72, "total_tokens": 38433448} {"current_steps": 66630, "total_steps": 67140, "loss": 0.5037, "lr": 8.82222889237727e-09, "epoch": 9.924039320822162, "percentage": 99.24, "elapsed_time": "4:36:45", "remaining_time": "0:02:07", "throughput": 2314.73, "total_tokens": 38436264} {"current_steps": 66635, "total_steps": 67140, "loss": 0.6592, "lr": 8.65043709233071e-09, "epoch": 9.924784033363121, "percentage": 99.25, "elapsed_time": "4:36:46", "remaining_time": "0:02:05", "throughput": 2314.74, "total_tokens": 38438984} {"current_steps": 66640, "total_steps": 67140, "loss": 0.4916, "lr": 8.480334106081289e-09, "epoch": 9.925528745904082, "percentage": 99.26, "elapsed_time": "4:36:47", "remaining_time": "0:02:04", "throughput": 2314.74, "total_tokens": 38441544} {"current_steps": 66645, "total_steps": 67140, "loss": 0.4762, "lr": 8.311919945119817e-09, "epoch": 9.92627345844504, "percentage": 99.26, "elapsed_time": "4:36:48", "remaining_time": "0:02:03", "throughput": 2314.75, "total_tokens": 38444456} {"current_steps": 66650, "total_steps": 67140, "loss": 0.4289, "lr": 8.145194620834407e-09, "epoch": 9.927018170985999, "percentage": 99.27, "elapsed_time": "4:36:49", "remaining_time": "0:02:02", "throughput": 2314.76, "total_tokens": 38447176} {"current_steps": 66655, "total_steps": 67140, "loss": 0.3566, "lr": 7.98015814448272e-09, "epoch": 9.927762883526958, "percentage": 99.28, "elapsed_time": "4:36:50", "remaining_time": "0:02:00", "throughput": 2314.79, "total_tokens": 38450408} {"current_steps": 66660, "total_steps": 67140, "loss": 0.5305, "lr": 7.81681052722527e-09, "epoch": 9.928507596067918, "percentage": 99.29, "elapsed_time": "4:36:51", "remaining_time": "0:01:59", "throughput": 2314.81, "total_tokens": 38453480} {"current_steps": 66665, "total_steps": 67140, "loss": 0.5682, "lr": 7.655151780094905e-09, "epoch": 9.929252308608877, "percentage": 99.29, "elapsed_time": "4:36:53", "remaining_time": "0:01:58", "throughput": 2314.83, "total_tokens": 38456456} {"current_steps": 66670, "total_steps": 67140, "loss": 0.5787, "lr": 7.49518191401899e-09, "epoch": 9.929997021149836, "percentage": 99.3, "elapsed_time": "4:36:54", "remaining_time": "0:01:57", "throughput": 2314.84, "total_tokens": 38459208} {"current_steps": 66675, "total_steps": 67140, "loss": 0.558, "lr": 7.336900939805546e-09, "epoch": 9.930741733690795, "percentage": 99.31, "elapsed_time": "4:36:55", "remaining_time": "0:01:55", "throughput": 2314.85, "total_tokens": 38461960} {"current_steps": 66680, "total_steps": 67140, "loss": 0.9178, "lr": 7.180308868154351e-09, "epoch": 9.931486446231755, "percentage": 99.31, "elapsed_time": "4:36:56", "remaining_time": "0:01:54", "throughput": 2314.87, "total_tokens": 38464904} {"current_steps": 66685, "total_steps": 67140, "loss": 0.5692, "lr": 7.025405709640276e-09, "epoch": 9.932231158772714, "percentage": 99.32, "elapsed_time": "4:36:57", "remaining_time": "0:01:53", "throughput": 2314.88, "total_tokens": 38467688} {"current_steps": 66690, "total_steps": 67140, "loss": 0.5588, "lr": 6.8721914747382764e-09, "epoch": 9.932975871313673, "percentage": 99.33, "elapsed_time": "4:36:58", "remaining_time": "0:01:52", "throughput": 2314.89, "total_tokens": 38470504} {"current_steps": 66695, "total_steps": 67140, "loss": 0.7774, "lr": 6.720666173798407e-09, "epoch": 9.933720583854631, "percentage": 99.34, "elapsed_time": "4:36:59", "remaining_time": "0:01:50", "throughput": 2314.92, "total_tokens": 38473736} {"current_steps": 66700, "total_steps": 67140, "loss": 0.565, "lr": 6.570829817059699e-09, "epoch": 9.934465296395592, "percentage": 99.34, "elapsed_time": "4:37:01", "remaining_time": "0:01:49", "throughput": 2314.94, "total_tokens": 38476776} {"current_steps": 66705, "total_steps": 67140, "loss": 0.4541, "lr": 6.422682414650161e-09, "epoch": 9.93521000893655, "percentage": 99.35, "elapsed_time": "4:37:02", "remaining_time": "0:01:48", "throughput": 2314.96, "total_tokens": 38479720} {"current_steps": 66710, "total_steps": 67140, "loss": 0.5756, "lr": 6.276223976578455e-09, "epoch": 9.93595472147751, "percentage": 99.36, "elapsed_time": "4:37:03", "remaining_time": "0:01:47", "throughput": 2314.98, "total_tokens": 38482568} {"current_steps": 66715, "total_steps": 67140, "loss": 0.5927, "lr": 6.131454512742218e-09, "epoch": 9.936699434018468, "percentage": 99.37, "elapsed_time": "4:37:04", "remaining_time": "0:01:45", "throughput": 2314.99, "total_tokens": 38485448} {"current_steps": 66720, "total_steps": 67140, "loss": 0.5148, "lr": 5.988374032922517e-09, "epoch": 9.937444146559429, "percentage": 99.37, "elapsed_time": "4:37:05", "remaining_time": "0:01:44", "throughput": 2315.0, "total_tokens": 38488200} {"current_steps": 66725, "total_steps": 67140, "loss": 0.5336, "lr": 5.846982546792168e-09, "epoch": 9.938188859100388, "percentage": 99.38, "elapsed_time": "4:37:06", "remaining_time": "0:01:43", "throughput": 2315.01, "total_tokens": 38490952} {"current_steps": 66730, "total_steps": 67140, "loss": 0.4825, "lr": 5.707280063904641e-09, "epoch": 9.938933571641346, "percentage": 99.39, "elapsed_time": "4:37:07", "remaining_time": "0:01:42", "throughput": 2315.03, "total_tokens": 38493736} {"current_steps": 66735, "total_steps": 67140, "loss": 0.7625, "lr": 5.569266593699607e-09, "epoch": 9.939678284182305, "percentage": 99.4, "elapsed_time": "4:37:08", "remaining_time": "0:01:40", "throughput": 2315.06, "total_tokens": 38497064} {"current_steps": 66740, "total_steps": 67140, "loss": 0.564, "lr": 5.4329421455029395e-09, "epoch": 9.940422996723266, "percentage": 99.4, "elapsed_time": "4:37:10", "remaining_time": "0:01:39", "throughput": 2315.07, "total_tokens": 38499976} {"current_steps": 66745, "total_steps": 67140, "loss": 0.3523, "lr": 5.298306728526714e-09, "epoch": 9.941167709264224, "percentage": 99.41, "elapsed_time": "4:37:11", "remaining_time": "0:01:38", "throughput": 2315.07, "total_tokens": 38502472} {"current_steps": 66750, "total_steps": 67140, "loss": 0.4112, "lr": 5.165360351871984e-09, "epoch": 9.941912421805183, "percentage": 99.42, "elapsed_time": "4:37:12", "remaining_time": "0:01:37", "throughput": 2315.08, "total_tokens": 38505096} {"current_steps": 66755, "total_steps": 67140, "loss": 0.6948, "lr": 5.0341030245204536e-09, "epoch": 9.942657134346142, "percentage": 99.43, "elapsed_time": "4:37:13", "remaining_time": "0:01:35", "throughput": 2315.09, "total_tokens": 38507944} {"current_steps": 66760, "total_steps": 67140, "loss": 0.6579, "lr": 4.904534755340029e-09, "epoch": 9.943401846887102, "percentage": 99.43, "elapsed_time": "4:37:14", "remaining_time": "0:01:34", "throughput": 2315.11, "total_tokens": 38510856} {"current_steps": 66765, "total_steps": 67140, "loss": 0.6982, "lr": 4.77665555309037e-09, "epoch": 9.944146559428061, "percentage": 99.44, "elapsed_time": "4:37:15", "remaining_time": "0:01:33", "throughput": 2315.13, "total_tokens": 38513864} {"current_steps": 66770, "total_steps": 67140, "loss": 0.5639, "lr": 4.650465426409012e-09, "epoch": 9.94489127196902, "percentage": 99.45, "elapsed_time": "4:37:16", "remaining_time": "0:01:32", "throughput": 2315.14, "total_tokens": 38516744} {"current_steps": 66775, "total_steps": 67140, "loss": 0.5432, "lr": 4.525964383828018e-09, "epoch": 9.945635984509979, "percentage": 99.46, "elapsed_time": "4:37:18", "remaining_time": "0:01:30", "throughput": 2315.2, "total_tokens": 38520808} {"current_steps": 66780, "total_steps": 67140, "loss": 0.4588, "lr": 4.40315243375733e-09, "epoch": 9.946380697050937, "percentage": 99.46, "elapsed_time": "4:37:19", "remaining_time": "0:01:29", "throughput": 2315.2, "total_tokens": 38523432} {"current_steps": 66785, "total_steps": 67140, "loss": 0.6551, "lr": 4.282029584495861e-09, "epoch": 9.947125409591898, "percentage": 99.47, "elapsed_time": "4:37:20", "remaining_time": "0:01:28", "throughput": 2315.23, "total_tokens": 38526536} {"current_steps": 66790, "total_steps": 67140, "loss": 0.6695, "lr": 4.1625958442315096e-09, "epoch": 9.947870122132857, "percentage": 99.48, "elapsed_time": "4:37:21", "remaining_time": "0:01:27", "throughput": 2315.25, "total_tokens": 38529640} {"current_steps": 66795, "total_steps": 67140, "loss": 0.7945, "lr": 4.0448512210300436e-09, "epoch": 9.948614834673815, "percentage": 99.49, "elapsed_time": "4:37:22", "remaining_time": "0:01:25", "throughput": 2315.26, "total_tokens": 38532488} {"current_steps": 66800, "total_steps": 67140, "loss": 0.755, "lr": 3.928795722854539e-09, "epoch": 9.949359547214776, "percentage": 99.49, "elapsed_time": "4:37:23", "remaining_time": "0:01:24", "throughput": 2315.28, "total_tokens": 38535464} {"current_steps": 66805, "total_steps": 67140, "loss": 0.5551, "lr": 3.81442935754317e-09, "epoch": 9.950104259755735, "percentage": 99.5, "elapsed_time": "4:37:25", "remaining_time": "0:01:23", "throughput": 2315.29, "total_tokens": 38538216} {"current_steps": 66810, "total_steps": 67140, "loss": 0.5684, "lr": 3.701752132825864e-09, "epoch": 9.950848972296694, "percentage": 99.51, "elapsed_time": "4:37:26", "remaining_time": "0:01:22", "throughput": 2315.3, "total_tokens": 38540872} {"current_steps": 66815, "total_steps": 67140, "loss": 0.566, "lr": 3.590764056315976e-09, "epoch": 9.951593684837652, "percentage": 99.52, "elapsed_time": "4:37:27", "remaining_time": "0:01:20", "throughput": 2315.32, "total_tokens": 38543976} {"current_steps": 66820, "total_steps": 67140, "loss": 0.5914, "lr": 3.481465135515838e-09, "epoch": 9.952338397378611, "percentage": 99.52, "elapsed_time": "4:37:28", "remaining_time": "0:01:19", "throughput": 2315.34, "total_tokens": 38546792} {"current_steps": 66825, "total_steps": 67140, "loss": 0.4765, "lr": 3.3738553778084324e-09, "epoch": 9.953083109919572, "percentage": 99.53, "elapsed_time": "4:37:29", "remaining_time": "0:01:18", "throughput": 2315.37, "total_tokens": 38550120} {"current_steps": 66830, "total_steps": 67140, "loss": 0.4592, "lr": 3.267934790465721e-09, "epoch": 9.95382782246053, "percentage": 99.54, "elapsed_time": "4:37:30", "remaining_time": "0:01:17", "throughput": 2315.38, "total_tokens": 38553000} {"current_steps": 66835, "total_steps": 67140, "loss": 0.3022, "lr": 3.1637033806486414e-09, "epoch": 9.954572535001489, "percentage": 99.55, "elapsed_time": "4:37:31", "remaining_time": "0:01:15", "throughput": 2315.4, "total_tokens": 38556040} {"current_steps": 66840, "total_steps": 67140, "loss": 0.4241, "lr": 3.061161155398784e-09, "epoch": 9.955317247542448, "percentage": 99.55, "elapsed_time": "4:37:33", "remaining_time": "0:01:14", "throughput": 2315.41, "total_tokens": 38558792} {"current_steps": 66845, "total_steps": 67140, "loss": 0.4374, "lr": 2.9603081216467156e-09, "epoch": 9.956061960083408, "percentage": 99.56, "elapsed_time": "4:37:34", "remaining_time": "0:01:13", "throughput": 2315.42, "total_tokens": 38561512} {"current_steps": 66850, "total_steps": 67140, "loss": 0.5871, "lr": 2.8611442862036544e-09, "epoch": 9.956806672624367, "percentage": 99.57, "elapsed_time": "4:37:35", "remaining_time": "0:01:12", "throughput": 2315.44, "total_tokens": 38564424} {"current_steps": 66855, "total_steps": 67140, "loss": 0.739, "lr": 2.763669655775347e-09, "epoch": 9.957551385165326, "percentage": 99.58, "elapsed_time": "4:37:36", "remaining_time": "0:01:11", "throughput": 2315.44, "total_tokens": 38567016} {"current_steps": 66860, "total_steps": 67140, "loss": 0.642, "lr": 2.667884236945417e-09, "epoch": 9.958296097706285, "percentage": 99.58, "elapsed_time": "4:37:37", "remaining_time": "0:01:09", "throughput": 2315.46, "total_tokens": 38569832} {"current_steps": 66865, "total_steps": 67140, "loss": 0.6434, "lr": 2.5737880361892397e-09, "epoch": 9.959040810247245, "percentage": 99.59, "elapsed_time": "4:37:38", "remaining_time": "0:01:08", "throughput": 2315.47, "total_tokens": 38572776} {"current_steps": 66870, "total_steps": 67140, "loss": 0.7066, "lr": 2.4813810598628416e-09, "epoch": 9.959785522788204, "percentage": 99.6, "elapsed_time": "4:37:39", "remaining_time": "0:01:07", "throughput": 2315.5, "total_tokens": 38575944} {"current_steps": 66875, "total_steps": 67140, "loss": 0.463, "lr": 2.3906633142140035e-09, "epoch": 9.960530235329163, "percentage": 99.61, "elapsed_time": "4:37:40", "remaining_time": "0:01:06", "throughput": 2315.51, "total_tokens": 38578600} {"current_steps": 66880, "total_steps": 67140, "loss": 0.5937, "lr": 2.3016348053711558e-09, "epoch": 9.961274947870121, "percentage": 99.61, "elapsed_time": "4:37:42", "remaining_time": "0:01:04", "throughput": 2315.53, "total_tokens": 38581704} {"current_steps": 66885, "total_steps": 67140, "loss": 0.5944, "lr": 2.2142955393489316e-09, "epoch": 9.962019660411082, "percentage": 99.62, "elapsed_time": "4:37:43", "remaining_time": "0:01:03", "throughput": 2315.54, "total_tokens": 38584328} {"current_steps": 66890, "total_steps": 67140, "loss": 0.5442, "lr": 2.1286455220537182e-09, "epoch": 9.96276437295204, "percentage": 99.63, "elapsed_time": "4:37:44", "remaining_time": "0:01:02", "throughput": 2315.55, "total_tokens": 38587240} {"current_steps": 66895, "total_steps": 67140, "loss": 0.5124, "lr": 2.044684759269777e-09, "epoch": 9.963509085493, "percentage": 99.64, "elapsed_time": "4:37:45", "remaining_time": "0:01:01", "throughput": 2315.57, "total_tokens": 38590312} {"current_steps": 66900, "total_steps": 67140, "loss": 0.7075, "lr": 1.962413256670348e-09, "epoch": 9.964253798033958, "percentage": 99.64, "elapsed_time": "4:37:46", "remaining_time": "0:00:59", "throughput": 2315.59, "total_tokens": 38593096} {"current_steps": 66905, "total_steps": 67140, "loss": 0.6821, "lr": 1.881831019817648e-09, "epoch": 9.964998510574919, "percentage": 99.65, "elapsed_time": "4:37:47", "remaining_time": "0:00:58", "throughput": 2315.6, "total_tokens": 38595816} {"current_steps": 66910, "total_steps": 67140, "loss": 0.4235, "lr": 1.802938054154546e-09, "epoch": 9.965743223115878, "percentage": 99.66, "elapsed_time": "4:37:48", "remaining_time": "0:00:57", "throughput": 2315.6, "total_tokens": 38598568} {"current_steps": 66915, "total_steps": 67140, "loss": 0.4285, "lr": 1.7257343650156632e-09, "epoch": 9.966487935656836, "percentage": 99.66, "elapsed_time": "4:37:50", "remaining_time": "0:00:56", "throughput": 2315.62, "total_tokens": 38601384} {"current_steps": 66920, "total_steps": 67140, "loss": 0.5846, "lr": 1.6502199576134968e-09, "epoch": 9.967232648197795, "percentage": 99.67, "elapsed_time": "4:37:51", "remaining_time": "0:00:54", "throughput": 2315.63, "total_tokens": 38604232} {"current_steps": 66925, "total_steps": 67140, "loss": 0.4441, "lr": 1.576394837055073e-09, "epoch": 9.967977360738756, "percentage": 99.68, "elapsed_time": "4:37:52", "remaining_time": "0:00:53", "throughput": 2315.65, "total_tokens": 38607240} {"current_steps": 66930, "total_steps": 67140, "loss": 0.5825, "lr": 1.5042590083280683e-09, "epoch": 9.968722073279714, "percentage": 99.69, "elapsed_time": "4:37:53", "remaining_time": "0:00:52", "throughput": 2315.68, "total_tokens": 38610600} {"current_steps": 66935, "total_steps": 67140, "loss": 0.5089, "lr": 1.433812476306362e-09, "epoch": 9.969466785820673, "percentage": 99.69, "elapsed_time": "4:37:54", "remaining_time": "0:00:51", "throughput": 2315.7, "total_tokens": 38613512} {"current_steps": 66940, "total_steps": 67140, "loss": 0.53, "lr": 1.3650552457500353e-09, "epoch": 9.970211498361632, "percentage": 99.7, "elapsed_time": "4:37:55", "remaining_time": "0:00:49", "throughput": 2315.73, "total_tokens": 38616616} {"current_steps": 66945, "total_steps": 67140, "loss": 0.6202, "lr": 1.2979873213081473e-09, "epoch": 9.970956210902592, "percentage": 99.71, "elapsed_time": "4:37:56", "remaining_time": "0:00:48", "throughput": 2315.74, "total_tokens": 38619496} {"current_steps": 66950, "total_steps": 67140, "loss": 0.5649, "lr": 1.2326087075104076e-09, "epoch": 9.971700923443551, "percentage": 99.72, "elapsed_time": "4:37:58", "remaining_time": "0:00:47", "throughput": 2315.76, "total_tokens": 38622440} {"current_steps": 66955, "total_steps": 67140, "loss": 0.4527, "lr": 1.1689194087727285e-09, "epoch": 9.97244563598451, "percentage": 99.72, "elapsed_time": "4:37:59", "remaining_time": "0:00:46", "throughput": 2315.78, "total_tokens": 38625448} {"current_steps": 66960, "total_steps": 67140, "loss": 0.641, "lr": 1.1069194294055507e-09, "epoch": 9.973190348525469, "percentage": 99.73, "elapsed_time": "4:38:00", "remaining_time": "0:00:44", "throughput": 2315.8, "total_tokens": 38628360} {"current_steps": 66965, "total_steps": 67140, "loss": 0.4374, "lr": 1.0466087735916396e-09, "epoch": 9.973935061066427, "percentage": 99.74, "elapsed_time": "4:38:01", "remaining_time": "0:00:43", "throughput": 2315.8, "total_tokens": 38630824} {"current_steps": 66970, "total_steps": 67140, "loss": 0.5507, "lr": 9.879874454110648e-10, "epoch": 9.974679773607388, "percentage": 99.75, "elapsed_time": "4:38:02", "remaining_time": "0:00:42", "throughput": 2315.81, "total_tokens": 38633672} {"current_steps": 66975, "total_steps": 67140, "loss": 0.4008, "lr": 9.310554488245471e-10, "epoch": 9.975424486148347, "percentage": 99.75, "elapsed_time": "4:38:03", "remaining_time": "0:00:41", "throughput": 2315.82, "total_tokens": 38636328} {"current_steps": 66980, "total_steps": 67140, "loss": 0.7554, "lr": 8.758127876762335e-10, "epoch": 9.976169198689306, "percentage": 99.76, "elapsed_time": "4:38:04", "remaining_time": "0:00:39", "throughput": 2315.83, "total_tokens": 38639016} {"current_steps": 66985, "total_steps": 67140, "loss": 0.5607, "lr": 8.222594657020244e-10, "epoch": 9.976913911230266, "percentage": 99.77, "elapsed_time": "4:38:05", "remaining_time": "0:00:38", "throughput": 2315.85, "total_tokens": 38642056} {"current_steps": 66990, "total_steps": 67140, "loss": 0.5734, "lr": 7.703954865212471e-10, "epoch": 9.977658623771225, "percentage": 99.78, "elapsed_time": "4:38:07", "remaining_time": "0:00:37", "throughput": 2315.87, "total_tokens": 38645192} {"current_steps": 66995, "total_steps": 67140, "loss": 0.5982, "lr": 7.202208536366551e-10, "epoch": 9.978403336312184, "percentage": 99.78, "elapsed_time": "4:38:08", "remaining_time": "0:00:36", "throughput": 2315.89, "total_tokens": 38648200} {"current_steps": 67000, "total_steps": 67140, "loss": 0.6234, "lr": 6.717355704427553e-10, "epoch": 9.979148048853142, "percentage": 99.79, "elapsed_time": "4:38:09", "remaining_time": "0:00:34", "throughput": 2315.91, "total_tokens": 38651112} {"current_steps": 67005, "total_steps": 67140, "loss": 0.7587, "lr": 6.249396402091545e-10, "epoch": 9.979892761394101, "percentage": 99.8, "elapsed_time": "4:38:10", "remaining_time": "0:00:33", "throughput": 2315.93, "total_tokens": 38654216} {"current_steps": 67010, "total_steps": 67140, "loss": 0.6765, "lr": 5.79833066102764e-10, "epoch": 9.980637473935062, "percentage": 99.81, "elapsed_time": "4:38:11", "remaining_time": "0:00:32", "throughput": 2315.96, "total_tokens": 38657448} {"current_steps": 67015, "total_steps": 67140, "loss": 0.6406, "lr": 5.364158511739215e-10, "epoch": 9.98138218647602, "percentage": 99.81, "elapsed_time": "4:38:12", "remaining_time": "0:00:31", "throughput": 2315.98, "total_tokens": 38660392} {"current_steps": 67020, "total_steps": 67140, "loss": 0.5955, "lr": 4.946879983508401e-10, "epoch": 9.98212689901698, "percentage": 99.82, "elapsed_time": "4:38:13", "remaining_time": "0:00:29", "throughput": 2315.99, "total_tokens": 38663176} {"current_steps": 67025, "total_steps": 67140, "loss": 0.6247, "lr": 4.5464951045626204e-10, "epoch": 9.982871611557938, "percentage": 99.83, "elapsed_time": "4:38:15", "remaining_time": "0:00:28", "throughput": 2316.01, "total_tokens": 38666088} {"current_steps": 67030, "total_steps": 67140, "loss": 0.6563, "lr": 4.163003901963558e-10, "epoch": 9.983616324098898, "percentage": 99.84, "elapsed_time": "4:38:16", "remaining_time": "0:00:27", "throughput": 2316.02, "total_tokens": 38668840} {"current_steps": 67035, "total_steps": 67140, "loss": 0.647, "lr": 3.796406401634922e-10, "epoch": 9.984361036639857, "percentage": 99.84, "elapsed_time": "4:38:17", "remaining_time": "0:00:26", "throughput": 2316.03, "total_tokens": 38671592} {"current_steps": 67040, "total_steps": 67140, "loss": 0.4424, "lr": 3.4467026283069305e-10, "epoch": 9.985105749180816, "percentage": 99.85, "elapsed_time": "4:38:18", "remaining_time": "0:00:24", "throughput": 2316.05, "total_tokens": 38674472} {"current_steps": 67045, "total_steps": 67140, "loss": 0.5254, "lr": 3.1138926056550886e-10, "epoch": 9.985850461721775, "percentage": 99.86, "elapsed_time": "4:38:19", "remaining_time": "0:00:23", "throughput": 2316.06, "total_tokens": 38677480} {"current_steps": 67050, "total_steps": 67140, "loss": 0.4533, "lr": 2.7979763561614137e-10, "epoch": 9.986595174262735, "percentage": 99.87, "elapsed_time": "4:38:20", "remaining_time": "0:00:22", "throughput": 2316.09, "total_tokens": 38680520} {"current_steps": 67055, "total_steps": 67140, "loss": 0.6401, "lr": 2.498953901142187e-10, "epoch": 9.987339886803694, "percentage": 99.87, "elapsed_time": "4:38:21", "remaining_time": "0:00:21", "throughput": 2316.11, "total_tokens": 38683496} {"current_steps": 67060, "total_steps": 67140, "loss": 0.6181, "lr": 2.216825260858979e-10, "epoch": 9.988084599344653, "percentage": 99.88, "elapsed_time": "4:38:23", "remaining_time": "0:00:19", "throughput": 2316.11, "total_tokens": 38686216} {"current_steps": 67065, "total_steps": 67140, "loss": 0.4357, "lr": 1.951590454324359e-10, "epoch": 9.988829311885612, "percentage": 99.89, "elapsed_time": "4:38:24", "remaining_time": "0:00:18", "throughput": 2316.13, "total_tokens": 38689032} {"current_steps": 67070, "total_steps": 67140, "loss": 0.5348, "lr": 1.7032494994961846e-10, "epoch": 9.989574024426572, "percentage": 99.9, "elapsed_time": "4:38:25", "remaining_time": "0:00:17", "throughput": 2316.15, "total_tokens": 38692040} {"current_steps": 67075, "total_steps": 67140, "loss": 0.7054, "lr": 1.4718024131110674e-10, "epoch": 9.99031873696753, "percentage": 99.9, "elapsed_time": "4:38:26", "remaining_time": "0:00:16", "throughput": 2316.16, "total_tokens": 38695016} {"current_steps": 67080, "total_steps": 67140, "loss": 0.6325, "lr": 1.2572492108786638e-10, "epoch": 9.99106344950849, "percentage": 99.91, "elapsed_time": "4:38:27", "remaining_time": "0:00:14", "throughput": 2316.17, "total_tokens": 38697736} {"current_steps": 67085, "total_steps": 67140, "loss": 0.638, "lr": 1.0595899072318727e-10, "epoch": 9.991808162049448, "percentage": 99.92, "elapsed_time": "4:38:28", "remaining_time": "0:00:13", "throughput": 2316.21, "total_tokens": 38701128} {"current_steps": 67090, "total_steps": 67140, "loss": 0.5592, "lr": 8.788245155766372e-11, "epoch": 9.992552874590409, "percentage": 99.93, "elapsed_time": "4:38:29", "remaining_time": "0:00:12", "throughput": 2316.21, "total_tokens": 38703880} {"current_steps": 67095, "total_steps": 67140, "loss": 0.5565, "lr": 7.149530480976552e-11, "epoch": 9.993297587131368, "percentage": 99.93, "elapsed_time": "4:38:31", "remaining_time": "0:00:11", "throughput": 2316.24, "total_tokens": 38707080} {"current_steps": 67100, "total_steps": 67140, "loss": 0.5788, "lr": 5.679755158971567e-11, "epoch": 9.994042299672326, "percentage": 99.94, "elapsed_time": "4:38:32", "remaining_time": "0:00:09", "throughput": 2316.25, "total_tokens": 38709864} {"current_steps": 67105, "total_steps": 67140, "loss": 0.7534, "lr": 4.3789192888388233e-11, "epoch": 9.994787012213285, "percentage": 99.95, "elapsed_time": "4:38:33", "remaining_time": "0:00:08", "throughput": 2316.26, "total_tokens": 38712616} {"current_steps": 67110, "total_steps": 67140, "loss": 0.3905, "lr": 3.247022958285939e-11, "epoch": 9.995531724754246, "percentage": 99.96, "elapsed_time": "4:38:34", "remaining_time": "0:00:07", "throughput": 2316.27, "total_tokens": 38715240} {"current_steps": 67115, "total_steps": 67140, "loss": 0.3357, "lr": 2.2840662441958594e-11, "epoch": 9.996276437295204, "percentage": 99.96, "elapsed_time": "4:38:35", "remaining_time": "0:00:06", "throughput": 2316.27, "total_tokens": 38717896} {"current_steps": 67120, "total_steps": 67140, "loss": 0.6939, "lr": 1.490049211516631e-11, "epoch": 9.997021149836163, "percentage": 99.97, "elapsed_time": "4:38:36", "remaining_time": "0:00:04", "throughput": 2316.3, "total_tokens": 38721096} {"current_steps": 67125, "total_steps": 67140, "loss": 0.5483, "lr": 8.649719140940703e-12, "epoch": 9.997765862377122, "percentage": 99.98, "elapsed_time": "4:38:37", "remaining_time": "0:00:03", "throughput": 2316.33, "total_tokens": 38724328} {"current_steps": 67130, "total_steps": 67140, "loss": 0.5822, "lr": 4.088343935615413e-12, "epoch": 9.998510574918082, "percentage": 99.99, "elapsed_time": "4:38:39", "remaining_time": "0:00:02", "throughput": 2316.34, "total_tokens": 38727112} {"current_steps": 67135, "total_steps": 67140, "loss": 0.5863, "lr": 1.2163668156039976e-12, "epoch": 9.999255287459041, "percentage": 99.99, "elapsed_time": "4:38:40", "remaining_time": "0:00:01", "throughput": 2316.35, "total_tokens": 38729832} {"current_steps": 67140, "total_steps": 67140, "loss": 0.6976, "lr": 3.378796686881458e-14, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "4:38:41", "remaining_time": "0:00:00", "throughput": 2316.34, "total_tokens": 38732208} {"current_steps": 67140, "total_steps": 67140, "eval_loss": 0.6837868094444275, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "4:39:55", "remaining_time": "0:00:00", "throughput": 2306.14, "total_tokens": 38732208} {"current_steps": 67140, "total_steps": 67140, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "4:39:57", "remaining_time": "0:00:00", "throughput": 2305.89, "total_tokens": 38732208}