{"current_steps": 1, "total_steps": 1918, "loss": 0.4124, "learning_rate": 5.208333333333333e-08, "epoch": 0.0005212745161920897, "percentage": 0.05, "elapsed_time": "0:00:14", "remaining_time": "7:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 1918, "loss": 0.4261, "learning_rate": 1.0416666666666667e-07, "epoch": 0.0010425490323841794, "percentage": 0.1, "elapsed_time": "0:00:24", "remaining_time": "6:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 1918, "loss": 0.4092, "learning_rate": 1.5625e-07, "epoch": 0.001563823548576269, "percentage": 0.16, "elapsed_time": "0:00:33", "remaining_time": "6:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 1918, "loss": 0.3987, "learning_rate": 2.0833333333333333e-07, "epoch": 0.0020850980647683587, "percentage": 0.21, "elapsed_time": "0:00:44", "remaining_time": "5:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 1918, "loss": 0.4086, "learning_rate": 2.604166666666667e-07, "epoch": 0.002606372580960448, "percentage": 0.26, "elapsed_time": "0:00:54", "remaining_time": "5:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 1918, "loss": 0.3814, "learning_rate": 3.125e-07, "epoch": 0.003127647097152538, "percentage": 0.31, "elapsed_time": "0:01:04", "remaining_time": "5:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 1918, "loss": 0.3795, "learning_rate": 3.6458333333333337e-07, "epoch": 0.0036489216133446275, "percentage": 0.36, "elapsed_time": "0:01:14", "remaining_time": "5:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 1918, "loss": 0.4008, "learning_rate": 4.1666666666666667e-07, "epoch": 0.0041701961295367174, "percentage": 0.42, "elapsed_time": "0:01:25", "remaining_time": "5:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 1918, "loss": 0.4106, "learning_rate": 4.6875000000000006e-07, "epoch": 0.004691470645728807, "percentage": 0.47, "elapsed_time": "0:01:35", "remaining_time": "5:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1918, "loss": 0.3986, "learning_rate": 5.208333333333334e-07, "epoch": 0.005212745161920896, "percentage": 0.52, "elapsed_time": "0:01:45", "remaining_time": "5:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 1918, "loss": 0.4031, "learning_rate": 5.729166666666667e-07, "epoch": 0.005734019678112986, "percentage": 0.57, "elapsed_time": "0:01:55", "remaining_time": "5:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 1918, "loss": 0.3776, "learning_rate": 6.25e-07, "epoch": 0.006255294194305076, "percentage": 0.63, "elapsed_time": "0:02:05", "remaining_time": "5:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 1918, "loss": 0.3865, "learning_rate": 6.770833333333333e-07, "epoch": 0.006776568710497166, "percentage": 0.68, "elapsed_time": "0:02:15", "remaining_time": "5:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 1918, "loss": 0.3748, "learning_rate": 7.291666666666667e-07, "epoch": 0.007297843226689255, "percentage": 0.73, "elapsed_time": "0:02:27", "remaining_time": "5:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1918, "loss": 0.3665, "learning_rate": 7.8125e-07, "epoch": 0.007819117742881345, "percentage": 0.78, "elapsed_time": "0:02:37", "remaining_time": "5:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 1918, "loss": 0.3597, "learning_rate": 8.333333333333333e-07, "epoch": 0.008340392259073435, "percentage": 0.83, "elapsed_time": "0:02:48", "remaining_time": "5:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 1918, "loss": 0.3735, "learning_rate": 8.854166666666668e-07, "epoch": 0.008861666775265524, "percentage": 0.89, "elapsed_time": "0:03:00", "remaining_time": "5:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 1918, "loss": 0.3503, "learning_rate": 9.375000000000001e-07, "epoch": 0.009382941291457614, "percentage": 0.94, "elapsed_time": "0:03:10", "remaining_time": "5:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 1918, "loss": 0.3331, "learning_rate": 9.895833333333333e-07, "epoch": 0.009904215807649703, "percentage": 0.99, "elapsed_time": "0:03:19", "remaining_time": "5:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1918, "loss": 0.3194, "learning_rate": 1.0416666666666667e-06, "epoch": 0.010425490323841793, "percentage": 1.04, "elapsed_time": "0:03:30", "remaining_time": "5:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 1918, "loss": 0.3059, "learning_rate": 1.0937500000000001e-06, "epoch": 0.010946764840033882, "percentage": 1.09, "elapsed_time": "0:03:39", "remaining_time": "5:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 1918, "loss": 0.3251, "learning_rate": 1.1458333333333333e-06, "epoch": 0.011468039356225972, "percentage": 1.15, "elapsed_time": "0:03:49", "remaining_time": "5:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 1918, "loss": 0.3095, "learning_rate": 1.197916666666667e-06, "epoch": 0.011989313872418063, "percentage": 1.2, "elapsed_time": "0:03:59", "remaining_time": "5:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 1918, "loss": 0.3193, "learning_rate": 1.25e-06, "epoch": 0.012510588388610152, "percentage": 1.25, "elapsed_time": "0:04:09", "remaining_time": "5:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1918, "loss": 0.3319, "learning_rate": 1.3020833333333335e-06, "epoch": 0.013031862904802242, "percentage": 1.3, "elapsed_time": "0:04:20", "remaining_time": "5:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 1918, "loss": 0.2944, "learning_rate": 1.3541666666666667e-06, "epoch": 0.013553137420994331, "percentage": 1.36, "elapsed_time": "0:04:31", "remaining_time": "5:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 1918, "loss": 0.3041, "learning_rate": 1.40625e-06, "epoch": 0.01407441193718642, "percentage": 1.41, "elapsed_time": "0:04:40", "remaining_time": "5:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 1918, "loss": 0.3063, "learning_rate": 1.4583333333333335e-06, "epoch": 0.01459568645337851, "percentage": 1.46, "elapsed_time": "0:04:51", "remaining_time": "5:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 1918, "loss": 0.3091, "learning_rate": 1.5104166666666667e-06, "epoch": 0.0151169609695706, "percentage": 1.51, "elapsed_time": "0:05:02", "remaining_time": "5:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1918, "loss": 0.2879, "learning_rate": 1.5625e-06, "epoch": 0.01563823548576269, "percentage": 1.56, "elapsed_time": "0:05:13", "remaining_time": "5:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 1918, "loss": 0.3016, "learning_rate": 1.6145833333333335e-06, "epoch": 0.01615951000195478, "percentage": 1.62, "elapsed_time": "0:05:23", "remaining_time": "5:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 1918, "loss": 0.3042, "learning_rate": 1.6666666666666667e-06, "epoch": 0.01668078451814687, "percentage": 1.67, "elapsed_time": "0:05:34", "remaining_time": "5:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 1918, "loss": 0.3048, "learning_rate": 1.71875e-06, "epoch": 0.017202059034338957, "percentage": 1.72, "elapsed_time": "0:05:45", "remaining_time": "5:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 1918, "loss": 0.3043, "learning_rate": 1.7708333333333337e-06, "epoch": 0.01772333355053105, "percentage": 1.77, "elapsed_time": "0:05:55", "remaining_time": "5:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1918, "loss": 0.2924, "learning_rate": 1.8229166666666666e-06, "epoch": 0.018244608066723136, "percentage": 1.82, "elapsed_time": "0:06:06", "remaining_time": "5:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 1918, "loss": 0.2771, "learning_rate": 1.8750000000000003e-06, "epoch": 0.018765882582915228, "percentage": 1.88, "elapsed_time": "0:06:16", "remaining_time": "5:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 1918, "loss": 0.2838, "learning_rate": 1.9270833333333334e-06, "epoch": 0.01928715709910732, "percentage": 1.93, "elapsed_time": "0:06:28", "remaining_time": "5:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 1918, "loss": 0.2941, "learning_rate": 1.9791666666666666e-06, "epoch": 0.019808431615299407, "percentage": 1.98, "elapsed_time": "0:06:38", "remaining_time": "5:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 1918, "loss": 0.2918, "learning_rate": 2.0312500000000002e-06, "epoch": 0.020329706131491498, "percentage": 2.03, "elapsed_time": "0:06:48", "remaining_time": "5:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1918, "loss": 0.2762, "learning_rate": 2.0833333333333334e-06, "epoch": 0.020850980647683585, "percentage": 2.09, "elapsed_time": "0:06:58", "remaining_time": "5:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 1918, "loss": 0.2657, "learning_rate": 2.1354166666666666e-06, "epoch": 0.021372255163875677, "percentage": 2.14, "elapsed_time": "0:07:09", "remaining_time": "5:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 1918, "loss": 0.2897, "learning_rate": 2.1875000000000002e-06, "epoch": 0.021893529680067764, "percentage": 2.19, "elapsed_time": "0:07:21", "remaining_time": "5:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 1918, "loss": 0.2821, "learning_rate": 2.2395833333333334e-06, "epoch": 0.022414804196259856, "percentage": 2.24, "elapsed_time": "0:07:32", "remaining_time": "5:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 1918, "loss": 0.2599, "learning_rate": 2.2916666666666666e-06, "epoch": 0.022936078712451943, "percentage": 2.29, "elapsed_time": "0:07:42", "remaining_time": "5:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1918, "loss": 0.2745, "learning_rate": 2.3437500000000002e-06, "epoch": 0.023457353228644034, "percentage": 2.35, "elapsed_time": "0:07:52", "remaining_time": "5:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 1918, "loss": 0.2626, "learning_rate": 2.395833333333334e-06, "epoch": 0.023978627744836126, "percentage": 2.4, "elapsed_time": "0:08:02", "remaining_time": "5:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 1918, "loss": 0.2699, "learning_rate": 2.4479166666666666e-06, "epoch": 0.024499902261028213, "percentage": 2.45, "elapsed_time": "0:08:12", "remaining_time": "5:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 1918, "loss": 0.2764, "learning_rate": 2.5e-06, "epoch": 0.025021176777220305, "percentage": 2.5, "elapsed_time": "0:08:22", "remaining_time": "5:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 1918, "loss": 0.2774, "learning_rate": 2.5520833333333334e-06, "epoch": 0.025542451293412392, "percentage": 2.55, "elapsed_time": "0:08:33", "remaining_time": "5:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1918, "loss": 0.2763, "learning_rate": 2.604166666666667e-06, "epoch": 0.026063725809604484, "percentage": 2.61, "elapsed_time": "0:08:44", "remaining_time": "5:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 1918, "loss": 0.2586, "learning_rate": 2.65625e-06, "epoch": 0.02658500032579657, "percentage": 2.66, "elapsed_time": "0:08:55", "remaining_time": "5:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 1918, "loss": 0.273, "learning_rate": 2.7083333333333334e-06, "epoch": 0.027106274841988662, "percentage": 2.71, "elapsed_time": "0:09:05", "remaining_time": "5:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 1918, "loss": 0.2633, "learning_rate": 2.760416666666667e-06, "epoch": 0.027627549358180754, "percentage": 2.76, "elapsed_time": "0:09:16", "remaining_time": "5:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 1918, "loss": 0.2713, "learning_rate": 2.8125e-06, "epoch": 0.02814882387437284, "percentage": 2.82, "elapsed_time": "0:09:26", "remaining_time": "5:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1918, "loss": 0.2675, "learning_rate": 2.8645833333333334e-06, "epoch": 0.028670098390564933, "percentage": 2.87, "elapsed_time": "0:09:36", "remaining_time": "5:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 1918, "loss": 0.26, "learning_rate": 2.916666666666667e-06, "epoch": 0.02919137290675702, "percentage": 2.92, "elapsed_time": "0:09:46", "remaining_time": "5:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 1918, "loss": 0.2623, "learning_rate": 2.96875e-06, "epoch": 0.02971264742294911, "percentage": 2.97, "elapsed_time": "0:09:57", "remaining_time": "5:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 1918, "loss": 0.2709, "learning_rate": 3.0208333333333334e-06, "epoch": 0.0302339219391412, "percentage": 3.02, "elapsed_time": "0:10:08", "remaining_time": "5:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 1918, "loss": 0.2519, "learning_rate": 3.072916666666667e-06, "epoch": 0.03075519645533329, "percentage": 3.08, "elapsed_time": "0:10:18", "remaining_time": "5:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1918, "loss": 0.2683, "learning_rate": 3.125e-06, "epoch": 0.03127647097152538, "percentage": 3.13, "elapsed_time": "0:10:28", "remaining_time": "5:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 1918, "loss": 0.2486, "learning_rate": 3.1770833333333333e-06, "epoch": 0.031797745487717466, "percentage": 3.18, "elapsed_time": "0:10:39", "remaining_time": "5:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 1918, "loss": 0.2589, "learning_rate": 3.229166666666667e-06, "epoch": 0.03231902000390956, "percentage": 3.23, "elapsed_time": "0:10:50", "remaining_time": "5:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 1918, "loss": 0.2583, "learning_rate": 3.28125e-06, "epoch": 0.03284029452010165, "percentage": 3.28, "elapsed_time": "0:11:00", "remaining_time": "5:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 1918, "loss": 0.2596, "learning_rate": 3.3333333333333333e-06, "epoch": 0.03336156903629374, "percentage": 3.34, "elapsed_time": "0:11:10", "remaining_time": "5:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1918, "loss": 0.2605, "learning_rate": 3.385416666666667e-06, "epoch": 0.03388284355248583, "percentage": 3.39, "elapsed_time": "0:11:20", "remaining_time": "5:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 1918, "loss": 0.2477, "learning_rate": 3.4375e-06, "epoch": 0.034404118068677915, "percentage": 3.44, "elapsed_time": "0:11:30", "remaining_time": "5:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 1918, "loss": 0.2446, "learning_rate": 3.4895833333333333e-06, "epoch": 0.034925392584870006, "percentage": 3.49, "elapsed_time": "0:11:40", "remaining_time": "5:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 1918, "loss": 0.2478, "learning_rate": 3.5416666666666673e-06, "epoch": 0.0354466671010621, "percentage": 3.55, "elapsed_time": "0:11:51", "remaining_time": "5:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 1918, "loss": 0.2619, "learning_rate": 3.59375e-06, "epoch": 0.03596794161725419, "percentage": 3.6, "elapsed_time": "0:12:01", "remaining_time": "5:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1918, "loss": 0.2458, "learning_rate": 3.6458333333333333e-06, "epoch": 0.03648921613344627, "percentage": 3.65, "elapsed_time": "0:12:11", "remaining_time": "5:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 1918, "loss": 0.2457, "learning_rate": 3.6979166666666673e-06, "epoch": 0.037010490649638364, "percentage": 3.7, "elapsed_time": "0:12:22", "remaining_time": "5:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 1918, "loss": 0.2496, "learning_rate": 3.7500000000000005e-06, "epoch": 0.037531765165830455, "percentage": 3.75, "elapsed_time": "0:12:32", "remaining_time": "5:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 1918, "loss": 0.2512, "learning_rate": 3.8020833333333333e-06, "epoch": 0.038053039682022546, "percentage": 3.81, "elapsed_time": "0:12:42", "remaining_time": "5:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 1918, "loss": 0.2219, "learning_rate": 3.854166666666667e-06, "epoch": 0.03857431419821464, "percentage": 3.86, "elapsed_time": "0:12:52", "remaining_time": "5:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1918, "loss": 0.2579, "learning_rate": 3.90625e-06, "epoch": 0.03909558871440672, "percentage": 3.91, "elapsed_time": "0:13:02", "remaining_time": "5:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 1918, "loss": 0.2447, "learning_rate": 3.958333333333333e-06, "epoch": 0.03961686323059881, "percentage": 3.96, "elapsed_time": "0:13:11", "remaining_time": "5:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 1918, "loss": 0.2575, "learning_rate": 4.010416666666667e-06, "epoch": 0.040138137746790904, "percentage": 4.01, "elapsed_time": "0:13:21", "remaining_time": "5:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 1918, "loss": 0.2524, "learning_rate": 4.0625000000000005e-06, "epoch": 0.040659412262982995, "percentage": 4.07, "elapsed_time": "0:13:33", "remaining_time": "5:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 1918, "loss": 0.2534, "learning_rate": 4.114583333333334e-06, "epoch": 0.04118068677917508, "percentage": 4.12, "elapsed_time": "0:13:44", "remaining_time": "5:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1918, "loss": 0.2434, "learning_rate": 4.166666666666667e-06, "epoch": 0.04170196129536717, "percentage": 4.17, "elapsed_time": "0:13:54", "remaining_time": "5:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 1918, "loss": 0.2224, "learning_rate": 4.21875e-06, "epoch": 0.04222323581155926, "percentage": 4.22, "elapsed_time": "0:14:04", "remaining_time": "5:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 1918, "loss": 0.2646, "learning_rate": 4.270833333333333e-06, "epoch": 0.04274451032775135, "percentage": 4.28, "elapsed_time": "0:14:15", "remaining_time": "5:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 1918, "loss": 0.2613, "learning_rate": 4.322916666666667e-06, "epoch": 0.043265784843943444, "percentage": 4.33, "elapsed_time": "0:14:27", "remaining_time": "5:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 1918, "loss": 0.2616, "learning_rate": 4.3750000000000005e-06, "epoch": 0.04378705936013553, "percentage": 4.38, "elapsed_time": "0:14:36", "remaining_time": "5:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1918, "loss": 0.241, "learning_rate": 4.427083333333334e-06, "epoch": 0.04430833387632762, "percentage": 4.43, "elapsed_time": "0:14:46", "remaining_time": "5:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 1918, "loss": 0.2664, "learning_rate": 4.479166666666667e-06, "epoch": 0.04482960839251971, "percentage": 4.48, "elapsed_time": "0:14:55", "remaining_time": "5:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 1918, "loss": 0.2364, "learning_rate": 4.53125e-06, "epoch": 0.0453508829087118, "percentage": 4.54, "elapsed_time": "0:15:06", "remaining_time": "5:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 1918, "loss": 0.235, "learning_rate": 4.583333333333333e-06, "epoch": 0.04587215742490389, "percentage": 4.59, "elapsed_time": "0:15:15", "remaining_time": "5:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 1918, "loss": 0.2502, "learning_rate": 4.635416666666667e-06, "epoch": 0.04639343194109598, "percentage": 4.64, "elapsed_time": "0:15:26", "remaining_time": "5:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1918, "loss": 0.2591, "learning_rate": 4.6875000000000004e-06, "epoch": 0.04691470645728807, "percentage": 4.69, "elapsed_time": "0:15:35", "remaining_time": "5:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 1918, "loss": 0.2503, "learning_rate": 4.739583333333334e-06, "epoch": 0.04743598097348016, "percentage": 4.74, "elapsed_time": "0:15:47", "remaining_time": "5:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 1918, "loss": 0.2345, "learning_rate": 4.791666666666668e-06, "epoch": 0.04795725548967225, "percentage": 4.8, "elapsed_time": "0:15:58", "remaining_time": "5:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 1918, "loss": 0.2258, "learning_rate": 4.84375e-06, "epoch": 0.048478530005864336, "percentage": 4.85, "elapsed_time": "0:16:08", "remaining_time": "5:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 1918, "loss": 0.2469, "learning_rate": 4.895833333333333e-06, "epoch": 0.04899980452205643, "percentage": 4.9, "elapsed_time": "0:16:19", "remaining_time": "5:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1918, "loss": 0.2595, "learning_rate": 4.947916666666667e-06, "epoch": 0.04952107903824852, "percentage": 4.95, "elapsed_time": "0:16:28", "remaining_time": "5:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 1918, "loss": 0.2357, "learning_rate": 5e-06, "epoch": 0.05004235355444061, "percentage": 5.01, "elapsed_time": "0:16:39", "remaining_time": "5:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 1918, "loss": 0.2617, "learning_rate": 4.999996283681687e-06, "epoch": 0.050563628070632693, "percentage": 5.06, "elapsed_time": "0:16:49", "remaining_time": "5:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 1918, "loss": 0.2476, "learning_rate": 4.9999851347377946e-06, "epoch": 0.051084902586824785, "percentage": 5.11, "elapsed_time": "0:16:59", "remaining_time": "5:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 1918, "loss": 0.2392, "learning_rate": 4.99996655320147e-06, "epoch": 0.051606177103016876, "percentage": 5.16, "elapsed_time": "0:17:10", "remaining_time": "5:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1918, "loss": 0.2608, "learning_rate": 4.999940539127958e-06, "epoch": 0.05212745161920897, "percentage": 5.21, "elapsed_time": "0:17:21", "remaining_time": "5:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 1918, "loss": 0.2442, "learning_rate": 4.999907092594598e-06, "epoch": 0.05264872613540106, "percentage": 5.27, "elapsed_time": "0:17:31", "remaining_time": "5:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 1918, "loss": 0.2226, "learning_rate": 4.99986621370083e-06, "epoch": 0.05317000065159314, "percentage": 5.32, "elapsed_time": "0:17:42", "remaining_time": "5:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 1918, "loss": 0.2432, "learning_rate": 4.99981790256819e-06, "epoch": 0.053691275167785234, "percentage": 5.37, "elapsed_time": "0:17:52", "remaining_time": "5:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 1918, "loss": 0.2283, "learning_rate": 4.999762159340305e-06, "epoch": 0.054212549683977325, "percentage": 5.42, "elapsed_time": "0:18:02", "remaining_time": "5:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1918, "loss": 0.218, "learning_rate": 4.999698984182909e-06, "epoch": 0.054733824200169416, "percentage": 5.47, "elapsed_time": "0:18:11", "remaining_time": "5:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 1918, "loss": 0.2508, "learning_rate": 4.999628377283821e-06, "epoch": 0.05525509871636151, "percentage": 5.53, "elapsed_time": "0:18:22", "remaining_time": "5:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 1918, "loss": 0.227, "learning_rate": 4.99955033885296e-06, "epoch": 0.05577637323255359, "percentage": 5.58, "elapsed_time": "0:18:31", "remaining_time": "5:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 1918, "loss": 0.2654, "learning_rate": 4.999464869122339e-06, "epoch": 0.05629764774874568, "percentage": 5.63, "elapsed_time": "0:18:42", "remaining_time": "5:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 1918, "loss": 0.2559, "learning_rate": 4.999371968346064e-06, "epoch": 0.056818922264937774, "percentage": 5.68, "elapsed_time": "0:18:52", "remaining_time": "5:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1918, "loss": 0.2453, "learning_rate": 4.999271636800334e-06, "epoch": 0.057340196781129865, "percentage": 5.74, "elapsed_time": "0:19:02", "remaining_time": "5:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 1918, "loss": 0.2546, "learning_rate": 4.999163874783441e-06, "epoch": 0.05786147129732195, "percentage": 5.79, "elapsed_time": "0:19:12", "remaining_time": "5:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 1918, "loss": 0.2555, "learning_rate": 4.999048682615766e-06, "epoch": 0.05838274581351404, "percentage": 5.84, "elapsed_time": "0:19:23", "remaining_time": "5:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 1918, "loss": 0.2449, "learning_rate": 4.9989260606397816e-06, "epoch": 0.05890402032970613, "percentage": 5.89, "elapsed_time": "0:19:33", "remaining_time": "5:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 1918, "loss": 0.255, "learning_rate": 4.998796009220051e-06, "epoch": 0.05942529484589822, "percentage": 5.94, "elapsed_time": "0:19:44", "remaining_time": "5:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1918, "loss": 0.2372, "learning_rate": 4.9986585287432236e-06, "epoch": 0.059946569362090314, "percentage": 6.0, "elapsed_time": "0:19:54", "remaining_time": "5:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 1918, "loss": 0.2442, "learning_rate": 4.998513619618036e-06, "epoch": 0.0604678438782824, "percentage": 6.05, "elapsed_time": "0:20:04", "remaining_time": "5:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 1918, "loss": 0.2281, "learning_rate": 4.998361282275311e-06, "epoch": 0.06098911839447449, "percentage": 6.1, "elapsed_time": "0:20:15", "remaining_time": "5:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 1918, "loss": 0.2554, "learning_rate": 4.998201517167956e-06, "epoch": 0.06151039291066658, "percentage": 6.15, "elapsed_time": "0:20:26", "remaining_time": "5:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 1918, "loss": 0.2334, "learning_rate": 4.998034324770962e-06, "epoch": 0.06203166742685867, "percentage": 6.2, "elapsed_time": "0:20:38", "remaining_time": "5:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1918, "loss": 0.2407, "learning_rate": 4.997859705581399e-06, "epoch": 0.06255294194305076, "percentage": 6.26, "elapsed_time": "0:20:48", "remaining_time": "5:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 1918, "loss": 0.23, "learning_rate": 4.997677660118423e-06, "epoch": 0.06307421645924285, "percentage": 6.31, "elapsed_time": "0:20:59", "remaining_time": "5:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 1918, "loss": 0.2369, "learning_rate": 4.997488188923262e-06, "epoch": 0.06359549097543493, "percentage": 6.36, "elapsed_time": "0:21:09", "remaining_time": "5:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 1918, "loss": 0.2322, "learning_rate": 4.9972912925592245e-06, "epoch": 0.06411676549162702, "percentage": 6.41, "elapsed_time": "0:21:20", "remaining_time": "5:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 1918, "loss": 0.2254, "learning_rate": 4.997086971611696e-06, "epoch": 0.06463804000781911, "percentage": 6.47, "elapsed_time": "0:21:31", "remaining_time": "5:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1918, "loss": 0.2322, "learning_rate": 4.996875226688133e-06, "epoch": 0.0651593145240112, "percentage": 6.52, "elapsed_time": "0:21:41", "remaining_time": "5:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 1918, "loss": 0.2511, "learning_rate": 4.996656058418064e-06, "epoch": 0.0656805890402033, "percentage": 6.57, "elapsed_time": "0:21:51", "remaining_time": "5:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 1918, "loss": 0.2359, "learning_rate": 4.996429467453088e-06, "epoch": 0.06620186355639539, "percentage": 6.62, "elapsed_time": "0:22:01", "remaining_time": "5:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 1918, "loss": 0.2176, "learning_rate": 4.996195454466873e-06, "epoch": 0.06672313807258748, "percentage": 6.67, "elapsed_time": "0:22:11", "remaining_time": "5:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 1918, "loss": 0.2409, "learning_rate": 4.995954020155153e-06, "epoch": 0.06724441258877957, "percentage": 6.73, "elapsed_time": "0:22:22", "remaining_time": "5:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1918, "loss": 0.2472, "learning_rate": 4.995705165235726e-06, "epoch": 0.06776568710497166, "percentage": 6.78, "elapsed_time": "0:22:32", "remaining_time": "5:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 1918, "loss": 0.2446, "learning_rate": 4.995448890448449e-06, "epoch": 0.06828696162116374, "percentage": 6.83, "elapsed_time": "0:22:43", "remaining_time": "5:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 1918, "loss": 0.2364, "learning_rate": 4.995185196555242e-06, "epoch": 0.06880823613735583, "percentage": 6.88, "elapsed_time": "0:22:52", "remaining_time": "5:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 1918, "loss": 0.2469, "learning_rate": 4.994914084340082e-06, "epoch": 0.06932951065354792, "percentage": 6.93, "elapsed_time": "0:23:03", "remaining_time": "5:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 1918, "loss": 0.2286, "learning_rate": 4.994635554608999e-06, "epoch": 0.06985078516974001, "percentage": 6.99, "elapsed_time": "0:23:16", "remaining_time": "5:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1918, "loss": 0.24, "learning_rate": 4.994349608190079e-06, "epoch": 0.0703720596859321, "percentage": 7.04, "elapsed_time": "0:23:26", "remaining_time": "5:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 1918, "loss": 0.2393, "learning_rate": 4.994056245933454e-06, "epoch": 0.0708933342021242, "percentage": 7.09, "elapsed_time": "0:23:36", "remaining_time": "5:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 1918, "loss": 0.2446, "learning_rate": 4.993755468711308e-06, "epoch": 0.07141460871831629, "percentage": 7.14, "elapsed_time": "0:23:46", "remaining_time": "5:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 1918, "loss": 0.2269, "learning_rate": 4.993447277417867e-06, "epoch": 0.07193588323450838, "percentage": 7.19, "elapsed_time": "0:23:56", "remaining_time": "5:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 1918, "loss": 0.2484, "learning_rate": 4.993131672969402e-06, "epoch": 0.07245715775070047, "percentage": 7.25, "elapsed_time": "0:24:06", "remaining_time": "5:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1918, "loss": 0.238, "learning_rate": 4.992808656304221e-06, "epoch": 0.07297843226689255, "percentage": 7.3, "elapsed_time": "0:24:18", "remaining_time": "5:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 1918, "loss": 0.231, "learning_rate": 4.99247822838267e-06, "epoch": 0.07349970678308464, "percentage": 7.35, "elapsed_time": "0:24:28", "remaining_time": "5:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 1918, "loss": 0.2373, "learning_rate": 4.99214039018713e-06, "epoch": 0.07402098129927673, "percentage": 7.4, "elapsed_time": "0:24:38", "remaining_time": "5:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 1918, "loss": 0.2395, "learning_rate": 4.991795142722012e-06, "epoch": 0.07454225581546882, "percentage": 7.46, "elapsed_time": "0:24:49", "remaining_time": "5:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 1918, "loss": 0.235, "learning_rate": 4.9914424870137565e-06, "epoch": 0.07506353033166091, "percentage": 7.51, "elapsed_time": "0:25:00", "remaining_time": "5:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1918, "loss": 0.2427, "learning_rate": 4.991082424110826e-06, "epoch": 0.075584804847853, "percentage": 7.56, "elapsed_time": "0:25:11", "remaining_time": "5:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 1918, "loss": 0.2437, "learning_rate": 4.990714955083709e-06, "epoch": 0.07610607936404509, "percentage": 7.61, "elapsed_time": "0:25:21", "remaining_time": "5:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 1918, "loss": 0.2237, "learning_rate": 4.9903400810249116e-06, "epoch": 0.07662735388023718, "percentage": 7.66, "elapsed_time": "0:25:31", "remaining_time": "5:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 1918, "loss": 0.2277, "learning_rate": 4.9899578030489534e-06, "epoch": 0.07714862839642928, "percentage": 7.72, "elapsed_time": "0:25:42", "remaining_time": "5:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 1918, "loss": 0.2349, "learning_rate": 4.9895681222923685e-06, "epoch": 0.07766990291262135, "percentage": 7.77, "elapsed_time": "0:25:51", "remaining_time": "5:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1918, "loss": 0.2378, "learning_rate": 4.989171039913698e-06, "epoch": 0.07819117742881344, "percentage": 7.82, "elapsed_time": "0:26:02", "remaining_time": "5:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 1918, "loss": 0.2309, "learning_rate": 4.9887665570934905e-06, "epoch": 0.07871245194500553, "percentage": 7.87, "elapsed_time": "0:26:12", "remaining_time": "5:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 1918, "loss": 0.2242, "learning_rate": 4.988354675034296e-06, "epoch": 0.07923372646119763, "percentage": 7.92, "elapsed_time": "0:26:22", "remaining_time": "5:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 1918, "loss": 0.2285, "learning_rate": 4.987935394960661e-06, "epoch": 0.07975500097738972, "percentage": 7.98, "elapsed_time": "0:26:32", "remaining_time": "5:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 1918, "loss": 0.2545, "learning_rate": 4.98750871811913e-06, "epoch": 0.08027627549358181, "percentage": 8.03, "elapsed_time": "0:26:41", "remaining_time": "5:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1918, "loss": 0.2277, "learning_rate": 4.987074645778234e-06, "epoch": 0.0807975500097739, "percentage": 8.08, "elapsed_time": "0:26:51", "remaining_time": "5:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 1918, "loss": 0.2327, "learning_rate": 4.986633179228495e-06, "epoch": 0.08131882452596599, "percentage": 8.13, "elapsed_time": "0:27:02", "remaining_time": "5:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 1918, "loss": 0.2424, "learning_rate": 4.986184319782418e-06, "epoch": 0.08184009904215808, "percentage": 8.19, "elapsed_time": "0:27:14", "remaining_time": "5:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 1918, "loss": 0.2508, "learning_rate": 4.9857280687744856e-06, "epoch": 0.08236137355835016, "percentage": 8.24, "elapsed_time": "0:27:24", "remaining_time": "5:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 1918, "loss": 0.2297, "learning_rate": 4.985264427561158e-06, "epoch": 0.08288264807454225, "percentage": 8.29, "elapsed_time": "0:27:34", "remaining_time": "5:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1918, "loss": 0.2307, "learning_rate": 4.984793397520865e-06, "epoch": 0.08340392259073434, "percentage": 8.34, "elapsed_time": "0:27:45", "remaining_time": "5:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 1918, "loss": 0.2323, "learning_rate": 4.984314980054005e-06, "epoch": 0.08392519710692643, "percentage": 8.39, "elapsed_time": "0:27:54", "remaining_time": "5:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 1918, "loss": 0.2473, "learning_rate": 4.983829176582939e-06, "epoch": 0.08444647162311852, "percentage": 8.45, "elapsed_time": "0:28:04", "remaining_time": "5:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 1918, "loss": 0.2344, "learning_rate": 4.983335988551986e-06, "epoch": 0.08496774613931062, "percentage": 8.5, "elapsed_time": "0:28:16", "remaining_time": "5:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 1918, "loss": 0.2447, "learning_rate": 4.982835417427424e-06, "epoch": 0.0854890206555027, "percentage": 8.55, "elapsed_time": "0:28:26", "remaining_time": "5:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1918, "loss": 0.2339, "learning_rate": 4.982327464697476e-06, "epoch": 0.0860102951716948, "percentage": 8.6, "elapsed_time": "0:28:37", "remaining_time": "5:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 1918, "loss": 0.2421, "learning_rate": 4.981812131872315e-06, "epoch": 0.08653156968788689, "percentage": 8.65, "elapsed_time": "0:28:47", "remaining_time": "5:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 1918, "loss": 0.2063, "learning_rate": 4.981289420484051e-06, "epoch": 0.08705284420407897, "percentage": 8.71, "elapsed_time": "0:28:56", "remaining_time": "5:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 1918, "loss": 0.2223, "learning_rate": 4.980759332086736e-06, "epoch": 0.08757411872027106, "percentage": 8.76, "elapsed_time": "0:29:07", "remaining_time": "5:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 1918, "loss": 0.2518, "learning_rate": 4.980221868256351e-06, "epoch": 0.08809539323646315, "percentage": 8.81, "elapsed_time": "0:29:18", "remaining_time": "5:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1918, "loss": 0.2244, "learning_rate": 4.9796770305908045e-06, "epoch": 0.08861666775265524, "percentage": 8.86, "elapsed_time": "0:29:27", "remaining_time": "5:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 1918, "loss": 0.2315, "learning_rate": 4.979124820709931e-06, "epoch": 0.08913794226884733, "percentage": 8.92, "elapsed_time": "0:29:37", "remaining_time": "5:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 1918, "loss": 0.226, "learning_rate": 4.978565240255477e-06, "epoch": 0.08965921678503942, "percentage": 8.97, "elapsed_time": "0:29:48", "remaining_time": "5:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 1918, "loss": 0.2314, "learning_rate": 4.977998290891109e-06, "epoch": 0.09018049130123151, "percentage": 9.02, "elapsed_time": "0:29:57", "remaining_time": "5:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 1918, "loss": 0.2359, "learning_rate": 4.9774239743023975e-06, "epoch": 0.0907017658174236, "percentage": 9.07, "elapsed_time": "0:30:08", "remaining_time": "5:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1918, "loss": 0.2371, "learning_rate": 4.976842292196817e-06, "epoch": 0.0912230403336157, "percentage": 9.12, "elapsed_time": "0:30:19", "remaining_time": "5:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 1918, "loss": 0.2346, "learning_rate": 4.9762532463037385e-06, "epoch": 0.09174431484980777, "percentage": 9.18, "elapsed_time": "0:30:29", "remaining_time": "5:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 1918, "loss": 0.2377, "learning_rate": 4.97565683837443e-06, "epoch": 0.09226558936599986, "percentage": 9.23, "elapsed_time": "0:30:39", "remaining_time": "5:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 1918, "loss": 0.2301, "learning_rate": 4.9750530701820446e-06, "epoch": 0.09278686388219196, "percentage": 9.28, "elapsed_time": "0:30:49", "remaining_time": "5:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 1918, "loss": 0.246, "learning_rate": 4.974441943521616e-06, "epoch": 0.09330813839838405, "percentage": 9.33, "elapsed_time": "0:31:00", "remaining_time": "5:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1918, "loss": 0.2255, "learning_rate": 4.9738234602100605e-06, "epoch": 0.09382941291457614, "percentage": 9.38, "elapsed_time": "0:31:10", "remaining_time": "5:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 1918, "loss": 0.2326, "learning_rate": 4.97319762208616e-06, "epoch": 0.09435068743076823, "percentage": 9.44, "elapsed_time": "0:31:20", "remaining_time": "5:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 1918, "loss": 0.245, "learning_rate": 4.972564431010567e-06, "epoch": 0.09487196194696032, "percentage": 9.49, "elapsed_time": "0:31:31", "remaining_time": "5:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 1918, "loss": 0.2247, "learning_rate": 4.971923888865792e-06, "epoch": 0.09539323646315241, "percentage": 9.54, "elapsed_time": "0:31:42", "remaining_time": "5:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 1918, "loss": 0.2073, "learning_rate": 4.971275997556203e-06, "epoch": 0.0959145109793445, "percentage": 9.59, "elapsed_time": "0:31:52", "remaining_time": "5:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1918, "loss": 0.2284, "learning_rate": 4.970620759008015e-06, "epoch": 0.09643578549553658, "percentage": 9.65, "elapsed_time": "0:32:01", "remaining_time": "5:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 1918, "loss": 0.2483, "learning_rate": 4.969958175169291e-06, "epoch": 0.09695706001172867, "percentage": 9.7, "elapsed_time": "0:32:12", "remaining_time": "4:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 1918, "loss": 0.2184, "learning_rate": 4.969288248009924e-06, "epoch": 0.09747833452792076, "percentage": 9.75, "elapsed_time": "0:32:22", "remaining_time": "4:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 1918, "loss": 0.2229, "learning_rate": 4.968610979521647e-06, "epoch": 0.09799960904411285, "percentage": 9.8, "elapsed_time": "0:32:32", "remaining_time": "4:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 1918, "loss": 0.2456, "learning_rate": 4.967926371718017e-06, "epoch": 0.09852088356030494, "percentage": 9.85, "elapsed_time": "0:32:42", "remaining_time": "4:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1918, "loss": 0.2358, "learning_rate": 4.96723442663441e-06, "epoch": 0.09904215807649704, "percentage": 9.91, "elapsed_time": "0:32:53", "remaining_time": "4:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 1918, "loss": 0.2259, "learning_rate": 4.966535146328014e-06, "epoch": 0.09956343259268913, "percentage": 9.96, "elapsed_time": "0:33:03", "remaining_time": "4:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 1918, "loss": 0.2262, "learning_rate": 4.965828532877831e-06, "epoch": 0.10008470710888122, "percentage": 10.01, "elapsed_time": "0:33:13", "remaining_time": "4:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 1918, "loss": 0.2475, "learning_rate": 4.96511458838466e-06, "epoch": 0.10060598162507331, "percentage": 10.06, "elapsed_time": "0:33:24", "remaining_time": "4:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 1918, "loss": 0.2311, "learning_rate": 4.964393314971096e-06, "epoch": 0.10112725614126539, "percentage": 10.11, "elapsed_time": "0:33:35", "remaining_time": "4:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1918, "loss": 0.2395, "learning_rate": 4.963664714781525e-06, "epoch": 0.10164853065745748, "percentage": 10.17, "elapsed_time": "0:33:46", "remaining_time": "4:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 1918, "loss": 0.2191, "learning_rate": 4.962928789982117e-06, "epoch": 0.10216980517364957, "percentage": 10.22, "elapsed_time": "0:33:56", "remaining_time": "4:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 1918, "loss": 0.2208, "learning_rate": 4.9621855427608134e-06, "epoch": 0.10269107968984166, "percentage": 10.27, "elapsed_time": "0:34:05", "remaining_time": "4:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 1918, "loss": 0.2459, "learning_rate": 4.961434975327331e-06, "epoch": 0.10321235420603375, "percentage": 10.32, "elapsed_time": "0:34:15", "remaining_time": "4:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 1918, "loss": 0.2328, "learning_rate": 4.960677089913146e-06, "epoch": 0.10373362872222584, "percentage": 10.38, "elapsed_time": "0:34:26", "remaining_time": "4:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1918, "loss": 0.2312, "learning_rate": 4.959911888771496e-06, "epoch": 0.10425490323841793, "percentage": 10.43, "elapsed_time": "0:34:36", "remaining_time": "4:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 1918, "loss": 0.2074, "learning_rate": 4.959139374177364e-06, "epoch": 0.10477617775461003, "percentage": 10.48, "elapsed_time": "0:34:46", "remaining_time": "4:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 1918, "loss": 0.2357, "learning_rate": 4.958359548427478e-06, "epoch": 0.10529745227080212, "percentage": 10.53, "elapsed_time": "0:34:56", "remaining_time": "4:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 1918, "loss": 0.2182, "learning_rate": 4.957572413840303e-06, "epoch": 0.10581872678699421, "percentage": 10.58, "elapsed_time": "0:35:07", "remaining_time": "4:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 1918, "loss": 0.2237, "learning_rate": 4.956777972756033e-06, "epoch": 0.10634000130318629, "percentage": 10.64, "elapsed_time": "0:35:17", "remaining_time": "4:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1918, "loss": 0.2105, "learning_rate": 4.955976227536584e-06, "epoch": 0.10686127581937838, "percentage": 10.69, "elapsed_time": "0:35:27", "remaining_time": "4:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 1918, "loss": 0.2273, "learning_rate": 4.95516718056559e-06, "epoch": 0.10738255033557047, "percentage": 10.74, "elapsed_time": "0:35:37", "remaining_time": "4:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 1918, "loss": 0.239, "learning_rate": 4.95435083424839e-06, "epoch": 0.10790382485176256, "percentage": 10.79, "elapsed_time": "0:35:47", "remaining_time": "4:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 1918, "loss": 0.2417, "learning_rate": 4.953527191012029e-06, "epoch": 0.10842509936795465, "percentage": 10.84, "elapsed_time": "0:35:57", "remaining_time": "4:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 1918, "loss": 0.2282, "learning_rate": 4.95269625330524e-06, "epoch": 0.10894637388414674, "percentage": 10.9, "elapsed_time": "0:36:08", "remaining_time": "4:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1918, "loss": 0.2013, "learning_rate": 4.951858023598448e-06, "epoch": 0.10946764840033883, "percentage": 10.95, "elapsed_time": "0:36:17", "remaining_time": "4:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 1918, "loss": 0.2271, "learning_rate": 4.951012504383756e-06, "epoch": 0.10998892291653092, "percentage": 11.0, "elapsed_time": "0:36:27", "remaining_time": "4:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 1918, "loss": 0.2393, "learning_rate": 4.9501596981749375e-06, "epoch": 0.11051019743272301, "percentage": 11.05, "elapsed_time": "0:36:37", "remaining_time": "4:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 1918, "loss": 0.2311, "learning_rate": 4.949299607507434e-06, "epoch": 0.11103147194891509, "percentage": 11.11, "elapsed_time": "0:36:48", "remaining_time": "4:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 1918, "loss": 0.2029, "learning_rate": 4.94843223493834e-06, "epoch": 0.11155274646510718, "percentage": 11.16, "elapsed_time": "0:36:58", "remaining_time": "4:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1918, "loss": 0.2342, "learning_rate": 4.947557583046403e-06, "epoch": 0.11207402098129927, "percentage": 11.21, "elapsed_time": "0:37:08", "remaining_time": "4:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 1918, "loss": 0.2188, "learning_rate": 4.94667565443201e-06, "epoch": 0.11259529549749137, "percentage": 11.26, "elapsed_time": "0:37:18", "remaining_time": "4:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 1918, "loss": 0.2376, "learning_rate": 4.945786451717183e-06, "epoch": 0.11311657001368346, "percentage": 11.31, "elapsed_time": "0:37:30", "remaining_time": "4:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 1918, "loss": 0.2353, "learning_rate": 4.944889977545571e-06, "epoch": 0.11363784452987555, "percentage": 11.37, "elapsed_time": "0:37:41", "remaining_time": "4:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 1918, "loss": 0.249, "learning_rate": 4.94398623458244e-06, "epoch": 0.11415911904606764, "percentage": 11.42, "elapsed_time": "0:37:51", "remaining_time": "4:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1918, "loss": 0.2212, "learning_rate": 4.943075225514667e-06, "epoch": 0.11468039356225973, "percentage": 11.47, "elapsed_time": "0:38:01", "remaining_time": "4:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 1918, "loss": 0.2427, "learning_rate": 4.942156953050733e-06, "epoch": 0.11520166807845182, "percentage": 11.52, "elapsed_time": "0:38:12", "remaining_time": "4:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 1918, "loss": 0.2315, "learning_rate": 4.94123141992071e-06, "epoch": 0.1157229425946439, "percentage": 11.57, "elapsed_time": "0:38:22", "remaining_time": "4:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 1918, "loss": 0.2323, "learning_rate": 4.940298628876261e-06, "epoch": 0.11624421711083599, "percentage": 11.63, "elapsed_time": "0:38:32", "remaining_time": "4:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 1918, "loss": 0.2208, "learning_rate": 4.9393585826906245e-06, "epoch": 0.11676549162702808, "percentage": 11.68, "elapsed_time": "0:38:42", "remaining_time": "4:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1918, "loss": 0.219, "learning_rate": 4.938411284158608e-06, "epoch": 0.11728676614322017, "percentage": 11.73, "elapsed_time": "0:38:53", "remaining_time": "4:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 1918, "loss": 0.2482, "learning_rate": 4.937456736096581e-06, "epoch": 0.11780804065941226, "percentage": 11.78, "elapsed_time": "0:39:04", "remaining_time": "4:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 1918, "loss": 0.2373, "learning_rate": 4.936494941342469e-06, "epoch": 0.11832931517560435, "percentage": 11.84, "elapsed_time": "0:39:14", "remaining_time": "4:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 1918, "loss": 0.2323, "learning_rate": 4.93552590275574e-06, "epoch": 0.11885058969179645, "percentage": 11.89, "elapsed_time": "0:39:24", "remaining_time": "4:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 1918, "loss": 0.2266, "learning_rate": 4.934549623217399e-06, "epoch": 0.11937186420798854, "percentage": 11.94, "elapsed_time": "0:39:35", "remaining_time": "4:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1918, "loss": 0.2325, "learning_rate": 4.9335661056299755e-06, "epoch": 0.11989313872418063, "percentage": 11.99, "elapsed_time": "0:39:45", "remaining_time": "4:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 1918, "loss": 0.2224, "learning_rate": 4.932575352917524e-06, "epoch": 0.1204144132403727, "percentage": 12.04, "elapsed_time": "0:39:56", "remaining_time": "4:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 1918, "loss": 0.2159, "learning_rate": 4.931577368025607e-06, "epoch": 0.1209356877565648, "percentage": 12.1, "elapsed_time": "0:40:06", "remaining_time": "4:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 1918, "loss": 0.2418, "learning_rate": 4.930572153921287e-06, "epoch": 0.12145696227275689, "percentage": 12.15, "elapsed_time": "0:40:16", "remaining_time": "4:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 1918, "loss": 0.2296, "learning_rate": 4.92955971359312e-06, "epoch": 0.12197823678894898, "percentage": 12.2, "elapsed_time": "0:40:26", "remaining_time": "4:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1918, "loss": 0.211, "learning_rate": 4.928540050051146e-06, "epoch": 0.12249951130514107, "percentage": 12.25, "elapsed_time": "0:40:36", "remaining_time": "4:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 1918, "loss": 0.2147, "learning_rate": 4.927513166326881e-06, "epoch": 0.12302078582133316, "percentage": 12.3, "elapsed_time": "0:40:47", "remaining_time": "4:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 1918, "loss": 0.2274, "learning_rate": 4.9264790654733076e-06, "epoch": 0.12354206033752525, "percentage": 12.36, "elapsed_time": "0:40:58", "remaining_time": "4:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 1918, "loss": 0.235, "learning_rate": 4.925437750564863e-06, "epoch": 0.12406333485371734, "percentage": 12.41, "elapsed_time": "0:41:08", "remaining_time": "4:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 1918, "loss": 0.2272, "learning_rate": 4.924389224697433e-06, "epoch": 0.12458460936990944, "percentage": 12.46, "elapsed_time": "0:41:18", "remaining_time": "4:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1918, "loss": 0.2412, "learning_rate": 4.923333490988343e-06, "epoch": 0.12510588388610153, "percentage": 12.51, "elapsed_time": "0:41:30", "remaining_time": "4:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 1918, "loss": 0.2168, "learning_rate": 4.922270552576347e-06, "epoch": 0.1256271584022936, "percentage": 12.57, "elapsed_time": "0:41:40", "remaining_time": "4:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 1918, "loss": 0.2133, "learning_rate": 4.921200412621619e-06, "epoch": 0.1261484329184857, "percentage": 12.62, "elapsed_time": "0:41:50", "remaining_time": "4:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 1918, "loss": 0.2246, "learning_rate": 4.920123074305743e-06, "epoch": 0.1266697074346778, "percentage": 12.67, "elapsed_time": "0:42:00", "remaining_time": "4:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 1918, "loss": 0.2182, "learning_rate": 4.919038540831705e-06, "epoch": 0.12719098195086986, "percentage": 12.72, "elapsed_time": "0:42:09", "remaining_time": "4:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1918, "loss": 0.2119, "learning_rate": 4.917946815423883e-06, "epoch": 0.12771225646706197, "percentage": 12.77, "elapsed_time": "0:42:18", "remaining_time": "4:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 1918, "loss": 0.231, "learning_rate": 4.916847901328035e-06, "epoch": 0.12823353098325405, "percentage": 12.83, "elapsed_time": "0:42:29", "remaining_time": "4:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 1918, "loss": 0.2362, "learning_rate": 4.915741801811294e-06, "epoch": 0.12875480549944615, "percentage": 12.88, "elapsed_time": "0:42:39", "remaining_time": "4:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 1918, "loss": 0.2375, "learning_rate": 4.914628520162154e-06, "epoch": 0.12927608001563823, "percentage": 12.93, "elapsed_time": "0:42:51", "remaining_time": "4:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 1918, "loss": 0.1983, "learning_rate": 4.913508059690461e-06, "epoch": 0.12979735453183033, "percentage": 12.98, "elapsed_time": "0:43:02", "remaining_time": "4:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1918, "loss": 0.2208, "learning_rate": 4.912380423727405e-06, "epoch": 0.1303186290480224, "percentage": 13.03, "elapsed_time": "0:43:13", "remaining_time": "4:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 1918, "loss": 0.2163, "learning_rate": 4.911245615625512e-06, "epoch": 0.13083990356421452, "percentage": 13.09, "elapsed_time": "0:43:23", "remaining_time": "4:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 1918, "loss": 0.2379, "learning_rate": 4.910103638758627e-06, "epoch": 0.1313611780804066, "percentage": 13.14, "elapsed_time": "0:43:34", "remaining_time": "4:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 1918, "loss": 0.224, "learning_rate": 4.9089544965219095e-06, "epoch": 0.13188245259659867, "percentage": 13.19, "elapsed_time": "0:43:45", "remaining_time": "4:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 1918, "loss": 0.2088, "learning_rate": 4.907798192331821e-06, "epoch": 0.13240372711279078, "percentage": 13.24, "elapsed_time": "0:43:54", "remaining_time": "4:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1918, "loss": 0.2211, "learning_rate": 4.90663472962612e-06, "epoch": 0.13292500162898285, "percentage": 13.3, "elapsed_time": "0:44:05", "remaining_time": "4:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 1918, "loss": 0.2287, "learning_rate": 4.905464111863841e-06, "epoch": 0.13344627614517496, "percentage": 13.35, "elapsed_time": "0:44:14", "remaining_time": "4:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 1918, "loss": 0.2339, "learning_rate": 4.904286342525298e-06, "epoch": 0.13396755066136704, "percentage": 13.4, "elapsed_time": "0:44:25", "remaining_time": "4:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 1918, "loss": 0.2327, "learning_rate": 4.903101425112062e-06, "epoch": 0.13448882517755914, "percentage": 13.45, "elapsed_time": "0:44:37", "remaining_time": "4:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 1918, "loss": 0.2253, "learning_rate": 4.9019093631469575e-06, "epoch": 0.13501009969375122, "percentage": 13.5, "elapsed_time": "0:44:46", "remaining_time": "4:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1918, "loss": 0.248, "learning_rate": 4.900710160174048e-06, "epoch": 0.13553137420994332, "percentage": 13.56, "elapsed_time": "0:44:56", "remaining_time": "4:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 1918, "loss": 0.2174, "learning_rate": 4.899503819758633e-06, "epoch": 0.1360526487261354, "percentage": 13.61, "elapsed_time": "0:45:06", "remaining_time": "4:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 1918, "loss": 0.2219, "learning_rate": 4.898290345487226e-06, "epoch": 0.13657392324232748, "percentage": 13.66, "elapsed_time": "0:45:17", "remaining_time": "4:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 1918, "loss": 0.2131, "learning_rate": 4.897069740967554e-06, "epoch": 0.13709519775851958, "percentage": 13.71, "elapsed_time": "0:45:27", "remaining_time": "4:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 1918, "loss": 0.2284, "learning_rate": 4.89584200982854e-06, "epoch": 0.13761647227471166, "percentage": 13.76, "elapsed_time": "0:45:37", "remaining_time": "4:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1918, "loss": 0.2418, "learning_rate": 4.894607155720294e-06, "epoch": 0.13813774679090376, "percentage": 13.82, "elapsed_time": "0:45:47", "remaining_time": "4:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 1918, "loss": 0.2385, "learning_rate": 4.893365182314108e-06, "epoch": 0.13865902130709584, "percentage": 13.87, "elapsed_time": "0:45:57", "remaining_time": "4:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 1918, "loss": 0.2229, "learning_rate": 4.892116093302436e-06, "epoch": 0.13918029582328795, "percentage": 13.92, "elapsed_time": "0:46:08", "remaining_time": "4:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 1918, "loss": 0.2355, "learning_rate": 4.890859892398886e-06, "epoch": 0.13970157033948002, "percentage": 13.97, "elapsed_time": "0:46:18", "remaining_time": "4:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 1918, "loss": 0.2344, "learning_rate": 4.889596583338213e-06, "epoch": 0.14022284485567213, "percentage": 14.03, "elapsed_time": "0:46:28", "remaining_time": "4:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1918, "loss": 0.2188, "learning_rate": 4.8883261698763045e-06, "epoch": 0.1407441193718642, "percentage": 14.08, "elapsed_time": "0:46:37", "remaining_time": "4:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 1918, "loss": 0.2274, "learning_rate": 4.887048655790169e-06, "epoch": 0.14126539388805628, "percentage": 14.13, "elapsed_time": "0:46:49", "remaining_time": "4:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 1918, "loss": 0.2398, "learning_rate": 4.8857640448779246e-06, "epoch": 0.1417866684042484, "percentage": 14.18, "elapsed_time": "0:47:00", "remaining_time": "4:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 1918, "loss": 0.2221, "learning_rate": 4.884472340958791e-06, "epoch": 0.14230794292044047, "percentage": 14.23, "elapsed_time": "0:47:09", "remaining_time": "4:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 1918, "loss": 0.2318, "learning_rate": 4.883173547873073e-06, "epoch": 0.14282921743663257, "percentage": 14.29, "elapsed_time": "0:47:19", "remaining_time": "4:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1918, "loss": 0.2313, "learning_rate": 4.881867669482157e-06, "epoch": 0.14335049195282465, "percentage": 14.34, "elapsed_time": "0:47:29", "remaining_time": "4:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 1918, "loss": 0.2332, "learning_rate": 4.880554709668486e-06, "epoch": 0.14387176646901675, "percentage": 14.39, "elapsed_time": "0:47:40", "remaining_time": "4:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 1918, "loss": 0.235, "learning_rate": 4.879234672335564e-06, "epoch": 0.14439304098520883, "percentage": 14.44, "elapsed_time": "0:47:51", "remaining_time": "4:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 1918, "loss": 0.2395, "learning_rate": 4.8779075614079354e-06, "epoch": 0.14491431550140094, "percentage": 14.49, "elapsed_time": "0:48:01", "remaining_time": "4:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 1918, "loss": 0.2223, "learning_rate": 4.87657338083117e-06, "epoch": 0.145435590017593, "percentage": 14.55, "elapsed_time": "0:48:13", "remaining_time": "4:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1918, "loss": 0.2275, "learning_rate": 4.875232134571863e-06, "epoch": 0.1459568645337851, "percentage": 14.6, "elapsed_time": "0:48:23", "remaining_time": "4:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 1918, "loss": 0.2211, "learning_rate": 4.8738838266176094e-06, "epoch": 0.1464781390499772, "percentage": 14.65, "elapsed_time": "0:48:33", "remaining_time": "4:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 1918, "loss": 0.229, "learning_rate": 4.872528460977005e-06, "epoch": 0.14699941356616927, "percentage": 14.7, "elapsed_time": "0:48:43", "remaining_time": "4:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 1918, "loss": 0.2258, "learning_rate": 4.871166041679626e-06, "epoch": 0.14752068808236138, "percentage": 14.75, "elapsed_time": "0:48:54", "remaining_time": "4:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 1918, "loss": 0.2323, "learning_rate": 4.869796572776018e-06, "epoch": 0.14804196259855346, "percentage": 14.81, "elapsed_time": "0:49:05", "remaining_time": "4:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1918, "loss": 0.2107, "learning_rate": 4.868420058337687e-06, "epoch": 0.14856323711474556, "percentage": 14.86, "elapsed_time": "0:49:15", "remaining_time": "4:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 1918, "loss": 0.2107, "learning_rate": 4.867036502457087e-06, "epoch": 0.14908451163093764, "percentage": 14.91, "elapsed_time": "0:49:25", "remaining_time": "4:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 1918, "loss": 0.2249, "learning_rate": 4.865645909247604e-06, "epoch": 0.14960578614712974, "percentage": 14.96, "elapsed_time": "0:49:37", "remaining_time": "4:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 1918, "loss": 0.2399, "learning_rate": 4.864248282843548e-06, "epoch": 0.15012706066332182, "percentage": 15.02, "elapsed_time": "0:49:48", "remaining_time": "4:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 1918, "loss": 0.2151, "learning_rate": 4.862843627400139e-06, "epoch": 0.1506483351795139, "percentage": 15.07, "elapsed_time": "0:49:58", "remaining_time": "4:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1918, "loss": 0.2175, "learning_rate": 4.861431947093494e-06, "epoch": 0.151169609695706, "percentage": 15.12, "elapsed_time": "0:50:09", "remaining_time": "4:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 1918, "loss": 0.2298, "learning_rate": 4.860013246120616e-06, "epoch": 0.15169088421189808, "percentage": 15.17, "elapsed_time": "0:50:18", "remaining_time": "4:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 1918, "loss": 0.2089, "learning_rate": 4.85858752869938e-06, "epoch": 0.15221215872809019, "percentage": 15.22, "elapsed_time": "0:50:29", "remaining_time": "4:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 1918, "loss": 0.2266, "learning_rate": 4.857154799068522e-06, "epoch": 0.15273343324428226, "percentage": 15.28, "elapsed_time": "0:50:41", "remaining_time": "4:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 1918, "loss": 0.2255, "learning_rate": 4.855715061487626e-06, "epoch": 0.15325470776047437, "percentage": 15.33, "elapsed_time": "0:50:50", "remaining_time": "4:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1918, "loss": 0.2223, "learning_rate": 4.8542683202371105e-06, "epoch": 0.15377598227666645, "percentage": 15.38, "elapsed_time": "0:51:01", "remaining_time": "4:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 1918, "loss": 0.2154, "learning_rate": 4.8528145796182155e-06, "epoch": 0.15429725679285855, "percentage": 15.43, "elapsed_time": "0:51:12", "remaining_time": "4:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 1918, "loss": 0.2228, "learning_rate": 4.851353843952992e-06, "epoch": 0.15481853130905063, "percentage": 15.48, "elapsed_time": "0:51:24", "remaining_time": "4:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 1918, "loss": 0.2335, "learning_rate": 4.849886117584286e-06, "epoch": 0.1553398058252427, "percentage": 15.54, "elapsed_time": "0:51:34", "remaining_time": "4:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 1918, "loss": 0.2097, "learning_rate": 4.84841140487573e-06, "epoch": 0.1558610803414348, "percentage": 15.59, "elapsed_time": "0:51:43", "remaining_time": "4:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1918, "loss": 0.2272, "learning_rate": 4.846929710211724e-06, "epoch": 0.1563823548576269, "percentage": 15.64, "elapsed_time": "0:51:54", "remaining_time": "4:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 1918, "loss": 0.2321, "learning_rate": 4.845441037997428e-06, "epoch": 0.156903629373819, "percentage": 15.69, "elapsed_time": "0:52:05", "remaining_time": "4:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 1918, "loss": 0.2212, "learning_rate": 4.843945392658744e-06, "epoch": 0.15742490389001107, "percentage": 15.75, "elapsed_time": "0:52:15", "remaining_time": "4:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 1918, "loss": 0.2312, "learning_rate": 4.84244277864231e-06, "epoch": 0.15794617840620317, "percentage": 15.8, "elapsed_time": "0:52:26", "remaining_time": "4:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 1918, "loss": 0.2328, "learning_rate": 4.840933200415479e-06, "epoch": 0.15846745292239525, "percentage": 15.85, "elapsed_time": "0:52:37", "remaining_time": "4:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1918, "loss": 0.2317, "learning_rate": 4.839416662466307e-06, "epoch": 0.15898872743858736, "percentage": 15.9, "elapsed_time": "0:52:48", "remaining_time": "4:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 1918, "loss": 0.2297, "learning_rate": 4.837893169303548e-06, "epoch": 0.15951000195477943, "percentage": 15.95, "elapsed_time": "0:52:58", "remaining_time": "4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 1918, "loss": 0.2182, "learning_rate": 4.836362725456628e-06, "epoch": 0.1600312764709715, "percentage": 16.01, "elapsed_time": "0:53:08", "remaining_time": "4:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 1918, "loss": 0.2251, "learning_rate": 4.834825335475641e-06, "epoch": 0.16055255098716362, "percentage": 16.06, "elapsed_time": "0:53:17", "remaining_time": "4:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 1918, "loss": 0.2165, "learning_rate": 4.833281003931331e-06, "epoch": 0.1610738255033557, "percentage": 16.11, "elapsed_time": "0:53:28", "remaining_time": "4:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1918, "loss": 0.2333, "learning_rate": 4.831729735415081e-06, "epoch": 0.1615951000195478, "percentage": 16.16, "elapsed_time": "0:53:39", "remaining_time": "4:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 1918, "loss": 0.2408, "learning_rate": 4.830171534538895e-06, "epoch": 0.16211637453573988, "percentage": 16.21, "elapsed_time": "0:53:50", "remaining_time": "4:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 1918, "loss": 0.2118, "learning_rate": 4.828606405935391e-06, "epoch": 0.16263764905193198, "percentage": 16.27, "elapsed_time": "0:54:01", "remaining_time": "4:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 1918, "loss": 0.2259, "learning_rate": 4.827034354257782e-06, "epoch": 0.16315892356812406, "percentage": 16.32, "elapsed_time": "0:54:12", "remaining_time": "4:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 1918, "loss": 0.2197, "learning_rate": 4.825455384179864e-06, "epoch": 0.16368019808431616, "percentage": 16.37, "elapsed_time": "0:54:22", "remaining_time": "4:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1918, "loss": 0.2346, "learning_rate": 4.823869500395999e-06, "epoch": 0.16420147260050824, "percentage": 16.42, "elapsed_time": "0:54:32", "remaining_time": "4:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 1918, "loss": 0.2298, "learning_rate": 4.822276707621109e-06, "epoch": 0.16472274711670032, "percentage": 16.48, "elapsed_time": "0:54:43", "remaining_time": "4:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 1918, "loss": 0.227, "learning_rate": 4.820677010590652e-06, "epoch": 0.16524402163289242, "percentage": 16.53, "elapsed_time": "0:54:53", "remaining_time": "4:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 1918, "loss": 0.2388, "learning_rate": 4.819070414060616e-06, "epoch": 0.1657652961490845, "percentage": 16.58, "elapsed_time": "0:55:04", "remaining_time": "4:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 1918, "loss": 0.2338, "learning_rate": 4.817456922807499e-06, "epoch": 0.1662865706652766, "percentage": 16.63, "elapsed_time": "0:55:16", "remaining_time": "4:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1918, "loss": 0.2299, "learning_rate": 4.815836541628299e-06, "epoch": 0.16680784518146868, "percentage": 16.68, "elapsed_time": "0:55:26", "remaining_time": "4:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 1918, "loss": 0.2047, "learning_rate": 4.814209275340498e-06, "epoch": 0.1673291196976608, "percentage": 16.74, "elapsed_time": "0:55:36", "remaining_time": "4:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 1918, "loss": 0.2189, "learning_rate": 4.8125751287820484e-06, "epoch": 0.16785039421385287, "percentage": 16.79, "elapsed_time": "0:55:46", "remaining_time": "4:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 1918, "loss": 0.2355, "learning_rate": 4.8109341068113566e-06, "epoch": 0.16837166873004497, "percentage": 16.84, "elapsed_time": "0:55:57", "remaining_time": "4:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 1918, "loss": 0.2311, "learning_rate": 4.8092862143072705e-06, "epoch": 0.16889294324623705, "percentage": 16.89, "elapsed_time": "0:56:08", "remaining_time": "4:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1918, "loss": 0.2316, "learning_rate": 4.807631456169064e-06, "epoch": 0.16941421776242913, "percentage": 16.94, "elapsed_time": "0:56:18", "remaining_time": "4:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 1918, "loss": 0.2108, "learning_rate": 4.805969837316424e-06, "epoch": 0.16993549227862123, "percentage": 17.0, "elapsed_time": "0:56:28", "remaining_time": "4:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 1918, "loss": 0.2292, "learning_rate": 4.804301362689435e-06, "epoch": 0.1704567667948133, "percentage": 17.05, "elapsed_time": "0:56:40", "remaining_time": "4:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 1918, "loss": 0.2168, "learning_rate": 4.8026260372485625e-06, "epoch": 0.1709780413110054, "percentage": 17.1, "elapsed_time": "0:56:49", "remaining_time": "4:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 1918, "loss": 0.2119, "learning_rate": 4.8009438659746396e-06, "epoch": 0.1714993158271975, "percentage": 17.15, "elapsed_time": "0:56:59", "remaining_time": "4:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1918, "loss": 0.2227, "learning_rate": 4.7992548538688554e-06, "epoch": 0.1720205903433896, "percentage": 17.21, "elapsed_time": "0:57:09", "remaining_time": "4:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 1918, "loss": 0.2161, "learning_rate": 4.797559005952733e-06, "epoch": 0.17254186485958167, "percentage": 17.26, "elapsed_time": "0:57:18", "remaining_time": "4:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 1918, "loss": 0.2338, "learning_rate": 4.795856327268124e-06, "epoch": 0.17306313937577378, "percentage": 17.31, "elapsed_time": "0:57:29", "remaining_time": "4:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 1918, "loss": 0.2232, "learning_rate": 4.794146822877182e-06, "epoch": 0.17358441389196586, "percentage": 17.36, "elapsed_time": "0:57:41", "remaining_time": "4:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 1918, "loss": 0.2181, "learning_rate": 4.792430497862358e-06, "epoch": 0.17410568840815793, "percentage": 17.41, "elapsed_time": "0:57:52", "remaining_time": "4:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1918, "loss": 0.2333, "learning_rate": 4.790707357326381e-06, "epoch": 0.17462696292435004, "percentage": 17.47, "elapsed_time": "0:58:03", "remaining_time": "4:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 1918, "loss": 0.2034, "learning_rate": 4.788977406392242e-06, "epoch": 0.17514823744054211, "percentage": 17.52, "elapsed_time": "0:58:13", "remaining_time": "4:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 1918, "loss": 0.2272, "learning_rate": 4.787240650203178e-06, "epoch": 0.17566951195673422, "percentage": 17.57, "elapsed_time": "0:58:22", "remaining_time": "4:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 1918, "loss": 0.2376, "learning_rate": 4.785497093922662e-06, "epoch": 0.1761907864729263, "percentage": 17.62, "elapsed_time": "0:58:33", "remaining_time": "4:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 1918, "loss": 0.23, "learning_rate": 4.78374674273438e-06, "epoch": 0.1767120609891184, "percentage": 17.67, "elapsed_time": "0:58:44", "remaining_time": "4:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1918, "loss": 0.2132, "learning_rate": 4.781989601842224e-06, "epoch": 0.17723333550531048, "percentage": 17.73, "elapsed_time": "0:58:55", "remaining_time": "4:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 1918, "loss": 0.1965, "learning_rate": 4.780225676470268e-06, "epoch": 0.17775461002150258, "percentage": 17.78, "elapsed_time": "0:59:05", "remaining_time": "4:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 1918, "loss": 0.2076, "learning_rate": 4.77845497186276e-06, "epoch": 0.17827588453769466, "percentage": 17.83, "elapsed_time": "0:59:15", "remaining_time": "4:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 1918, "loss": 0.2195, "learning_rate": 4.776677493284101e-06, "epoch": 0.17879715905388674, "percentage": 17.88, "elapsed_time": "0:59:25", "remaining_time": "4:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 1918, "loss": 0.2293, "learning_rate": 4.774893246018831e-06, "epoch": 0.17931843357007884, "percentage": 17.94, "elapsed_time": "0:59:36", "remaining_time": "4:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1918, "loss": 0.218, "learning_rate": 4.773102235371617e-06, "epoch": 0.17983970808627092, "percentage": 17.99, "elapsed_time": "0:59:47", "remaining_time": "4:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 1918, "loss": 0.2174, "learning_rate": 4.771304466667229e-06, "epoch": 0.18036098260246303, "percentage": 18.04, "elapsed_time": "0:59:59", "remaining_time": "4:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 1918, "loss": 0.2237, "learning_rate": 4.769499945250533e-06, "epoch": 0.1808822571186551, "percentage": 18.09, "elapsed_time": "1:00:08", "remaining_time": "4:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 1918, "loss": 0.2323, "learning_rate": 4.76768867648647e-06, "epoch": 0.1814035316348472, "percentage": 18.14, "elapsed_time": "1:00:19", "remaining_time": "4:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 1918, "loss": 0.2027, "learning_rate": 4.7658706657600395e-06, "epoch": 0.1819248061510393, "percentage": 18.2, "elapsed_time": "1:00:29", "remaining_time": "4:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1918, "loss": 0.2298, "learning_rate": 4.764045918476288e-06, "epoch": 0.1824460806672314, "percentage": 18.25, "elapsed_time": "1:00:40", "remaining_time": "4:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 1918, "loss": 0.2217, "learning_rate": 4.762214440060289e-06, "epoch": 0.18296735518342347, "percentage": 18.3, "elapsed_time": "1:00:50", "remaining_time": "4:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 1918, "loss": 0.2376, "learning_rate": 4.760376235957127e-06, "epoch": 0.18348862969961555, "percentage": 18.35, "elapsed_time": "1:01:00", "remaining_time": "4:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 1918, "loss": 0.2103, "learning_rate": 4.758531311631884e-06, "epoch": 0.18400990421580765, "percentage": 18.4, "elapsed_time": "1:01:11", "remaining_time": "4:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 1918, "loss": 0.2271, "learning_rate": 4.756679672569621e-06, "epoch": 0.18453117873199973, "percentage": 18.46, "elapsed_time": "1:01:22", "remaining_time": "4:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1918, "loss": 0.2176, "learning_rate": 4.7548213242753616e-06, "epoch": 0.18505245324819183, "percentage": 18.51, "elapsed_time": "1:01:33", "remaining_time": "4:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 1918, "loss": 0.2211, "learning_rate": 4.752956272274078e-06, "epoch": 0.1855737277643839, "percentage": 18.56, "elapsed_time": "1:01:44", "remaining_time": "4:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 1918, "loss": 0.2225, "learning_rate": 4.751084522110669e-06, "epoch": 0.18609500228057602, "percentage": 18.61, "elapsed_time": "1:01:55", "remaining_time": "4:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 1918, "loss": 0.2116, "learning_rate": 4.749206079349952e-06, "epoch": 0.1866162767967681, "percentage": 18.67, "elapsed_time": "1:02:07", "remaining_time": "4:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 1918, "loss": 0.2142, "learning_rate": 4.747320949576641e-06, "epoch": 0.1871375513129602, "percentage": 18.72, "elapsed_time": "1:02:18", "remaining_time": "4:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1918, "loss": 0.2107, "learning_rate": 4.745429138395329e-06, "epoch": 0.18765882582915228, "percentage": 18.77, "elapsed_time": "1:02:26", "remaining_time": "4:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 1918, "loss": 0.2199, "learning_rate": 4.743530651430472e-06, "epoch": 0.18818010034534435, "percentage": 18.82, "elapsed_time": "1:02:36", "remaining_time": "4:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 1918, "loss": 0.2232, "learning_rate": 4.741625494326379e-06, "epoch": 0.18870137486153646, "percentage": 18.87, "elapsed_time": "1:02:48", "remaining_time": "4:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 1918, "loss": 0.2193, "learning_rate": 4.739713672747183e-06, "epoch": 0.18922264937772854, "percentage": 18.93, "elapsed_time": "1:02:57", "remaining_time": "4:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 1918, "loss": 0.226, "learning_rate": 4.737795192376836e-06, "epoch": 0.18974392389392064, "percentage": 18.98, "elapsed_time": "1:03:07", "remaining_time": "4:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1918, "loss": 0.2339, "learning_rate": 4.735870058919084e-06, "epoch": 0.19026519841011272, "percentage": 19.03, "elapsed_time": "1:03:17", "remaining_time": "4:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 1918, "loss": 0.2393, "learning_rate": 4.733938278097456e-06, "epoch": 0.19078647292630482, "percentage": 19.08, "elapsed_time": "1:03:28", "remaining_time": "4:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 1918, "loss": 0.224, "learning_rate": 4.731999855655239e-06, "epoch": 0.1913077474424969, "percentage": 19.13, "elapsed_time": "1:03:39", "remaining_time": "4:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 1918, "loss": 0.2448, "learning_rate": 4.730054797355471e-06, "epoch": 0.191829021958689, "percentage": 19.19, "elapsed_time": "1:03:49", "remaining_time": "4:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 1918, "loss": 0.2051, "learning_rate": 4.728103108980915e-06, "epoch": 0.19235029647488108, "percentage": 19.24, "elapsed_time": "1:03:59", "remaining_time": "4:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1918, "loss": 0.2139, "learning_rate": 4.726144796334049e-06, "epoch": 0.19287157099107316, "percentage": 19.29, "elapsed_time": "1:04:09", "remaining_time": "4:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 1918, "loss": 0.2288, "learning_rate": 4.724179865237042e-06, "epoch": 0.19339284550726527, "percentage": 19.34, "elapsed_time": "1:04:20", "remaining_time": "4:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 1918, "loss": 0.2107, "learning_rate": 4.722208321531743e-06, "epoch": 0.19391412002345734, "percentage": 19.4, "elapsed_time": "1:04:30", "remaining_time": "4:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 1918, "loss": 0.2192, "learning_rate": 4.720230171079657e-06, "epoch": 0.19443539453964945, "percentage": 19.45, "elapsed_time": "1:04:41", "remaining_time": "4:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 1918, "loss": 0.2256, "learning_rate": 4.7182454197619355e-06, "epoch": 0.19495666905584152, "percentage": 19.5, "elapsed_time": "1:04:53", "remaining_time": "4:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1918, "loss": 0.2274, "learning_rate": 4.716254073479352e-06, "epoch": 0.19547794357203363, "percentage": 19.55, "elapsed_time": "1:05:04", "remaining_time": "4:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 1918, "loss": 0.2145, "learning_rate": 4.714256138152287e-06, "epoch": 0.1959992180882257, "percentage": 19.6, "elapsed_time": "1:05:14", "remaining_time": "4:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 1918, "loss": 0.2236, "learning_rate": 4.712251619720712e-06, "epoch": 0.1965204926044178, "percentage": 19.66, "elapsed_time": "1:05:24", "remaining_time": "4:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 1918, "loss": 0.224, "learning_rate": 4.71024052414417e-06, "epoch": 0.1970417671206099, "percentage": 19.71, "elapsed_time": "1:05:34", "remaining_time": "4:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 1918, "loss": 0.2167, "learning_rate": 4.70822285740176e-06, "epoch": 0.19756304163680197, "percentage": 19.76, "elapsed_time": "1:05:43", "remaining_time": "4:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1918, "loss": 0.225, "learning_rate": 4.706198625492111e-06, "epoch": 0.19808431615299407, "percentage": 19.81, "elapsed_time": "1:05:53", "remaining_time": "4:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 1918, "loss": 0.2154, "learning_rate": 4.704167834433378e-06, "epoch": 0.19860559066918615, "percentage": 19.86, "elapsed_time": "1:06:03", "remaining_time": "4:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 1918, "loss": 0.2211, "learning_rate": 4.702130490263215e-06, "epoch": 0.19912686518537825, "percentage": 19.92, "elapsed_time": "1:06:14", "remaining_time": "4:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 1918, "loss": 0.2067, "learning_rate": 4.700086599038755e-06, "epoch": 0.19964813970157033, "percentage": 19.97, "elapsed_time": "1:06:25", "remaining_time": "4:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 1918, "loss": 0.2325, "learning_rate": 4.698036166836598e-06, "epoch": 0.20016941421776244, "percentage": 20.02, "elapsed_time": "1:06:35", "remaining_time": "4:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1918, "loss": 0.2095, "learning_rate": 4.695979199752794e-06, "epoch": 0.20069068873395451, "percentage": 20.07, "elapsed_time": "1:06:45", "remaining_time": "4:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 1918, "loss": 0.2222, "learning_rate": 4.693915703902816e-06, "epoch": 0.20121196325014662, "percentage": 20.13, "elapsed_time": "1:06:55", "remaining_time": "4:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 1918, "loss": 0.2103, "learning_rate": 4.691845685421551e-06, "epoch": 0.2017332377663387, "percentage": 20.18, "elapsed_time": "1:07:05", "remaining_time": "4:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 1918, "loss": 0.2196, "learning_rate": 4.689769150463277e-06, "epoch": 0.20225451228253077, "percentage": 20.23, "elapsed_time": "1:07:15", "remaining_time": "4:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 1918, "loss": 0.226, "learning_rate": 4.687686105201645e-06, "epoch": 0.20277578679872288, "percentage": 20.28, "elapsed_time": "1:07:26", "remaining_time": "4:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1918, "loss": 0.2047, "learning_rate": 4.685596555829664e-06, "epoch": 0.20329706131491496, "percentage": 20.33, "elapsed_time": "1:07:36", "remaining_time": "4:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 1918, "loss": 0.2083, "learning_rate": 4.683500508559676e-06, "epoch": 0.20381833583110706, "percentage": 20.39, "elapsed_time": "1:07:48", "remaining_time": "4:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 1918, "loss": 0.2065, "learning_rate": 4.681397969623347e-06, "epoch": 0.20433961034729914, "percentage": 20.44, "elapsed_time": "1:07:59", "remaining_time": "4:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 1918, "loss": 0.2444, "learning_rate": 4.679288945271639e-06, "epoch": 0.20486088486349124, "percentage": 20.49, "elapsed_time": "1:08:10", "remaining_time": "4:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 1918, "loss": 0.2236, "learning_rate": 4.677173441774796e-06, "epoch": 0.20538215937968332, "percentage": 20.54, "elapsed_time": "1:08:20", "remaining_time": "4:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1918, "loss": 0.2337, "learning_rate": 4.675051465422326e-06, "epoch": 0.20590343389587543, "percentage": 20.59, "elapsed_time": "1:08:32", "remaining_time": "4:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 1918, "loss": 0.2195, "learning_rate": 4.6729230225229815e-06, "epoch": 0.2064247084120675, "percentage": 20.65, "elapsed_time": "1:08:41", "remaining_time": "4:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 1918, "loss": 0.2287, "learning_rate": 4.670788119404739e-06, "epoch": 0.20694598292825958, "percentage": 20.7, "elapsed_time": "1:08:51", "remaining_time": "4:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 1918, "loss": 0.2071, "learning_rate": 4.66864676241478e-06, "epoch": 0.20746725744445169, "percentage": 20.75, "elapsed_time": "1:09:02", "remaining_time": "4:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 1918, "loss": 0.2168, "learning_rate": 4.666498957919479e-06, "epoch": 0.20798853196064376, "percentage": 20.8, "elapsed_time": "1:09:12", "remaining_time": "4:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1918, "loss": 0.2176, "learning_rate": 4.664344712304375e-06, "epoch": 0.20850980647683587, "percentage": 20.86, "elapsed_time": "1:09:22", "remaining_time": "4:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 1918, "loss": 0.2306, "learning_rate": 4.6621840319741576e-06, "epoch": 0.20903108099302795, "percentage": 20.91, "elapsed_time": "1:09:31", "remaining_time": "4:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 1918, "loss": 0.219, "learning_rate": 4.660016923352648e-06, "epoch": 0.20955235550922005, "percentage": 20.96, "elapsed_time": "1:09:42", "remaining_time": "4:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 1918, "loss": 0.2164, "learning_rate": 4.657843392882778e-06, "epoch": 0.21007363002541213, "percentage": 21.01, "elapsed_time": "1:09:53", "remaining_time": "4:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 1918, "loss": 0.2082, "learning_rate": 4.6556634470265725e-06, "epoch": 0.21059490454160423, "percentage": 21.06, "elapsed_time": "1:10:03", "remaining_time": "4:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1918, "loss": 0.2209, "learning_rate": 4.6534770922651305e-06, "epoch": 0.2111161790577963, "percentage": 21.12, "elapsed_time": "1:10:13", "remaining_time": "4:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 1918, "loss": 0.2335, "learning_rate": 4.651284335098603e-06, "epoch": 0.21163745357398842, "percentage": 21.17, "elapsed_time": "1:10:24", "remaining_time": "4:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 1918, "loss": 0.2224, "learning_rate": 4.6490851820461785e-06, "epoch": 0.2121587280901805, "percentage": 21.22, "elapsed_time": "1:10:35", "remaining_time": "4:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 1918, "loss": 0.212, "learning_rate": 4.646879639646058e-06, "epoch": 0.21268000260637257, "percentage": 21.27, "elapsed_time": "1:10:46", "remaining_time": "4:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 1918, "loss": 0.2136, "learning_rate": 4.64466771445544e-06, "epoch": 0.21320127712256468, "percentage": 21.32, "elapsed_time": "1:10:56", "remaining_time": "4:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1918, "loss": 0.1937, "learning_rate": 4.642449413050499e-06, "epoch": 0.21372255163875675, "percentage": 21.38, "elapsed_time": "1:11:06", "remaining_time": "4:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 1918, "loss": 0.2254, "learning_rate": 4.640224742026365e-06, "epoch": 0.21424382615494886, "percentage": 21.43, "elapsed_time": "1:11:16", "remaining_time": "4:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 1918, "loss": 0.2112, "learning_rate": 4.637993707997107e-06, "epoch": 0.21476510067114093, "percentage": 21.48, "elapsed_time": "1:11:26", "remaining_time": "4:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 1918, "loss": 0.206, "learning_rate": 4.635756317595714e-06, "epoch": 0.21528637518733304, "percentage": 21.53, "elapsed_time": "1:11:36", "remaining_time": "4:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 1918, "loss": 0.2076, "learning_rate": 4.6335125774740665e-06, "epoch": 0.21580764970352512, "percentage": 21.58, "elapsed_time": "1:11:46", "remaining_time": "4:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1918, "loss": 0.2177, "learning_rate": 4.6312624943029275e-06, "epoch": 0.21632892421971722, "percentage": 21.64, "elapsed_time": "1:11:56", "remaining_time": "4:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 1918, "loss": 0.2373, "learning_rate": 4.629006074771918e-06, "epoch": 0.2168501987359093, "percentage": 21.69, "elapsed_time": "1:12:07", "remaining_time": "4:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 1918, "loss": 0.211, "learning_rate": 4.626743325589496e-06, "epoch": 0.21737147325210138, "percentage": 21.74, "elapsed_time": "1:12:15", "remaining_time": "4:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 1918, "loss": 0.2225, "learning_rate": 4.624474253482938e-06, "epoch": 0.21789274776829348, "percentage": 21.79, "elapsed_time": "1:12:25", "remaining_time": "4:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 1918, "loss": 0.2151, "learning_rate": 4.622198865198321e-06, "epoch": 0.21841402228448556, "percentage": 21.85, "elapsed_time": "1:12:35", "remaining_time": "4:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1918, "loss": 0.2089, "learning_rate": 4.619917167500496e-06, "epoch": 0.21893529680067766, "percentage": 21.9, "elapsed_time": "1:12:45", "remaining_time": "4:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 1918, "loss": 0.2266, "learning_rate": 4.617629167173078e-06, "epoch": 0.21945657131686974, "percentage": 21.95, "elapsed_time": "1:12:55", "remaining_time": "4:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 1918, "loss": 0.231, "learning_rate": 4.615334871018415e-06, "epoch": 0.21997784583306185, "percentage": 22.0, "elapsed_time": "1:13:05", "remaining_time": "4:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 1918, "loss": 0.1894, "learning_rate": 4.613034285857575e-06, "epoch": 0.22049912034925392, "percentage": 22.05, "elapsed_time": "1:13:14", "remaining_time": "4:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 1918, "loss": 0.2273, "learning_rate": 4.610727418530324e-06, "epoch": 0.22102039486544603, "percentage": 22.11, "elapsed_time": "1:13:24", "remaining_time": "4:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1918, "loss": 0.2196, "learning_rate": 4.6084142758951055e-06, "epoch": 0.2215416693816381, "percentage": 22.16, "elapsed_time": "1:13:34", "remaining_time": "4:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 1918, "loss": 0.2109, "learning_rate": 4.606094864829016e-06, "epoch": 0.22206294389783018, "percentage": 22.21, "elapsed_time": "1:13:44", "remaining_time": "4:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 1918, "loss": 0.2213, "learning_rate": 4.603769192227795e-06, "epoch": 0.2225842184140223, "percentage": 22.26, "elapsed_time": "1:13:54", "remaining_time": "4:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 1918, "loss": 0.2166, "learning_rate": 4.601437265005792e-06, "epoch": 0.22310549293021437, "percentage": 22.31, "elapsed_time": "1:14:04", "remaining_time": "4:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 1918, "loss": 0.207, "learning_rate": 4.599099090095955e-06, "epoch": 0.22362676744640647, "percentage": 22.37, "elapsed_time": "1:14:14", "remaining_time": "4:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1918, "loss": 0.2193, "learning_rate": 4.5967546744498044e-06, "epoch": 0.22414804196259855, "percentage": 22.42, "elapsed_time": "1:14:25", "remaining_time": "4:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 1918, "loss": 0.2113, "learning_rate": 4.594404025037418e-06, "epoch": 0.22466931647879065, "percentage": 22.47, "elapsed_time": "1:14:34", "remaining_time": "4:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 1918, "loss": 0.2256, "learning_rate": 4.592047148847404e-06, "epoch": 0.22519059099498273, "percentage": 22.52, "elapsed_time": "1:14:45", "remaining_time": "4:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 1918, "loss": 0.2198, "learning_rate": 4.589684052886884e-06, "epoch": 0.22571186551117484, "percentage": 22.58, "elapsed_time": "1:14:55", "remaining_time": "4:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 1918, "loss": 0.231, "learning_rate": 4.587314744181471e-06, "epoch": 0.2262331400273669, "percentage": 22.63, "elapsed_time": "1:15:05", "remaining_time": "4:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1918, "loss": 0.209, "learning_rate": 4.58493922977525e-06, "epoch": 0.226754414543559, "percentage": 22.68, "elapsed_time": "1:15:16", "remaining_time": "4:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 1918, "loss": 0.2072, "learning_rate": 4.582557516730755e-06, "epoch": 0.2272756890597511, "percentage": 22.73, "elapsed_time": "1:15:27", "remaining_time": "4:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 1918, "loss": 0.196, "learning_rate": 4.58016961212895e-06, "epoch": 0.22779696357594317, "percentage": 22.78, "elapsed_time": "1:15:37", "remaining_time": "4:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 1918, "loss": 0.2277, "learning_rate": 4.577775523069204e-06, "epoch": 0.22831823809213528, "percentage": 22.84, "elapsed_time": "1:15:48", "remaining_time": "4:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 1918, "loss": 0.2407, "learning_rate": 4.575375256669276e-06, "epoch": 0.22883951260832736, "percentage": 22.89, "elapsed_time": "1:15:59", "remaining_time": "4:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1918, "loss": 0.1848, "learning_rate": 4.572968820065288e-06, "epoch": 0.22936078712451946, "percentage": 22.94, "elapsed_time": "1:16:09", "remaining_time": "4:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 1918, "loss": 0.2163, "learning_rate": 4.570556220411708e-06, "epoch": 0.22988206164071154, "percentage": 22.99, "elapsed_time": "1:16:19", "remaining_time": "4:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 1918, "loss": 0.2093, "learning_rate": 4.568137464881328e-06, "epoch": 0.23040333615690364, "percentage": 23.04, "elapsed_time": "1:16:31", "remaining_time": "4:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 1918, "loss": 0.2132, "learning_rate": 4.5657125606652385e-06, "epoch": 0.23092461067309572, "percentage": 23.1, "elapsed_time": "1:16:41", "remaining_time": "4:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 1918, "loss": 0.2262, "learning_rate": 4.563281514972814e-06, "epoch": 0.2314458851892878, "percentage": 23.15, "elapsed_time": "1:16:51", "remaining_time": "4:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1918, "loss": 0.2404, "learning_rate": 4.560844335031684e-06, "epoch": 0.2319671597054799, "percentage": 23.2, "elapsed_time": "1:17:02", "remaining_time": "4:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 1918, "loss": 0.2343, "learning_rate": 4.55840102808772e-06, "epoch": 0.23248843422167198, "percentage": 23.25, "elapsed_time": "1:17:13", "remaining_time": "4:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 1918, "loss": 0.2063, "learning_rate": 4.555951601405005e-06, "epoch": 0.23300970873786409, "percentage": 23.31, "elapsed_time": "1:17:23", "remaining_time": "4:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 1918, "loss": 0.2202, "learning_rate": 4.55349606226582e-06, "epoch": 0.23353098325405616, "percentage": 23.36, "elapsed_time": "1:17:34", "remaining_time": "4:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 1918, "loss": 0.2324, "learning_rate": 4.551034417970616e-06, "epoch": 0.23405225777024827, "percentage": 23.41, "elapsed_time": "1:17:45", "remaining_time": "4:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1918, "loss": 0.2186, "learning_rate": 4.548566675837996e-06, "epoch": 0.23457353228644034, "percentage": 23.46, "elapsed_time": "1:17:57", "remaining_time": "4:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 1918, "loss": 0.2101, "learning_rate": 4.546092843204694e-06, "epoch": 0.23509480680263245, "percentage": 23.51, "elapsed_time": "1:18:07", "remaining_time": "4:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 1918, "loss": 0.2248, "learning_rate": 4.543612927425547e-06, "epoch": 0.23561608131882453, "percentage": 23.57, "elapsed_time": "1:18:18", "remaining_time": "4:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 1918, "loss": 0.2082, "learning_rate": 4.541126935873481e-06, "epoch": 0.2361373558350166, "percentage": 23.62, "elapsed_time": "1:18:28", "remaining_time": "4:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 1918, "loss": 0.2114, "learning_rate": 4.538634875939486e-06, "epoch": 0.2366586303512087, "percentage": 23.67, "elapsed_time": "1:18:39", "remaining_time": "4:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1918, "loss": 0.2133, "learning_rate": 4.536136755032592e-06, "epoch": 0.2371799048674008, "percentage": 23.72, "elapsed_time": "1:18:50", "remaining_time": "4:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 1918, "loss": 0.214, "learning_rate": 4.5336325805798475e-06, "epoch": 0.2377011793835929, "percentage": 23.77, "elapsed_time": "1:19:01", "remaining_time": "4:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 1918, "loss": 0.2074, "learning_rate": 4.5311223600263016e-06, "epoch": 0.23822245389978497, "percentage": 23.83, "elapsed_time": "1:19:11", "remaining_time": "4:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 1918, "loss": 0.208, "learning_rate": 4.528606100834976e-06, "epoch": 0.23874372841597707, "percentage": 23.88, "elapsed_time": "1:19:20", "remaining_time": "4:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 1918, "loss": 0.2108, "learning_rate": 4.526083810486848e-06, "epoch": 0.23926500293216915, "percentage": 23.93, "elapsed_time": "1:19:31", "remaining_time": "4:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1918, "loss": 0.2126, "learning_rate": 4.523555496480824e-06, "epoch": 0.23978627744836126, "percentage": 23.98, "elapsed_time": "1:19:40", "remaining_time": "4:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 1918, "loss": 0.2218, "learning_rate": 4.5210211663337195e-06, "epoch": 0.24030755196455333, "percentage": 24.04, "elapsed_time": "1:19:51", "remaining_time": "4:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 1918, "loss": 0.2115, "learning_rate": 4.518480827580237e-06, "epoch": 0.2408288264807454, "percentage": 24.09, "elapsed_time": "1:20:01", "remaining_time": "4:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 1918, "loss": 0.2142, "learning_rate": 4.515934487772942e-06, "epoch": 0.24135010099693752, "percentage": 24.14, "elapsed_time": "1:20:13", "remaining_time": "4:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 1918, "loss": 0.198, "learning_rate": 4.513382154482242e-06, "epoch": 0.2418713755131296, "percentage": 24.19, "elapsed_time": "1:20:23", "remaining_time": "4:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1918, "loss": 0.2272, "learning_rate": 4.510823835296364e-06, "epoch": 0.2423926500293217, "percentage": 24.24, "elapsed_time": "1:20:33", "remaining_time": "4:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 1918, "loss": 0.2001, "learning_rate": 4.50825953782133e-06, "epoch": 0.24291392454551378, "percentage": 24.3, "elapsed_time": "1:20:43", "remaining_time": "4:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 1918, "loss": 0.2124, "learning_rate": 4.505689269680937e-06, "epoch": 0.24343519906170588, "percentage": 24.35, "elapsed_time": "1:20:54", "remaining_time": "4:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 1918, "loss": 0.2126, "learning_rate": 4.503113038516732e-06, "epoch": 0.24395647357789796, "percentage": 24.4, "elapsed_time": "1:21:04", "remaining_time": "4:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 1918, "loss": 0.2225, "learning_rate": 4.500530851987992e-06, "epoch": 0.24447774809409006, "percentage": 24.45, "elapsed_time": "1:21:14", "remaining_time": "4:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1918, "loss": 0.1993, "learning_rate": 4.4979427177716974e-06, "epoch": 0.24499902261028214, "percentage": 24.5, "elapsed_time": "1:21:25", "remaining_time": "4:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 1918, "loss": 0.209, "learning_rate": 4.495348643562514e-06, "epoch": 0.24552029712647422, "percentage": 24.56, "elapsed_time": "1:21:35", "remaining_time": "4:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 1918, "loss": 0.2205, "learning_rate": 4.4927486370727656e-06, "epoch": 0.24604157164266632, "percentage": 24.61, "elapsed_time": "1:21:46", "remaining_time": "4:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 1918, "loss": 0.2306, "learning_rate": 4.4901427060324135e-06, "epoch": 0.2465628461588584, "percentage": 24.66, "elapsed_time": "1:21:56", "remaining_time": "4:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 1918, "loss": 0.2187, "learning_rate": 4.487530858189033e-06, "epoch": 0.2470841206750505, "percentage": 24.71, "elapsed_time": "1:22:06", "remaining_time": "4:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1918, "loss": 0.2314, "learning_rate": 4.4849131013077915e-06, "epoch": 0.24760539519124258, "percentage": 24.77, "elapsed_time": "1:22:16", "remaining_time": "4:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 1918, "loss": 0.2175, "learning_rate": 4.482289443171421e-06, "epoch": 0.2481266697074347, "percentage": 24.82, "elapsed_time": "1:22:26", "remaining_time": "4:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 1918, "loss": 0.2151, "learning_rate": 4.479659891580203e-06, "epoch": 0.24864794422362677, "percentage": 24.87, "elapsed_time": "1:22:36", "remaining_time": "4:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 1918, "loss": 0.2243, "learning_rate": 4.477024454351937e-06, "epoch": 0.24916921873981887, "percentage": 24.92, "elapsed_time": "1:22:47", "remaining_time": "4:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 1918, "loss": 0.2246, "learning_rate": 4.4743831393219215e-06, "epoch": 0.24969049325601095, "percentage": 24.97, "elapsed_time": "1:22:58", "remaining_time": "4:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1918, "loss": 0.2194, "learning_rate": 4.471735954342932e-06, "epoch": 0.25021176777220305, "percentage": 25.03, "elapsed_time": "1:23:09", "remaining_time": "4:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 1918, "loss": 0.214, "learning_rate": 4.469082907285192e-06, "epoch": 0.2507330422883951, "percentage": 25.08, "elapsed_time": "1:23:19", "remaining_time": "4:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 1918, "loss": 0.2195, "learning_rate": 4.4664240060363565e-06, "epoch": 0.2512543168045872, "percentage": 25.13, "elapsed_time": "1:23:30", "remaining_time": "4:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 1918, "loss": 0.2058, "learning_rate": 4.463759258501485e-06, "epoch": 0.2517755913207793, "percentage": 25.18, "elapsed_time": "1:23:42", "remaining_time": "4:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 1918, "loss": 0.2198, "learning_rate": 4.461088672603015e-06, "epoch": 0.2522968658369714, "percentage": 25.23, "elapsed_time": "1:23:52", "remaining_time": "4:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1918, "loss": 0.225, "learning_rate": 4.458412256280747e-06, "epoch": 0.25281814035316347, "percentage": 25.29, "elapsed_time": "1:24:03", "remaining_time": "4:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 1918, "loss": 0.2006, "learning_rate": 4.455730017491812e-06, "epoch": 0.2533394148693556, "percentage": 25.34, "elapsed_time": "1:24:13", "remaining_time": "4:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 1918, "loss": 0.2041, "learning_rate": 4.453041964210653e-06, "epoch": 0.2538606893855477, "percentage": 25.39, "elapsed_time": "1:24:23", "remaining_time": "4:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 1918, "loss": 0.2215, "learning_rate": 4.450348104428998e-06, "epoch": 0.2543819639017397, "percentage": 25.44, "elapsed_time": "1:24:35", "remaining_time": "4:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 1918, "loss": 0.222, "learning_rate": 4.447648446155841e-06, "epoch": 0.25490323841793183, "percentage": 25.5, "elapsed_time": "1:24:45", "remaining_time": "4:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1918, "loss": 0.2114, "learning_rate": 4.4449429974174115e-06, "epoch": 0.25542451293412394, "percentage": 25.55, "elapsed_time": "1:24:55", "remaining_time": "4:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 1918, "loss": 0.1928, "learning_rate": 4.442231766257159e-06, "epoch": 0.25594578745031604, "percentage": 25.6, "elapsed_time": "1:25:05", "remaining_time": "4:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 1918, "loss": 0.2, "learning_rate": 4.43951476073572e-06, "epoch": 0.2564670619665081, "percentage": 25.65, "elapsed_time": "1:25:15", "remaining_time": "4:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 1918, "loss": 0.2182, "learning_rate": 4.436791988930901e-06, "epoch": 0.2569883364827002, "percentage": 25.7, "elapsed_time": "1:25:25", "remaining_time": "4:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 1918, "loss": 0.2096, "learning_rate": 4.434063458937652e-06, "epoch": 0.2575096109988923, "percentage": 25.76, "elapsed_time": "1:25:35", "remaining_time": "4:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1918, "loss": 0.2257, "learning_rate": 4.43132917886804e-06, "epoch": 0.2580308855150844, "percentage": 25.81, "elapsed_time": "1:25:46", "remaining_time": "4:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 1918, "loss": 0.2181, "learning_rate": 4.428589156851231e-06, "epoch": 0.25855216003127646, "percentage": 25.86, "elapsed_time": "1:25:57", "remaining_time": "4:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 1918, "loss": 0.2162, "learning_rate": 4.42584340103346e-06, "epoch": 0.25907343454746856, "percentage": 25.91, "elapsed_time": "1:26:08", "remaining_time": "4:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 1918, "loss": 0.2301, "learning_rate": 4.423091919578008e-06, "epoch": 0.25959470906366067, "percentage": 25.96, "elapsed_time": "1:26:19", "remaining_time": "4:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 1918, "loss": 0.2355, "learning_rate": 4.4203347206651805e-06, "epoch": 0.2601159835798527, "percentage": 26.02, "elapsed_time": "1:26:31", "remaining_time": "4:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1918, "loss": 0.1954, "learning_rate": 4.417571812492279e-06, "epoch": 0.2606372580960448, "percentage": 26.07, "elapsed_time": "1:26:41", "remaining_time": "4:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1918, "eval_loss": 0.21339768171310425, "epoch": 0.2606372580960448, "percentage": 26.07, "elapsed_time": "1:27:33", "remaining_time": "4:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 1918, "loss": 0.2233, "learning_rate": 4.4148032032735835e-06, "epoch": 0.2611585326122369, "percentage": 26.12, "elapsed_time": "1:27:45", "remaining_time": "4:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 1918, "loss": 0.205, "learning_rate": 4.4120289012403185e-06, "epoch": 0.26167980712842903, "percentage": 26.17, "elapsed_time": "1:27:55", "remaining_time": "4:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 1918, "loss": 0.2156, "learning_rate": 4.409248914640636e-06, "epoch": 0.2622010816446211, "percentage": 26.23, "elapsed_time": "1:28:05", "remaining_time": "4:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 1918, "loss": 0.2247, "learning_rate": 4.4064632517395875e-06, "epoch": 0.2627223561608132, "percentage": 26.28, "elapsed_time": "1:28:14", "remaining_time": "4:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1918, "loss": 0.2234, "learning_rate": 4.4036719208191025e-06, "epoch": 0.2632436306770053, "percentage": 26.33, "elapsed_time": "1:28:25", "remaining_time": "4:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 1918, "loss": 0.2219, "learning_rate": 4.400874930177959e-06, "epoch": 0.26376490519319734, "percentage": 26.38, "elapsed_time": "1:28:34", "remaining_time": "4:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 1918, "loss": 0.1922, "learning_rate": 4.398072288131763e-06, "epoch": 0.26428617970938945, "percentage": 26.43, "elapsed_time": "1:28:45", "remaining_time": "4:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 1918, "loss": 0.2175, "learning_rate": 4.395264003012924e-06, "epoch": 0.26480745422558155, "percentage": 26.49, "elapsed_time": "1:28:55", "remaining_time": "4:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 1918, "loss": 0.218, "learning_rate": 4.392450083170625e-06, "epoch": 0.26532872874177366, "percentage": 26.54, "elapsed_time": "1:29:05", "remaining_time": "4:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1918, "loss": 0.2064, "learning_rate": 4.389630536970806e-06, "epoch": 0.2658500032579657, "percentage": 26.59, "elapsed_time": "1:29:16", "remaining_time": "4:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 1918, "loss": 0.2181, "learning_rate": 4.386805372796129e-06, "epoch": 0.2663712777741578, "percentage": 26.64, "elapsed_time": "1:29:26", "remaining_time": "4:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 1918, "loss": 0.2093, "learning_rate": 4.383974599045963e-06, "epoch": 0.2668925522903499, "percentage": 26.69, "elapsed_time": "1:29:36", "remaining_time": "4:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 1918, "loss": 0.2113, "learning_rate": 4.3811382241363545e-06, "epoch": 0.267413826806542, "percentage": 26.75, "elapsed_time": "1:29:46", "remaining_time": "4:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 1918, "loss": 0.2103, "learning_rate": 4.378296256499998e-06, "epoch": 0.26793510132273407, "percentage": 26.8, "elapsed_time": "1:29:56", "remaining_time": "4:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1918, "loss": 0.208, "learning_rate": 4.375448704586221e-06, "epoch": 0.2684563758389262, "percentage": 26.85, "elapsed_time": "1:30:06", "remaining_time": "4:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 1918, "loss": 0.2001, "learning_rate": 4.37259557686095e-06, "epoch": 0.2689776503551183, "percentage": 26.9, "elapsed_time": "1:30:17", "remaining_time": "4:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 1918, "loss": 0.2155, "learning_rate": 4.369736881806691e-06, "epoch": 0.26949892487131033, "percentage": 26.96, "elapsed_time": "1:30:29", "remaining_time": "4:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 1918, "loss": 0.2049, "learning_rate": 4.366872627922498e-06, "epoch": 0.27002019938750244, "percentage": 27.01, "elapsed_time": "1:30:39", "remaining_time": "4:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 1918, "loss": 0.2161, "learning_rate": 4.364002823723956e-06, "epoch": 0.27054147390369454, "percentage": 27.06, "elapsed_time": "1:30:49", "remaining_time": "4:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1918, "loss": 0.2178, "learning_rate": 4.36112747774315e-06, "epoch": 0.27106274841988665, "percentage": 27.11, "elapsed_time": "1:31:01", "remaining_time": "4:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 1918, "loss": 0.2008, "learning_rate": 4.358246598528641e-06, "epoch": 0.2715840229360787, "percentage": 27.16, "elapsed_time": "1:31:12", "remaining_time": "4:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 1918, "loss": 0.1985, "learning_rate": 4.355360194645439e-06, "epoch": 0.2721052974522708, "percentage": 27.22, "elapsed_time": "1:31:22", "remaining_time": "4:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 1918, "loss": 0.2138, "learning_rate": 4.35246827467498e-06, "epoch": 0.2726265719684629, "percentage": 27.27, "elapsed_time": "1:31:33", "remaining_time": "4:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 1918, "loss": 0.2155, "learning_rate": 4.349570847215104e-06, "epoch": 0.27314784648465495, "percentage": 27.32, "elapsed_time": "1:31:43", "remaining_time": "4:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1918, "loss": 0.2197, "learning_rate": 4.346667920880016e-06, "epoch": 0.27366912100084706, "percentage": 27.37, "elapsed_time": "1:31:54", "remaining_time": "4:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 1918, "loss": 0.2074, "learning_rate": 4.343759504300278e-06, "epoch": 0.27419039551703916, "percentage": 27.42, "elapsed_time": "1:32:06", "remaining_time": "4:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 1918, "loss": 0.2136, "learning_rate": 4.34084560612277e-06, "epoch": 0.27471167003323127, "percentage": 27.48, "elapsed_time": "1:32:16", "remaining_time": "4:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 1918, "loss": 0.2053, "learning_rate": 4.337926235010672e-06, "epoch": 0.2752329445494233, "percentage": 27.53, "elapsed_time": "1:32:26", "remaining_time": "4:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 1918, "loss": 0.2194, "learning_rate": 4.335001399643433e-06, "epoch": 0.2757542190656154, "percentage": 27.58, "elapsed_time": "1:32:36", "remaining_time": "4:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1918, "loss": 0.211, "learning_rate": 4.332071108716747e-06, "epoch": 0.27627549358180753, "percentage": 27.63, "elapsed_time": "1:32:46", "remaining_time": "4:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 1918, "loss": 0.2066, "learning_rate": 4.329135370942531e-06, "epoch": 0.27679676809799963, "percentage": 27.69, "elapsed_time": "1:32:58", "remaining_time": "4:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 1918, "loss": 0.2125, "learning_rate": 4.326194195048894e-06, "epoch": 0.2773180426141917, "percentage": 27.74, "elapsed_time": "1:33:08", "remaining_time": "4:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 1918, "loss": 0.2073, "learning_rate": 4.323247589780111e-06, "epoch": 0.2778393171303838, "percentage": 27.79, "elapsed_time": "1:33:19", "remaining_time": "4:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 1918, "loss": 0.2035, "learning_rate": 4.320295563896601e-06, "epoch": 0.2783605916465759, "percentage": 27.84, "elapsed_time": "1:33:31", "remaining_time": "4:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1918, "loss": 0.2262, "learning_rate": 4.317338126174899e-06, "epoch": 0.27888186616276794, "percentage": 27.89, "elapsed_time": "1:33:42", "remaining_time": "4:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 1918, "loss": 0.2178, "learning_rate": 4.314375285407629e-06, "epoch": 0.27940314067896005, "percentage": 27.95, "elapsed_time": "1:33:54", "remaining_time": "4:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 1918, "loss": 0.1976, "learning_rate": 4.311407050403479e-06, "epoch": 0.27992441519515215, "percentage": 28.0, "elapsed_time": "1:34:04", "remaining_time": "4:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 1918, "loss": 0.2111, "learning_rate": 4.308433429987172e-06, "epoch": 0.28044568971134426, "percentage": 28.05, "elapsed_time": "1:34:15", "remaining_time": "4:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 1918, "loss": 0.2085, "learning_rate": 4.305454432999445e-06, "epoch": 0.2809669642275363, "percentage": 28.1, "elapsed_time": "1:34:25", "remaining_time": "4:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1918, "loss": 0.2132, "learning_rate": 4.302470068297019e-06, "epoch": 0.2814882387437284, "percentage": 28.15, "elapsed_time": "1:34:36", "remaining_time": "4:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 1918, "loss": 0.2119, "learning_rate": 4.2994803447525735e-06, "epoch": 0.2820095132599205, "percentage": 28.21, "elapsed_time": "1:34:47", "remaining_time": "4:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 1918, "loss": 0.1951, "learning_rate": 4.29648527125472e-06, "epoch": 0.28253078777611257, "percentage": 28.26, "elapsed_time": "1:34:57", "remaining_time": "4:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 1918, "loss": 0.2034, "learning_rate": 4.2934848567079745e-06, "epoch": 0.2830520622923047, "percentage": 28.31, "elapsed_time": "1:35:08", "remaining_time": "4:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 1918, "loss": 0.2195, "learning_rate": 4.290479110032735e-06, "epoch": 0.2835733368084968, "percentage": 28.36, "elapsed_time": "1:35:18", "remaining_time": "4:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1918, "loss": 0.2013, "learning_rate": 4.28746804016525e-06, "epoch": 0.2840946113246889, "percentage": 28.42, "elapsed_time": "1:35:27", "remaining_time": "4:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 1918, "loss": 0.2244, "learning_rate": 4.284451656057595e-06, "epoch": 0.28461588584088093, "percentage": 28.47, "elapsed_time": "1:35:38", "remaining_time": "4:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 1918, "loss": 0.2199, "learning_rate": 4.281429966677644e-06, "epoch": 0.28513716035707304, "percentage": 28.52, "elapsed_time": "1:35:48", "remaining_time": "4:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 1918, "loss": 0.2042, "learning_rate": 4.2784029810090456e-06, "epoch": 0.28565843487326514, "percentage": 28.57, "elapsed_time": "1:36:00", "remaining_time": "4:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 1918, "loss": 0.2119, "learning_rate": 4.275370708051194e-06, "epoch": 0.28617970938945725, "percentage": 28.62, "elapsed_time": "1:36:11", "remaining_time": "3:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1918, "loss": 0.2214, "learning_rate": 4.2723331568192004e-06, "epoch": 0.2867009839056493, "percentage": 28.68, "elapsed_time": "1:36:21", "remaining_time": "3:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 1918, "loss": 0.2169, "learning_rate": 4.269290336343873e-06, "epoch": 0.2872222584218414, "percentage": 28.73, "elapsed_time": "1:36:32", "remaining_time": "3:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 1918, "loss": 0.2117, "learning_rate": 4.266242255671681e-06, "epoch": 0.2877435329380335, "percentage": 28.78, "elapsed_time": "1:36:41", "remaining_time": "3:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 1918, "loss": 0.2108, "learning_rate": 4.2631889238647375e-06, "epoch": 0.28826480745422556, "percentage": 28.83, "elapsed_time": "1:36:51", "remaining_time": "3:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 1918, "loss": 0.2121, "learning_rate": 4.260130350000763e-06, "epoch": 0.28878608197041766, "percentage": 28.88, "elapsed_time": "1:37:02", "remaining_time": "3:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1918, "loss": 0.2157, "learning_rate": 4.257066543173064e-06, "epoch": 0.28930735648660977, "percentage": 28.94, "elapsed_time": "1:37:13", "remaining_time": "3:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 1918, "loss": 0.2138, "learning_rate": 4.253997512490507e-06, "epoch": 0.2898286310028019, "percentage": 28.99, "elapsed_time": "1:37:24", "remaining_time": "3:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 1918, "loss": 0.2251, "learning_rate": 4.250923267077489e-06, "epoch": 0.2903499055189939, "percentage": 29.04, "elapsed_time": "1:37:33", "remaining_time": "3:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 1918, "loss": 0.2168, "learning_rate": 4.247843816073909e-06, "epoch": 0.290871180035186, "percentage": 29.09, "elapsed_time": "1:37:44", "remaining_time": "3:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 1918, "loss": 0.2151, "learning_rate": 4.2447591686351406e-06, "epoch": 0.29139245455137813, "percentage": 29.14, "elapsed_time": "1:37:54", "remaining_time": "3:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1918, "loss": 0.2137, "learning_rate": 4.2416693339320115e-06, "epoch": 0.2919137290675702, "percentage": 29.2, "elapsed_time": "1:38:04", "remaining_time": "3:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 1918, "loss": 0.2001, "learning_rate": 4.238574321150769e-06, "epoch": 0.2924350035837623, "percentage": 29.25, "elapsed_time": "1:38:14", "remaining_time": "3:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 1918, "loss": 0.2126, "learning_rate": 4.235474139493055e-06, "epoch": 0.2929562780999544, "percentage": 29.3, "elapsed_time": "1:38:25", "remaining_time": "3:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 1918, "loss": 0.2198, "learning_rate": 4.23236879817588e-06, "epoch": 0.2934775526161465, "percentage": 29.35, "elapsed_time": "1:38:36", "remaining_time": "3:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 1918, "loss": 0.2026, "learning_rate": 4.229258306431592e-06, "epoch": 0.29399882713233855, "percentage": 29.41, "elapsed_time": "1:38:46", "remaining_time": "3:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1918, "loss": 0.2081, "learning_rate": 4.226142673507852e-06, "epoch": 0.29452010164853065, "percentage": 29.46, "elapsed_time": "1:38:56", "remaining_time": "3:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 1918, "loss": 0.2082, "learning_rate": 4.22302190866761e-06, "epoch": 0.29504137616472276, "percentage": 29.51, "elapsed_time": "1:39:07", "remaining_time": "3:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 1918, "loss": 0.2058, "learning_rate": 4.219896021189067e-06, "epoch": 0.29556265068091486, "percentage": 29.56, "elapsed_time": "1:39:17", "remaining_time": "3:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 1918, "loss": 0.2076, "learning_rate": 4.2167650203656605e-06, "epoch": 0.2960839251971069, "percentage": 29.61, "elapsed_time": "1:39:27", "remaining_time": "3:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 1918, "loss": 0.2098, "learning_rate": 4.213628915506025e-06, "epoch": 0.296605199713299, "percentage": 29.67, "elapsed_time": "1:39:36", "remaining_time": "3:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1918, "loss": 0.2004, "learning_rate": 4.210487715933973e-06, "epoch": 0.2971264742294911, "percentage": 29.72, "elapsed_time": "1:39:46", "remaining_time": "3:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 1918, "loss": 0.2179, "learning_rate": 4.207341430988461e-06, "epoch": 0.29764774874568317, "percentage": 29.77, "elapsed_time": "1:39:57", "remaining_time": "3:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 1918, "loss": 0.2103, "learning_rate": 4.204190070023567e-06, "epoch": 0.2981690232618753, "percentage": 29.82, "elapsed_time": "1:40:07", "remaining_time": "3:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 1918, "loss": 0.2108, "learning_rate": 4.2010336424084596e-06, "epoch": 0.2986902977780674, "percentage": 29.87, "elapsed_time": "1:40:18", "remaining_time": "3:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 1918, "loss": 0.2114, "learning_rate": 4.19787215752737e-06, "epoch": 0.2992115722942595, "percentage": 29.93, "elapsed_time": "1:40:28", "remaining_time": "3:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1918, "loss": 0.2185, "learning_rate": 4.194705624779566e-06, "epoch": 0.29973284681045154, "percentage": 29.98, "elapsed_time": "1:40:39", "remaining_time": "3:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 1918, "loss": 0.2115, "learning_rate": 4.191534053579322e-06, "epoch": 0.30025412132664364, "percentage": 30.03, "elapsed_time": "1:40:51", "remaining_time": "3:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 1918, "loss": 0.205, "learning_rate": 4.188357453355893e-06, "epoch": 0.30077539584283575, "percentage": 30.08, "elapsed_time": "1:41:01", "remaining_time": "3:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 1918, "loss": 0.2223, "learning_rate": 4.1851758335534844e-06, "epoch": 0.3012966703590278, "percentage": 30.14, "elapsed_time": "1:41:11", "remaining_time": "3:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 1918, "loss": 0.1904, "learning_rate": 4.181989203631227e-06, "epoch": 0.3018179448752199, "percentage": 30.19, "elapsed_time": "1:41:21", "remaining_time": "3:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1918, "loss": 0.2093, "learning_rate": 4.178797573063144e-06, "epoch": 0.302339219391412, "percentage": 30.24, "elapsed_time": "1:41:32", "remaining_time": "3:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 1918, "loss": 0.2124, "learning_rate": 4.175600951338129e-06, "epoch": 0.3028604939076041, "percentage": 30.29, "elapsed_time": "1:41:41", "remaining_time": "3:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 1918, "loss": 0.2293, "learning_rate": 4.172399347959912e-06, "epoch": 0.30338176842379616, "percentage": 30.34, "elapsed_time": "1:41:52", "remaining_time": "3:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 1918, "loss": 0.2094, "learning_rate": 4.169192772447036e-06, "epoch": 0.30390304293998827, "percentage": 30.4, "elapsed_time": "1:42:02", "remaining_time": "3:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 1918, "loss": 0.2083, "learning_rate": 4.1659812343328246e-06, "epoch": 0.30442431745618037, "percentage": 30.45, "elapsed_time": "1:42:12", "remaining_time": "3:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1918, "loss": 0.2062, "learning_rate": 4.162764743165355e-06, "epoch": 0.3049455919723725, "percentage": 30.5, "elapsed_time": "1:42:22", "remaining_time": "3:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 1918, "loss": 0.2024, "learning_rate": 4.1595433085074334e-06, "epoch": 0.3054668664885645, "percentage": 30.55, "elapsed_time": "1:42:32", "remaining_time": "3:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 1918, "loss": 0.2212, "learning_rate": 4.156316939936559e-06, "epoch": 0.30598814100475663, "percentage": 30.6, "elapsed_time": "1:42:42", "remaining_time": "3:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 1918, "loss": 0.2141, "learning_rate": 4.153085647044904e-06, "epoch": 0.30650941552094874, "percentage": 30.66, "elapsed_time": "1:42:53", "remaining_time": "3:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 1918, "loss": 0.1918, "learning_rate": 4.149849439439277e-06, "epoch": 0.3070306900371408, "percentage": 30.71, "elapsed_time": "1:43:02", "remaining_time": "3:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1918, "loss": 0.1979, "learning_rate": 4.146608326741101e-06, "epoch": 0.3075519645533329, "percentage": 30.76, "elapsed_time": "1:43:13", "remaining_time": "3:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 1918, "loss": 0.2222, "learning_rate": 4.1433623185863805e-06, "epoch": 0.308073239069525, "percentage": 30.81, "elapsed_time": "1:43:23", "remaining_time": "3:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 1918, "loss": 0.2026, "learning_rate": 4.140111424625676e-06, "epoch": 0.3085945135857171, "percentage": 30.87, "elapsed_time": "1:43:33", "remaining_time": "3:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 1918, "loss": 0.2111, "learning_rate": 4.1368556545240724e-06, "epoch": 0.30911578810190915, "percentage": 30.92, "elapsed_time": "1:43:43", "remaining_time": "3:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 1918, "loss": 0.2121, "learning_rate": 4.133595017961152e-06, "epoch": 0.30963706261810126, "percentage": 30.97, "elapsed_time": "1:43:54", "remaining_time": "3:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1918, "loss": 0.2092, "learning_rate": 4.130329524630966e-06, "epoch": 0.31015833713429336, "percentage": 31.02, "elapsed_time": "1:44:04", "remaining_time": "3:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 1918, "loss": 0.1888, "learning_rate": 4.127059184242004e-06, "epoch": 0.3106796116504854, "percentage": 31.07, "elapsed_time": "1:44:14", "remaining_time": "3:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 1918, "loss": 0.2041, "learning_rate": 4.123784006517166e-06, "epoch": 0.3112008861666775, "percentage": 31.13, "elapsed_time": "1:44:23", "remaining_time": "3:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 1918, "loss": 0.2247, "learning_rate": 4.120504001193737e-06, "epoch": 0.3117221606828696, "percentage": 31.18, "elapsed_time": "1:44:34", "remaining_time": "3:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 1918, "loss": 0.2187, "learning_rate": 4.117219178023349e-06, "epoch": 0.3122434351990617, "percentage": 31.23, "elapsed_time": "1:44:45", "remaining_time": "3:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1918, "loss": 0.2212, "learning_rate": 4.113929546771963e-06, "epoch": 0.3127647097152538, "percentage": 31.28, "elapsed_time": "1:44:56", "remaining_time": "3:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 1918, "loss": 0.2059, "learning_rate": 4.1106351172198325e-06, "epoch": 0.3132859842314459, "percentage": 31.33, "elapsed_time": "1:45:05", "remaining_time": "3:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 1918, "loss": 0.2056, "learning_rate": 4.1073358991614745e-06, "epoch": 0.313807258747638, "percentage": 31.39, "elapsed_time": "1:45:16", "remaining_time": "3:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 1918, "loss": 0.2157, "learning_rate": 4.1040319024056465e-06, "epoch": 0.3143285332638301, "percentage": 31.44, "elapsed_time": "1:45:27", "remaining_time": "3:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 1918, "loss": 0.2267, "learning_rate": 4.10072313677531e-06, "epoch": 0.31484980778002214, "percentage": 31.49, "elapsed_time": "1:45:38", "remaining_time": "3:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1918, "loss": 0.2274, "learning_rate": 4.0974096121076076e-06, "epoch": 0.31537108229621424, "percentage": 31.54, "elapsed_time": "1:45:48", "remaining_time": "3:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 1918, "loss": 0.2042, "learning_rate": 4.094091338253829e-06, "epoch": 0.31589235681240635, "percentage": 31.6, "elapsed_time": "1:45:58", "remaining_time": "3:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 1918, "loss": 0.1994, "learning_rate": 4.0907683250793814e-06, "epoch": 0.3164136313285984, "percentage": 31.65, "elapsed_time": "1:46:08", "remaining_time": "3:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 1918, "loss": 0.2021, "learning_rate": 4.0874405824637676e-06, "epoch": 0.3169349058447905, "percentage": 31.7, "elapsed_time": "1:46:19", "remaining_time": "3:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 1918, "loss": 0.2047, "learning_rate": 4.084108120300546e-06, "epoch": 0.3174561803609826, "percentage": 31.75, "elapsed_time": "1:46:28", "remaining_time": "3:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1918, "loss": 0.1883, "learning_rate": 4.080770948497311e-06, "epoch": 0.3179774548771747, "percentage": 31.8, "elapsed_time": "1:46:38", "remaining_time": "3:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 1918, "loss": 0.2095, "learning_rate": 4.077429076975655e-06, "epoch": 0.31849872939336676, "percentage": 31.86, "elapsed_time": "1:46:49", "remaining_time": "3:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 1918, "loss": 0.2145, "learning_rate": 4.074082515671145e-06, "epoch": 0.31902000390955887, "percentage": 31.91, "elapsed_time": "1:46:58", "remaining_time": "3:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 1918, "loss": 0.2049, "learning_rate": 4.070731274533291e-06, "epoch": 0.319541278425751, "percentage": 31.96, "elapsed_time": "1:47:09", "remaining_time": "3:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 1918, "loss": 0.2137, "learning_rate": 4.067375363525516e-06, "epoch": 0.320062552941943, "percentage": 32.01, "elapsed_time": "1:47:19", "remaining_time": "3:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1918, "loss": 0.2003, "learning_rate": 4.064014792625126e-06, "epoch": 0.32058382745813513, "percentage": 32.06, "elapsed_time": "1:47:29", "remaining_time": "3:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 1918, "loss": 0.2091, "learning_rate": 4.060649571823284e-06, "epoch": 0.32110510197432723, "percentage": 32.12, "elapsed_time": "1:47:41", "remaining_time": "3:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 1918, "loss": 0.2096, "learning_rate": 4.057279711124973e-06, "epoch": 0.32162637649051934, "percentage": 32.17, "elapsed_time": "1:47:51", "remaining_time": "3:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 1918, "loss": 0.2212, "learning_rate": 4.053905220548974e-06, "epoch": 0.3221476510067114, "percentage": 32.22, "elapsed_time": "1:48:02", "remaining_time": "3:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 1918, "loss": 0.1766, "learning_rate": 4.050526110127832e-06, "epoch": 0.3226689255229035, "percentage": 32.27, "elapsed_time": "1:48:11", "remaining_time": "3:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1918, "loss": 0.2056, "learning_rate": 4.047142389907827e-06, "epoch": 0.3231902000390956, "percentage": 32.33, "elapsed_time": "1:48:21", "remaining_time": "3:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 1918, "loss": 0.2175, "learning_rate": 4.043754069948944e-06, "epoch": 0.3237114745552877, "percentage": 32.38, "elapsed_time": "1:48:32", "remaining_time": "3:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 1918, "loss": 0.2108, "learning_rate": 4.040361160324844e-06, "epoch": 0.32423274907147975, "percentage": 32.43, "elapsed_time": "1:48:42", "remaining_time": "3:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 1918, "loss": 0.1984, "learning_rate": 4.036963671122831e-06, "epoch": 0.32475402358767186, "percentage": 32.48, "elapsed_time": "1:48:52", "remaining_time": "3:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 1918, "loss": 0.2186, "learning_rate": 4.033561612443829e-06, "epoch": 0.32527529810386396, "percentage": 32.53, "elapsed_time": "1:49:03", "remaining_time": "3:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1918, "loss": 0.202, "learning_rate": 4.030154994402341e-06, "epoch": 0.325796572620056, "percentage": 32.59, "elapsed_time": "1:49:11", "remaining_time": "3:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 1918, "loss": 0.1998, "learning_rate": 4.0267438271264304e-06, "epoch": 0.3263178471362481, "percentage": 32.64, "elapsed_time": "1:49:21", "remaining_time": "3:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 1918, "loss": 0.2196, "learning_rate": 4.023328120757685e-06, "epoch": 0.3268391216524402, "percentage": 32.69, "elapsed_time": "1:49:31", "remaining_time": "3:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 1918, "loss": 0.2065, "learning_rate": 4.019907885451184e-06, "epoch": 0.32736039616863233, "percentage": 32.74, "elapsed_time": "1:49:40", "remaining_time": "3:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 1918, "loss": 0.1978, "learning_rate": 4.016483131375476e-06, "epoch": 0.3278816706848244, "percentage": 32.79, "elapsed_time": "1:49:51", "remaining_time": "3:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1918, "loss": 0.2181, "learning_rate": 4.01305386871254e-06, "epoch": 0.3284029452010165, "percentage": 32.85, "elapsed_time": "1:50:02", "remaining_time": "3:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 1918, "loss": 0.2189, "learning_rate": 4.009620107657763e-06, "epoch": 0.3289242197172086, "percentage": 32.9, "elapsed_time": "1:50:12", "remaining_time": "3:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 1918, "loss": 0.203, "learning_rate": 4.006181858419905e-06, "epoch": 0.32944549423340064, "percentage": 32.95, "elapsed_time": "1:50:23", "remaining_time": "3:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 1918, "loss": 0.1977, "learning_rate": 4.002739131221066e-06, "epoch": 0.32996676874959274, "percentage": 33.0, "elapsed_time": "1:50:33", "remaining_time": "3:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 1918, "loss": 0.2003, "learning_rate": 3.999291936296664e-06, "epoch": 0.33048804326578485, "percentage": 33.06, "elapsed_time": "1:50:43", "remaining_time": "3:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1918, "loss": 0.1925, "learning_rate": 3.995840283895399e-06, "epoch": 0.33100931778197695, "percentage": 33.11, "elapsed_time": "1:50:56", "remaining_time": "3:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 1918, "loss": 0.2083, "learning_rate": 3.99238418427922e-06, "epoch": 0.331530592298169, "percentage": 33.16, "elapsed_time": "1:51:06", "remaining_time": "3:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 1918, "loss": 0.2245, "learning_rate": 3.988923647723301e-06, "epoch": 0.3320518668143611, "percentage": 33.21, "elapsed_time": "1:51:16", "remaining_time": "3:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 1918, "loss": 0.2097, "learning_rate": 3.9854586845160055e-06, "epoch": 0.3325731413305532, "percentage": 33.26, "elapsed_time": "1:51:26", "remaining_time": "3:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 1918, "loss": 0.1979, "learning_rate": 3.981989304958861e-06, "epoch": 0.3330944158467453, "percentage": 33.32, "elapsed_time": "1:51:37", "remaining_time": "3:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1918, "loss": 0.191, "learning_rate": 3.978515519366519e-06, "epoch": 0.33361569036293737, "percentage": 33.37, "elapsed_time": "1:51:48", "remaining_time": "3:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 1918, "loss": 0.2269, "learning_rate": 3.975037338066736e-06, "epoch": 0.33413696487912947, "percentage": 33.42, "elapsed_time": "1:51:58", "remaining_time": "3:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 1918, "loss": 0.212, "learning_rate": 3.9715547714003355e-06, "epoch": 0.3346582393953216, "percentage": 33.47, "elapsed_time": "1:52:09", "remaining_time": "3:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 1918, "loss": 0.1926, "learning_rate": 3.968067829721178e-06, "epoch": 0.3351795139115136, "percentage": 33.52, "elapsed_time": "1:52:19", "remaining_time": "3:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 1918, "loss": 0.2213, "learning_rate": 3.96457652339613e-06, "epoch": 0.33570078842770573, "percentage": 33.58, "elapsed_time": "1:52:30", "remaining_time": "3:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1918, "loss": 0.2033, "learning_rate": 3.961080862805039e-06, "epoch": 0.33622206294389784, "percentage": 33.63, "elapsed_time": "1:52:40", "remaining_time": "3:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 1918, "loss": 0.1999, "learning_rate": 3.9575808583406926e-06, "epoch": 0.33674333746008994, "percentage": 33.68, "elapsed_time": "1:52:50", "remaining_time": "3:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 1918, "loss": 0.2067, "learning_rate": 3.954076520408796e-06, "epoch": 0.337264611976282, "percentage": 33.73, "elapsed_time": "1:52:59", "remaining_time": "3:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 1918, "loss": 0.1966, "learning_rate": 3.950567859427938e-06, "epoch": 0.3377858864924741, "percentage": 33.79, "elapsed_time": "1:53:11", "remaining_time": "3:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 1918, "loss": 0.1943, "learning_rate": 3.947054885829559e-06, "epoch": 0.3383071610086662, "percentage": 33.84, "elapsed_time": "1:53:21", "remaining_time": "3:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1918, "loss": 0.2166, "learning_rate": 3.943537610057921e-06, "epoch": 0.33882843552485825, "percentage": 33.89, "elapsed_time": "1:53:31", "remaining_time": "3:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 1918, "loss": 0.2182, "learning_rate": 3.940016042570079e-06, "epoch": 0.33934971004105036, "percentage": 33.94, "elapsed_time": "1:53:41", "remaining_time": "3:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 1918, "loss": 0.2093, "learning_rate": 3.936490193835843e-06, "epoch": 0.33987098455724246, "percentage": 33.99, "elapsed_time": "1:53:51", "remaining_time": "3:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 1918, "loss": 0.2269, "learning_rate": 3.932960074337755e-06, "epoch": 0.34039225907343457, "percentage": 34.05, "elapsed_time": "1:54:01", "remaining_time": "3:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 1918, "loss": 0.2035, "learning_rate": 3.929425694571055e-06, "epoch": 0.3409135335896266, "percentage": 34.1, "elapsed_time": "1:54:13", "remaining_time": "3:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1918, "loss": 0.2122, "learning_rate": 3.925887065043643e-06, "epoch": 0.3414348081058187, "percentage": 34.15, "elapsed_time": "1:54:23", "remaining_time": "3:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 1918, "loss": 0.2139, "learning_rate": 3.922344196276063e-06, "epoch": 0.3419560826220108, "percentage": 34.2, "elapsed_time": "1:54:33", "remaining_time": "3:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 1918, "loss": 0.2027, "learning_rate": 3.918797098801453e-06, "epoch": 0.34247735713820293, "percentage": 34.25, "elapsed_time": "1:54:44", "remaining_time": "3:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 1918, "loss": 0.1975, "learning_rate": 3.915245783165531e-06, "epoch": 0.342998631654395, "percentage": 34.31, "elapsed_time": "1:54:54", "remaining_time": "3:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 1918, "loss": 0.21, "learning_rate": 3.911690259926551e-06, "epoch": 0.3435199061705871, "percentage": 34.36, "elapsed_time": "1:55:07", "remaining_time": "3:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1918, "loss": 0.2029, "learning_rate": 3.908130539655278e-06, "epoch": 0.3440411806867792, "percentage": 34.41, "elapsed_time": "1:55:17", "remaining_time": "3:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 1918, "loss": 0.2265, "learning_rate": 3.904566632934955e-06, "epoch": 0.34456245520297124, "percentage": 34.46, "elapsed_time": "1:55:27", "remaining_time": "3:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 1918, "loss": 0.2064, "learning_rate": 3.900998550361271e-06, "epoch": 0.34508372971916335, "percentage": 34.52, "elapsed_time": "1:55:38", "remaining_time": "3:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 1918, "loss": 0.2009, "learning_rate": 3.897426302542331e-06, "epoch": 0.34560500423535545, "percentage": 34.57, "elapsed_time": "1:55:49", "remaining_time": "3:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 1918, "loss": 0.1984, "learning_rate": 3.893849900098623e-06, "epoch": 0.34612627875154756, "percentage": 34.62, "elapsed_time": "1:55:59", "remaining_time": "3:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1918, "loss": 0.2042, "learning_rate": 3.890269353662987e-06, "epoch": 0.3466475532677396, "percentage": 34.67, "elapsed_time": "1:56:09", "remaining_time": "3:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 1918, "loss": 0.2077, "learning_rate": 3.886684673880583e-06, "epoch": 0.3471688277839317, "percentage": 34.72, "elapsed_time": "1:56:20", "remaining_time": "3:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 1918, "loss": 0.2036, "learning_rate": 3.8830958714088595e-06, "epoch": 0.3476901023001238, "percentage": 34.78, "elapsed_time": "1:56:30", "remaining_time": "3:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 1918, "loss": 0.2034, "learning_rate": 3.879502956917524e-06, "epoch": 0.34821137681631587, "percentage": 34.83, "elapsed_time": "1:56:40", "remaining_time": "3:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 1918, "loss": 0.2075, "learning_rate": 3.875905941088505e-06, "epoch": 0.34873265133250797, "percentage": 34.88, "elapsed_time": "1:56:51", "remaining_time": "3:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1918, "loss": 0.1985, "learning_rate": 3.872304834615929e-06, "epoch": 0.3492539258487001, "percentage": 34.93, "elapsed_time": "1:57:01", "remaining_time": "3:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 1918, "loss": 0.1895, "learning_rate": 3.868699648206081e-06, "epoch": 0.3497752003648922, "percentage": 34.98, "elapsed_time": "1:57:10", "remaining_time": "3:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 1918, "loss": 0.207, "learning_rate": 3.8650903925773795e-06, "epoch": 0.35029647488108423, "percentage": 35.04, "elapsed_time": "1:57:22", "remaining_time": "3:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 1918, "loss": 0.2111, "learning_rate": 3.861477078460337e-06, "epoch": 0.35081774939727633, "percentage": 35.09, "elapsed_time": "1:57:33", "remaining_time": "3:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 1918, "loss": 0.2148, "learning_rate": 3.857859716597534e-06, "epoch": 0.35133902391346844, "percentage": 35.14, "elapsed_time": "1:57:42", "remaining_time": "3:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1918, "loss": 0.2196, "learning_rate": 3.854238317743586e-06, "epoch": 0.35186029842966055, "percentage": 35.19, "elapsed_time": "1:57:53", "remaining_time": "3:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 1918, "loss": 0.2105, "learning_rate": 3.8506128926651095e-06, "epoch": 0.3523815729458526, "percentage": 35.25, "elapsed_time": "1:58:03", "remaining_time": "3:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 1918, "loss": 0.2132, "learning_rate": 3.846983452140689e-06, "epoch": 0.3529028474620447, "percentage": 35.3, "elapsed_time": "1:58:13", "remaining_time": "3:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 1918, "loss": 0.2053, "learning_rate": 3.843350006960852e-06, "epoch": 0.3534241219782368, "percentage": 35.35, "elapsed_time": "1:58:24", "remaining_time": "3:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 1918, "loss": 0.2102, "learning_rate": 3.83971256792803e-06, "epoch": 0.35394539649442885, "percentage": 35.4, "elapsed_time": "1:58:35", "remaining_time": "3:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1918, "loss": 0.2021, "learning_rate": 3.836071145856526e-06, "epoch": 0.35446667101062096, "percentage": 35.45, "elapsed_time": "1:58:45", "remaining_time": "3:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 1918, "loss": 0.2034, "learning_rate": 3.832425751572488e-06, "epoch": 0.35498794552681306, "percentage": 35.51, "elapsed_time": "1:58:54", "remaining_time": "3:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 1918, "loss": 0.1993, "learning_rate": 3.828776395913872e-06, "epoch": 0.35550922004300517, "percentage": 35.56, "elapsed_time": "1:59:03", "remaining_time": "3:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 1918, "loss": 0.2096, "learning_rate": 3.825123089730413e-06, "epoch": 0.3560304945591972, "percentage": 35.61, "elapsed_time": "1:59:14", "remaining_time": "3:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 1918, "loss": 0.1915, "learning_rate": 3.821465843883588e-06, "epoch": 0.3565517690753893, "percentage": 35.66, "elapsed_time": "1:59:24", "remaining_time": "3:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1918, "loss": 0.1905, "learning_rate": 3.81780466924659e-06, "epoch": 0.35707304359158143, "percentage": 35.71, "elapsed_time": "1:59:34", "remaining_time": "3:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 1918, "loss": 0.1969, "learning_rate": 3.814139576704291e-06, "epoch": 0.3575943181077735, "percentage": 35.77, "elapsed_time": "1:59:44", "remaining_time": "3:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 1918, "loss": 0.2115, "learning_rate": 3.810470577153212e-06, "epoch": 0.3581155926239656, "percentage": 35.82, "elapsed_time": "1:59:56", "remaining_time": "3:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 1918, "loss": 0.1997, "learning_rate": 3.8067976815014885e-06, "epoch": 0.3586368671401577, "percentage": 35.87, "elapsed_time": "2:00:07", "remaining_time": "3:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 1918, "loss": 0.2077, "learning_rate": 3.8031209006688397e-06, "epoch": 0.3591581416563498, "percentage": 35.92, "elapsed_time": "2:00:18", "remaining_time": "3:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1918, "loss": 0.2079, "learning_rate": 3.7994402455865375e-06, "epoch": 0.35967941617254184, "percentage": 35.97, "elapsed_time": "2:00:29", "remaining_time": "3:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 1918, "loss": 0.2017, "learning_rate": 3.795755727197368e-06, "epoch": 0.36020069068873395, "percentage": 36.03, "elapsed_time": "2:00:39", "remaining_time": "3:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 1918, "loss": 0.2221, "learning_rate": 3.7920673564556083e-06, "epoch": 0.36072196520492605, "percentage": 36.08, "elapsed_time": "2:00:49", "remaining_time": "3:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 1918, "loss": 0.1955, "learning_rate": 3.788375144326985e-06, "epoch": 0.36124323972111816, "percentage": 36.13, "elapsed_time": "2:01:01", "remaining_time": "3:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 1918, "loss": 0.2116, "learning_rate": 3.784679101788647e-06, "epoch": 0.3617645142373102, "percentage": 36.18, "elapsed_time": "2:01:11", "remaining_time": "3:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1918, "loss": 0.214, "learning_rate": 3.78097923982913e-06, "epoch": 0.3622857887535023, "percentage": 36.24, "elapsed_time": "2:01:22", "remaining_time": "3:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 1918, "loss": 0.1905, "learning_rate": 3.7772755694483265e-06, "epoch": 0.3628070632696944, "percentage": 36.29, "elapsed_time": "2:01:32", "remaining_time": "3:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 1918, "loss": 0.1971, "learning_rate": 3.7735681016574504e-06, "epoch": 0.36332833778588647, "percentage": 36.34, "elapsed_time": "2:01:41", "remaining_time": "3:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 1918, "loss": 0.1996, "learning_rate": 3.7698568474790064e-06, "epoch": 0.3638496123020786, "percentage": 36.39, "elapsed_time": "2:01:52", "remaining_time": "3:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 1918, "loss": 0.2161, "learning_rate": 3.766141817946757e-06, "epoch": 0.3643708868182707, "percentage": 36.44, "elapsed_time": "2:02:02", "remaining_time": "3:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1918, "loss": 0.2008, "learning_rate": 3.7624230241056854e-06, "epoch": 0.3648921613344628, "percentage": 36.5, "elapsed_time": "2:02:13", "remaining_time": "3:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 1918, "loss": 0.2293, "learning_rate": 3.7587004770119716e-06, "epoch": 0.36541343585065483, "percentage": 36.55, "elapsed_time": "2:02:24", "remaining_time": "3:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 1918, "loss": 0.2015, "learning_rate": 3.7549741877329504e-06, "epoch": 0.36593471036684694, "percentage": 36.6, "elapsed_time": "2:02:34", "remaining_time": "3:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 1918, "loss": 0.2097, "learning_rate": 3.7512441673470836e-06, "epoch": 0.36645598488303904, "percentage": 36.65, "elapsed_time": "2:02:44", "remaining_time": "3:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 1918, "loss": 0.1945, "learning_rate": 3.747510426943925e-06, "epoch": 0.3669772593992311, "percentage": 36.7, "elapsed_time": "2:02:55", "remaining_time": "3:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1918, "loss": 0.2033, "learning_rate": 3.7437729776240894e-06, "epoch": 0.3674985339154232, "percentage": 36.76, "elapsed_time": "2:03:05", "remaining_time": "3:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 1918, "loss": 0.187, "learning_rate": 3.740031830499219e-06, "epoch": 0.3680198084316153, "percentage": 36.81, "elapsed_time": "2:03:14", "remaining_time": "3:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 1918, "loss": 0.2017, "learning_rate": 3.7362869966919467e-06, "epoch": 0.3685410829478074, "percentage": 36.86, "elapsed_time": "2:03:26", "remaining_time": "3:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 1918, "loss": 0.2112, "learning_rate": 3.7325384873358695e-06, "epoch": 0.36906235746399946, "percentage": 36.91, "elapsed_time": "2:03:35", "remaining_time": "3:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 1918, "loss": 0.2117, "learning_rate": 3.7287863135755098e-06, "epoch": 0.36958363198019156, "percentage": 36.97, "elapsed_time": "2:03:46", "remaining_time": "3:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1918, "loss": 0.1984, "learning_rate": 3.7250304865662857e-06, "epoch": 0.37010490649638367, "percentage": 37.02, "elapsed_time": "2:03:56", "remaining_time": "3:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 1918, "loss": 0.2079, "learning_rate": 3.7212710174744753e-06, "epoch": 0.3706261810125758, "percentage": 37.07, "elapsed_time": "2:04:06", "remaining_time": "3:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 1918, "loss": 0.2022, "learning_rate": 3.7175079174771872e-06, "epoch": 0.3711474555287678, "percentage": 37.12, "elapsed_time": "2:04:16", "remaining_time": "3:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 1918, "loss": 0.2009, "learning_rate": 3.713741197762323e-06, "epoch": 0.3716687300449599, "percentage": 37.17, "elapsed_time": "2:04:28", "remaining_time": "3:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 1918, "loss": 0.1955, "learning_rate": 3.7099708695285436e-06, "epoch": 0.37219000456115203, "percentage": 37.23, "elapsed_time": "2:04:38", "remaining_time": "3:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1918, "loss": 0.198, "learning_rate": 3.706196943985245e-06, "epoch": 0.3727112790773441, "percentage": 37.28, "elapsed_time": "2:04:48", "remaining_time": "3:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 1918, "loss": 0.2183, "learning_rate": 3.7024194323525115e-06, "epoch": 0.3732325535935362, "percentage": 37.33, "elapsed_time": "2:04:58", "remaining_time": "3:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 1918, "loss": 0.1982, "learning_rate": 3.6986383458610925e-06, "epoch": 0.3737538281097283, "percentage": 37.38, "elapsed_time": "2:05:06", "remaining_time": "3:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 1918, "loss": 0.1944, "learning_rate": 3.694853695752364e-06, "epoch": 0.3742751026259204, "percentage": 37.43, "elapsed_time": "2:05:16", "remaining_time": "3:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 1918, "loss": 0.2017, "learning_rate": 3.6910654932782984e-06, "epoch": 0.37479637714211245, "percentage": 37.49, "elapsed_time": "2:05:27", "remaining_time": "3:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1918, "loss": 0.2002, "learning_rate": 3.6872737497014286e-06, "epoch": 0.37531765165830455, "percentage": 37.54, "elapsed_time": "2:05:37", "remaining_time": "3:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 1918, "loss": 0.1982, "learning_rate": 3.6834784762948156e-06, "epoch": 0.37583892617449666, "percentage": 37.59, "elapsed_time": "2:05:49", "remaining_time": "3:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 1918, "loss": 0.2071, "learning_rate": 3.6796796843420134e-06, "epoch": 0.3763602006906887, "percentage": 37.64, "elapsed_time": "2:06:00", "remaining_time": "3:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 1918, "loss": 0.1884, "learning_rate": 3.67587738513704e-06, "epoch": 0.3768814752068808, "percentage": 37.7, "elapsed_time": "2:06:11", "remaining_time": "3:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 1918, "loss": 0.1995, "learning_rate": 3.672071589984337e-06, "epoch": 0.3774027497230729, "percentage": 37.75, "elapsed_time": "2:06:21", "remaining_time": "3:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1918, "loss": 0.1981, "learning_rate": 3.6682623101987423e-06, "epoch": 0.377924024239265, "percentage": 37.8, "elapsed_time": "2:06:31", "remaining_time": "3:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 1918, "loss": 0.2, "learning_rate": 3.664449557105454e-06, "epoch": 0.37844529875545707, "percentage": 37.85, "elapsed_time": "2:06:42", "remaining_time": "3:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 1918, "loss": 0.2091, "learning_rate": 3.6606333420399933e-06, "epoch": 0.3789665732716492, "percentage": 37.9, "elapsed_time": "2:06:52", "remaining_time": "3:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 1918, "loss": 0.2079, "learning_rate": 3.6568136763481766e-06, "epoch": 0.3794878477878413, "percentage": 37.96, "elapsed_time": "2:07:03", "remaining_time": "3:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 1918, "loss": 0.2074, "learning_rate": 3.652990571386079e-06, "epoch": 0.3800091223040334, "percentage": 38.01, "elapsed_time": "2:07:13", "remaining_time": "3:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1918, "loss": 0.1935, "learning_rate": 3.649164038520001e-06, "epoch": 0.38053039682022544, "percentage": 38.06, "elapsed_time": "2:07:25", "remaining_time": "3:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 1918, "loss": 0.2052, "learning_rate": 3.6453340891264344e-06, "epoch": 0.38105167133641754, "percentage": 38.11, "elapsed_time": "2:07:34", "remaining_time": "3:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 1918, "loss": 0.205, "learning_rate": 3.641500734592026e-06, "epoch": 0.38157294585260965, "percentage": 38.16, "elapsed_time": "2:07:44", "remaining_time": "3:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 1918, "loss": 0.2281, "learning_rate": 3.63766398631355e-06, "epoch": 0.3820942203688017, "percentage": 38.22, "elapsed_time": "2:07:54", "remaining_time": "3:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 1918, "loss": 0.1834, "learning_rate": 3.633823855697869e-06, "epoch": 0.3826154948849938, "percentage": 38.27, "elapsed_time": "2:08:05", "remaining_time": "3:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1918, "loss": 0.2101, "learning_rate": 3.6299803541619e-06, "epoch": 0.3831367694011859, "percentage": 38.32, "elapsed_time": "2:08:14", "remaining_time": "3:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 1918, "loss": 0.1819, "learning_rate": 3.6261334931325833e-06, "epoch": 0.383658043917378, "percentage": 38.37, "elapsed_time": "2:08:24", "remaining_time": "3:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 1918, "loss": 0.1969, "learning_rate": 3.622283284046847e-06, "epoch": 0.38417931843357006, "percentage": 38.43, "elapsed_time": "2:08:35", "remaining_time": "3:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 1918, "loss": 0.1955, "learning_rate": 3.618429738351574e-06, "epoch": 0.38470059294976217, "percentage": 38.48, "elapsed_time": "2:08:46", "remaining_time": "3:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 1918, "loss": 0.2083, "learning_rate": 3.6145728675035658e-06, "epoch": 0.38522186746595427, "percentage": 38.53, "elapsed_time": "2:08:57", "remaining_time": "3:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1918, "loss": 0.1959, "learning_rate": 3.6107126829695093e-06, "epoch": 0.3857431419821463, "percentage": 38.58, "elapsed_time": "2:09:08", "remaining_time": "3:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 1918, "loss": 0.1981, "learning_rate": 3.6068491962259457e-06, "epoch": 0.3862644164983384, "percentage": 38.63, "elapsed_time": "2:09:17", "remaining_time": "3:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 1918, "loss": 0.1905, "learning_rate": 3.6029824187592304e-06, "epoch": 0.38678569101453053, "percentage": 38.69, "elapsed_time": "2:09:27", "remaining_time": "3:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 1918, "loss": 0.1946, "learning_rate": 3.599112362065506e-06, "epoch": 0.38730696553072264, "percentage": 38.74, "elapsed_time": "2:09:38", "remaining_time": "3:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 1918, "loss": 0.1982, "learning_rate": 3.5952390376506614e-06, "epoch": 0.3878282400469147, "percentage": 38.79, "elapsed_time": "2:09:49", "remaining_time": "3:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1918, "loss": 0.2241, "learning_rate": 3.591362457030302e-06, "epoch": 0.3883495145631068, "percentage": 38.84, "elapsed_time": "2:09:59", "remaining_time": "3:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 1918, "loss": 0.2158, "learning_rate": 3.5874826317297135e-06, "epoch": 0.3888707890792989, "percentage": 38.89, "elapsed_time": "2:10:10", "remaining_time": "3:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 1918, "loss": 0.2187, "learning_rate": 3.5835995732838292e-06, "epoch": 0.389392063595491, "percentage": 38.95, "elapsed_time": "2:10:20", "remaining_time": "3:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 1918, "loss": 0.1909, "learning_rate": 3.579713293237194e-06, "epoch": 0.38991333811168305, "percentage": 39.0, "elapsed_time": "2:10:30", "remaining_time": "3:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 1918, "loss": 0.2048, "learning_rate": 3.5758238031439306e-06, "epoch": 0.39043461262787515, "percentage": 39.05, "elapsed_time": "2:10:40", "remaining_time": "3:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1918, "loss": 0.195, "learning_rate": 3.5719311145677057e-06, "epoch": 0.39095588714406726, "percentage": 39.1, "elapsed_time": "2:10:50", "remaining_time": "3:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 1918, "loss": 0.2078, "learning_rate": 3.5680352390816942e-06, "epoch": 0.3914771616602593, "percentage": 39.16, "elapsed_time": "2:11:01", "remaining_time": "3:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 1918, "loss": 0.2055, "learning_rate": 3.5641361882685487e-06, "epoch": 0.3919984361764514, "percentage": 39.21, "elapsed_time": "2:11:11", "remaining_time": "3:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 1918, "loss": 0.2047, "learning_rate": 3.5602339737203593e-06, "epoch": 0.3925197106926435, "percentage": 39.26, "elapsed_time": "2:11:20", "remaining_time": "3:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 1918, "loss": 0.2145, "learning_rate": 3.5563286070386237e-06, "epoch": 0.3930409852088356, "percentage": 39.31, "elapsed_time": "2:11:31", "remaining_time": "3:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1918, "loss": 0.2122, "learning_rate": 3.5524200998342095e-06, "epoch": 0.3935622597250277, "percentage": 39.36, "elapsed_time": "2:11:41", "remaining_time": "3:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 1918, "loss": 0.1982, "learning_rate": 3.5485084637273225e-06, "epoch": 0.3940835342412198, "percentage": 39.42, "elapsed_time": "2:11:52", "remaining_time": "3:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 1918, "loss": 0.2047, "learning_rate": 3.5445937103474713e-06, "epoch": 0.3946048087574119, "percentage": 39.47, "elapsed_time": "2:12:03", "remaining_time": "3:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 1918, "loss": 0.194, "learning_rate": 3.5406758513334316e-06, "epoch": 0.39512608327360393, "percentage": 39.52, "elapsed_time": "2:12:13", "remaining_time": "3:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 1918, "loss": 0.2125, "learning_rate": 3.536754898333211e-06, "epoch": 0.39564735778979604, "percentage": 39.57, "elapsed_time": "2:12:24", "remaining_time": "3:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1918, "loss": 0.2018, "learning_rate": 3.532830863004018e-06, "epoch": 0.39616863230598814, "percentage": 39.62, "elapsed_time": "2:12:35", "remaining_time": "3:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 1918, "loss": 0.1793, "learning_rate": 3.5289037570122246e-06, "epoch": 0.39668990682218025, "percentage": 39.68, "elapsed_time": "2:12:45", "remaining_time": "3:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 1918, "loss": 0.2215, "learning_rate": 3.5249735920333312e-06, "epoch": 0.3972111813383723, "percentage": 39.73, "elapsed_time": "2:12:55", "remaining_time": "3:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 1918, "loss": 0.212, "learning_rate": 3.521040379751933e-06, "epoch": 0.3977324558545644, "percentage": 39.78, "elapsed_time": "2:13:06", "remaining_time": "3:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 1918, "loss": 0.2093, "learning_rate": 3.517104131861685e-06, "epoch": 0.3982537303707565, "percentage": 39.83, "elapsed_time": "2:13:16", "remaining_time": "3:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1918, "loss": 0.2047, "learning_rate": 3.513164860065267e-06, "epoch": 0.3987750048869486, "percentage": 39.89, "elapsed_time": "2:13:27", "remaining_time": "3:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 1918, "loss": 0.2164, "learning_rate": 3.509222576074349e-06, "epoch": 0.39929627940314066, "percentage": 39.94, "elapsed_time": "2:13:37", "remaining_time": "3:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 1918, "loss": 0.197, "learning_rate": 3.5052772916095584e-06, "epoch": 0.39981755391933277, "percentage": 39.99, "elapsed_time": "2:13:47", "remaining_time": "3:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 1918, "loss": 0.1848, "learning_rate": 3.50132901840044e-06, "epoch": 0.4003388284355249, "percentage": 40.04, "elapsed_time": "2:13:57", "remaining_time": "3:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 1918, "loss": 0.227, "learning_rate": 3.4973777681854265e-06, "epoch": 0.4008601029517169, "percentage": 40.09, "elapsed_time": "2:14:08", "remaining_time": "3:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1918, "loss": 0.2007, "learning_rate": 3.4934235527118e-06, "epoch": 0.40138137746790903, "percentage": 40.15, "elapsed_time": "2:14:17", "remaining_time": "3:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 1918, "loss": 0.2062, "learning_rate": 3.4894663837356607e-06, "epoch": 0.40190265198410113, "percentage": 40.2, "elapsed_time": "2:14:28", "remaining_time": "3:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 1918, "loss": 0.2174, "learning_rate": 3.485506273021887e-06, "epoch": 0.40242392650029324, "percentage": 40.25, "elapsed_time": "2:14:38", "remaining_time": "3:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 1918, "loss": 0.2265, "learning_rate": 3.4815432323441043e-06, "epoch": 0.4029452010164853, "percentage": 40.3, "elapsed_time": "2:14:48", "remaining_time": "3:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 1918, "loss": 0.2058, "learning_rate": 3.47757727348465e-06, "epoch": 0.4034664755326774, "percentage": 40.35, "elapsed_time": "2:14:59", "remaining_time": "3:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1918, "loss": 0.2093, "learning_rate": 3.4736084082345355e-06, "epoch": 0.4039877500488695, "percentage": 40.41, "elapsed_time": "2:15:09", "remaining_time": "3:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 1918, "loss": 0.2004, "learning_rate": 3.4696366483934156e-06, "epoch": 0.40450902456506155, "percentage": 40.46, "elapsed_time": "2:15:20", "remaining_time": "3:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 1918, "loss": 0.205, "learning_rate": 3.465662005769548e-06, "epoch": 0.40503029908125365, "percentage": 40.51, "elapsed_time": "2:15:30", "remaining_time": "3:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 1918, "loss": 0.195, "learning_rate": 3.461684492179763e-06, "epoch": 0.40555157359744576, "percentage": 40.56, "elapsed_time": "2:15:40", "remaining_time": "3:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 1918, "loss": 0.1955, "learning_rate": 3.4577041194494253e-06, "epoch": 0.40607284811363786, "percentage": 40.62, "elapsed_time": "2:15:50", "remaining_time": "3:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1918, "loss": 0.1829, "learning_rate": 3.4537208994124015e-06, "epoch": 0.4065941226298299, "percentage": 40.67, "elapsed_time": "2:16:01", "remaining_time": "3:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 1918, "loss": 0.2034, "learning_rate": 3.449734843911022e-06, "epoch": 0.407115397146022, "percentage": 40.72, "elapsed_time": "2:16:10", "remaining_time": "3:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 1918, "loss": 0.208, "learning_rate": 3.4457459647960477e-06, "epoch": 0.4076366716622141, "percentage": 40.77, "elapsed_time": "2:16:21", "remaining_time": "3:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 1918, "loss": 0.1993, "learning_rate": 3.441754273926634e-06, "epoch": 0.40815794617840623, "percentage": 40.82, "elapsed_time": "2:16:32", "remaining_time": "3:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 1918, "loss": 0.202, "learning_rate": 3.4377597831702962e-06, "epoch": 0.4086792206945983, "percentage": 40.88, "elapsed_time": "2:16:42", "remaining_time": "3:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1918, "loss": 0.1923, "learning_rate": 3.433762504402874e-06, "epoch": 0.4092004952107904, "percentage": 40.93, "elapsed_time": "2:16:53", "remaining_time": "3:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 1918, "loss": 0.1877, "learning_rate": 3.429762449508495e-06, "epoch": 0.4097217697269825, "percentage": 40.98, "elapsed_time": "2:17:03", "remaining_time": "3:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 1918, "loss": 0.1939, "learning_rate": 3.425759630379541e-06, "epoch": 0.41024304424317454, "percentage": 41.03, "elapsed_time": "2:17:13", "remaining_time": "3:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 1918, "loss": 0.1932, "learning_rate": 3.421754058916612e-06, "epoch": 0.41076431875936664, "percentage": 41.08, "elapsed_time": "2:17:23", "remaining_time": "3:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 1918, "loss": 0.2186, "learning_rate": 3.4177457470284916e-06, "epoch": 0.41128559327555875, "percentage": 41.14, "elapsed_time": "2:17:33", "remaining_time": "3:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1918, "loss": 0.2025, "learning_rate": 3.4137347066321097e-06, "epoch": 0.41180686779175085, "percentage": 41.19, "elapsed_time": "2:17:43", "remaining_time": "3:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 1918, "loss": 0.2136, "learning_rate": 3.4097209496525087e-06, "epoch": 0.4123281423079429, "percentage": 41.24, "elapsed_time": "2:17:54", "remaining_time": "3:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 1918, "loss": 0.1987, "learning_rate": 3.4057044880228064e-06, "epoch": 0.412849416824135, "percentage": 41.29, "elapsed_time": "2:18:05", "remaining_time": "3:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 1918, "loss": 0.2165, "learning_rate": 3.4016853336841638e-06, "epoch": 0.4133706913403271, "percentage": 41.35, "elapsed_time": "2:18:14", "remaining_time": "3:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 1918, "loss": 0.2091, "learning_rate": 3.397663498585747e-06, "epoch": 0.41389196585651916, "percentage": 41.4, "elapsed_time": "2:18:23", "remaining_time": "3:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1918, "loss": 0.1996, "learning_rate": 3.39363899468469e-06, "epoch": 0.41441324037271127, "percentage": 41.45, "elapsed_time": "2:18:36", "remaining_time": "3:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 1918, "loss": 0.1855, "learning_rate": 3.3896118339460635e-06, "epoch": 0.41493451488890337, "percentage": 41.5, "elapsed_time": "2:18:45", "remaining_time": "3:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 1918, "loss": 0.2087, "learning_rate": 3.385582028342837e-06, "epoch": 0.4154557894050955, "percentage": 41.55, "elapsed_time": "2:18:56", "remaining_time": "3:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 1918, "loss": 0.2102, "learning_rate": 3.3815495898558424e-06, "epoch": 0.4159770639212875, "percentage": 41.61, "elapsed_time": "2:19:07", "remaining_time": "3:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 1918, "loss": 0.1834, "learning_rate": 3.377514530473739e-06, "epoch": 0.41649833843747963, "percentage": 41.66, "elapsed_time": "2:19:19", "remaining_time": "3:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1918, "loss": 0.1974, "learning_rate": 3.3734768621929805e-06, "epoch": 0.41701961295367174, "percentage": 41.71, "elapsed_time": "2:19:28", "remaining_time": "3:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 1918, "loss": 0.1978, "learning_rate": 3.369436597017774e-06, "epoch": 0.41754088746986384, "percentage": 41.76, "elapsed_time": "2:19:39", "remaining_time": "3:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 1918, "loss": 0.2013, "learning_rate": 3.3653937469600483e-06, "epoch": 0.4180621619860559, "percentage": 41.81, "elapsed_time": "2:19:50", "remaining_time": "3:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 1918, "loss": 0.1954, "learning_rate": 3.361348324039419e-06, "epoch": 0.418583436502248, "percentage": 41.87, "elapsed_time": "2:20:00", "remaining_time": "3:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 1918, "loss": 0.1963, "learning_rate": 3.3573003402831487e-06, "epoch": 0.4191047110184401, "percentage": 41.92, "elapsed_time": "2:20:11", "remaining_time": "3:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1918, "loss": 0.2094, "learning_rate": 3.353249807726115e-06, "epoch": 0.41962598553463215, "percentage": 41.97, "elapsed_time": "2:20:22", "remaining_time": "3:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 1918, "loss": 0.2095, "learning_rate": 3.349196738410771e-06, "epoch": 0.42014726005082426, "percentage": 42.02, "elapsed_time": "2:20:33", "remaining_time": "3:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 1918, "loss": 0.2022, "learning_rate": 3.3451411443871145e-06, "epoch": 0.42066853456701636, "percentage": 42.08, "elapsed_time": "2:20:44", "remaining_time": "3:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 1918, "loss": 0.2184, "learning_rate": 3.341083037712649e-06, "epoch": 0.42118980908320847, "percentage": 42.13, "elapsed_time": "2:20:53", "remaining_time": "3:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 1918, "loss": 0.1967, "learning_rate": 3.337022430452346e-06, "epoch": 0.4217110835994005, "percentage": 42.18, "elapsed_time": "2:21:04", "remaining_time": "3:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1918, "loss": 0.1877, "learning_rate": 3.3329593346786125e-06, "epoch": 0.4222323581155926, "percentage": 42.23, "elapsed_time": "2:21:14", "remaining_time": "3:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 1918, "loss": 0.2083, "learning_rate": 3.328893762471255e-06, "epoch": 0.4227536326317847, "percentage": 42.28, "elapsed_time": "2:21:25", "remaining_time": "3:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 1918, "loss": 0.1969, "learning_rate": 3.324825725917442e-06, "epoch": 0.42327490714797683, "percentage": 42.34, "elapsed_time": "2:21:34", "remaining_time": "3:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 1918, "loss": 0.2024, "learning_rate": 3.320755237111669e-06, "epoch": 0.4237961816641689, "percentage": 42.39, "elapsed_time": "2:21:45", "remaining_time": "3:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 1918, "loss": 0.2061, "learning_rate": 3.316682308155721e-06, "epoch": 0.424317456180361, "percentage": 42.44, "elapsed_time": "2:21:54", "remaining_time": "3:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1918, "loss": 0.2134, "learning_rate": 3.312606951158638e-06, "epoch": 0.4248387306965531, "percentage": 42.49, "elapsed_time": "2:22:06", "remaining_time": "3:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 1918, "loss": 0.1918, "learning_rate": 3.308529178236679e-06, "epoch": 0.42536000521274514, "percentage": 42.54, "elapsed_time": "2:22:16", "remaining_time": "3:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 1918, "loss": 0.1989, "learning_rate": 3.304449001513287e-06, "epoch": 0.42588127972893725, "percentage": 42.6, "elapsed_time": "2:22:27", "remaining_time": "3:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 1918, "loss": 0.1989, "learning_rate": 3.3003664331190487e-06, "epoch": 0.42640255424512935, "percentage": 42.65, "elapsed_time": "2:22:36", "remaining_time": "3:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 1918, "loss": 0.1978, "learning_rate": 3.296281485191665e-06, "epoch": 0.42692382876132146, "percentage": 42.7, "elapsed_time": "2:22:47", "remaining_time": "3:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1918, "loss": 0.215, "learning_rate": 3.292194169875908e-06, "epoch": 0.4274451032775135, "percentage": 42.75, "elapsed_time": "2:22:57", "remaining_time": "3:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 1918, "loss": 0.2011, "learning_rate": 3.2881044993235893e-06, "epoch": 0.4279663777937056, "percentage": 42.81, "elapsed_time": "2:23:07", "remaining_time": "3:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 1918, "loss": 0.2068, "learning_rate": 3.284012485693524e-06, "epoch": 0.4284876523098977, "percentage": 42.86, "elapsed_time": "2:23:18", "remaining_time": "3:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 1918, "loss": 0.2105, "learning_rate": 3.279918141151492e-06, "epoch": 0.42900892682608976, "percentage": 42.91, "elapsed_time": "2:23:29", "remaining_time": "3:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 1918, "loss": 0.1845, "learning_rate": 3.2758214778702026e-06, "epoch": 0.42953020134228187, "percentage": 42.96, "elapsed_time": "2:23:37", "remaining_time": "3:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1918, "loss": 0.2034, "learning_rate": 3.2717225080292598e-06, "epoch": 0.430051475858474, "percentage": 43.01, "elapsed_time": "2:23:48", "remaining_time": "3:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 1918, "loss": 0.1993, "learning_rate": 3.2676212438151256e-06, "epoch": 0.4305727503746661, "percentage": 43.07, "elapsed_time": "2:23:59", "remaining_time": "3:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 1918, "loss": 0.1974, "learning_rate": 3.2635176974210824e-06, "epoch": 0.43109402489085813, "percentage": 43.12, "elapsed_time": "2:24:09", "remaining_time": "3:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 1918, "loss": 0.2066, "learning_rate": 3.2594118810471982e-06, "epoch": 0.43161529940705023, "percentage": 43.17, "elapsed_time": "2:24:19", "remaining_time": "3:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 1918, "loss": 0.2067, "learning_rate": 3.2553038069002885e-06, "epoch": 0.43213657392324234, "percentage": 43.22, "elapsed_time": "2:24:28", "remaining_time": "3:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1918, "loss": 0.2033, "learning_rate": 3.2511934871938825e-06, "epoch": 0.43265784843943444, "percentage": 43.27, "elapsed_time": "2:24:39", "remaining_time": "3:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 1918, "loss": 0.199, "learning_rate": 3.247080934148186e-06, "epoch": 0.4331791229556265, "percentage": 43.33, "elapsed_time": "2:24:49", "remaining_time": "3:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 1918, "loss": 0.201, "learning_rate": 3.242966159990044e-06, "epoch": 0.4337003974718186, "percentage": 43.38, "elapsed_time": "2:24:59", "remaining_time": "3:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 1918, "loss": 0.1937, "learning_rate": 3.238849176952904e-06, "epoch": 0.4342216719880107, "percentage": 43.43, "elapsed_time": "2:25:11", "remaining_time": "3:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 1918, "loss": 0.1908, "learning_rate": 3.2347299972767824e-06, "epoch": 0.43474294650420275, "percentage": 43.48, "elapsed_time": "2:25:21", "remaining_time": "3:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1918, "loss": 0.1956, "learning_rate": 3.230608633208225e-06, "epoch": 0.43526422102039486, "percentage": 43.53, "elapsed_time": "2:25:31", "remaining_time": "3:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 1918, "loss": 0.195, "learning_rate": 3.226485097000273e-06, "epoch": 0.43578549553658696, "percentage": 43.59, "elapsed_time": "2:25:42", "remaining_time": "3:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 1918, "loss": 0.2202, "learning_rate": 3.2223594009124247e-06, "epoch": 0.43630677005277907, "percentage": 43.64, "elapsed_time": "2:25:52", "remaining_time": "3:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 1918, "loss": 0.1916, "learning_rate": 3.2182315572105995e-06, "epoch": 0.4368280445689711, "percentage": 43.69, "elapsed_time": "2:26:02", "remaining_time": "3:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 1918, "loss": 0.2037, "learning_rate": 3.2141015781671025e-06, "epoch": 0.4373493190851632, "percentage": 43.74, "elapsed_time": "2:26:12", "remaining_time": "3:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1918, "loss": 0.1969, "learning_rate": 3.209969476060587e-06, "epoch": 0.43787059360135533, "percentage": 43.8, "elapsed_time": "2:26:23", "remaining_time": "3:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 1918, "loss": 0.216, "learning_rate": 3.2058352631760198e-06, "epoch": 0.4383918681175474, "percentage": 43.85, "elapsed_time": "2:26:34", "remaining_time": "3:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 1918, "loss": 0.1972, "learning_rate": 3.2016989518046397e-06, "epoch": 0.4389131426337395, "percentage": 43.9, "elapsed_time": "2:26:44", "remaining_time": "3:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 1918, "loss": 0.1958, "learning_rate": 3.1975605542439276e-06, "epoch": 0.4394344171499316, "percentage": 43.95, "elapsed_time": "2:26:55", "remaining_time": "3:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 1918, "loss": 0.2063, "learning_rate": 3.1934200827975654e-06, "epoch": 0.4399556916661237, "percentage": 44.0, "elapsed_time": "2:27:05", "remaining_time": "3:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1918, "loss": 0.1977, "learning_rate": 3.1892775497754014e-06, "epoch": 0.44047696618231574, "percentage": 44.06, "elapsed_time": "2:27:16", "remaining_time": "3:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 1918, "loss": 0.2075, "learning_rate": 3.1851329674934116e-06, "epoch": 0.44099824069850785, "percentage": 44.11, "elapsed_time": "2:27:26", "remaining_time": "3:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 1918, "loss": 0.1982, "learning_rate": 3.1809863482736663e-06, "epoch": 0.44151951521469995, "percentage": 44.16, "elapsed_time": "2:27:38", "remaining_time": "3:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 1918, "loss": 0.1961, "learning_rate": 3.176837704444291e-06, "epoch": 0.44204078973089206, "percentage": 44.21, "elapsed_time": "2:27:48", "remaining_time": "3:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 1918, "loss": 0.2122, "learning_rate": 3.1726870483394312e-06, "epoch": 0.4425620642470841, "percentage": 44.26, "elapsed_time": "2:27:59", "remaining_time": "3:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1918, "loss": 0.2044, "learning_rate": 3.168534392299214e-06, "epoch": 0.4430833387632762, "percentage": 44.32, "elapsed_time": "2:28:10", "remaining_time": "3:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 1918, "loss": 0.1938, "learning_rate": 3.1643797486697116e-06, "epoch": 0.4436046132794683, "percentage": 44.37, "elapsed_time": "2:28:20", "remaining_time": "3:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 1918, "loss": 0.1754, "learning_rate": 3.1602231298029074e-06, "epoch": 0.44412588779566037, "percentage": 44.42, "elapsed_time": "2:28:30", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 1918, "loss": 0.1934, "learning_rate": 3.1560645480566566e-06, "epoch": 0.4446471623118525, "percentage": 44.47, "elapsed_time": "2:28:41", "remaining_time": "3:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 1918, "loss": 0.2066, "learning_rate": 3.15190401579465e-06, "epoch": 0.4451684368280446, "percentage": 44.53, "elapsed_time": "2:28:51", "remaining_time": "3:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1918, "loss": 0.184, "learning_rate": 3.1477415453863772e-06, "epoch": 0.4456897113442367, "percentage": 44.58, "elapsed_time": "2:29:02", "remaining_time": "3:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 1918, "loss": 0.1899, "learning_rate": 3.143577149207091e-06, "epoch": 0.44621098586042873, "percentage": 44.63, "elapsed_time": "2:29:12", "remaining_time": "3:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 1918, "loss": 0.1962, "learning_rate": 3.139410839637767e-06, "epoch": 0.44673226037662084, "percentage": 44.68, "elapsed_time": "2:29:23", "remaining_time": "3:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 1918, "loss": 0.2018, "learning_rate": 3.135242629065073e-06, "epoch": 0.44725353489281294, "percentage": 44.73, "elapsed_time": "2:29:34", "remaining_time": "3:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 1918, "loss": 0.2001, "learning_rate": 3.131072529881326e-06, "epoch": 0.447774809409005, "percentage": 44.79, "elapsed_time": "2:29:44", "remaining_time": "3:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1918, "loss": 0.1917, "learning_rate": 3.126900554484459e-06, "epoch": 0.4482960839251971, "percentage": 44.84, "elapsed_time": "2:29:54", "remaining_time": "3:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 1918, "loss": 0.1945, "learning_rate": 3.122726715277983e-06, "epoch": 0.4488173584413892, "percentage": 44.89, "elapsed_time": "2:30:04", "remaining_time": "3:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 1918, "loss": 0.1887, "learning_rate": 3.1185510246709487e-06, "epoch": 0.4493386329575813, "percentage": 44.94, "elapsed_time": "2:30:14", "remaining_time": "3:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 1918, "loss": 0.201, "learning_rate": 3.1143734950779155e-06, "epoch": 0.44985990747377336, "percentage": 44.99, "elapsed_time": "2:30:24", "remaining_time": "3:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 1918, "loss": 0.1978, "learning_rate": 3.1101941389189045e-06, "epoch": 0.45038118198996546, "percentage": 45.05, "elapsed_time": "2:30:35", "remaining_time": "3:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1918, "loss": 0.2033, "learning_rate": 3.106012968619371e-06, "epoch": 0.45090245650615757, "percentage": 45.1, "elapsed_time": "2:30:44", "remaining_time": "3:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 1918, "loss": 0.2013, "learning_rate": 3.1018299966101624e-06, "epoch": 0.4514237310223497, "percentage": 45.15, "elapsed_time": "2:30:55", "remaining_time": "3:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 1918, "loss": 0.187, "learning_rate": 3.097645235327483e-06, "epoch": 0.4519450055385417, "percentage": 45.2, "elapsed_time": "2:31:04", "remaining_time": "3:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 1918, "loss": 0.197, "learning_rate": 3.0934586972128574e-06, "epoch": 0.4524662800547338, "percentage": 45.26, "elapsed_time": "2:31:14", "remaining_time": "3:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 1918, "loss": 0.184, "learning_rate": 3.0892703947130914e-06, "epoch": 0.45298755457092593, "percentage": 45.31, "elapsed_time": "2:31:24", "remaining_time": "3:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1918, "loss": 0.1827, "learning_rate": 3.085080340280239e-06, "epoch": 0.453508829087118, "percentage": 45.36, "elapsed_time": "2:31:35", "remaining_time": "3:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 1918, "loss": 0.1935, "learning_rate": 3.0808885463715584e-06, "epoch": 0.4540301036033101, "percentage": 45.41, "elapsed_time": "2:31:46", "remaining_time": "3:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 1918, "loss": 0.1976, "learning_rate": 3.076695025449484e-06, "epoch": 0.4545513781195022, "percentage": 45.46, "elapsed_time": "2:31:57", "remaining_time": "3:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 1918, "loss": 0.1962, "learning_rate": 3.072499789981582e-06, "epoch": 0.4550726526356943, "percentage": 45.52, "elapsed_time": "2:32:08", "remaining_time": "3:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 1918, "loss": 0.2036, "learning_rate": 3.068302852440517e-06, "epoch": 0.45559392715188635, "percentage": 45.57, "elapsed_time": "2:32:18", "remaining_time": "3:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1918, "loss": 0.2023, "learning_rate": 3.064104225304013e-06, "epoch": 0.45611520166807845, "percentage": 45.62, "elapsed_time": "2:32:28", "remaining_time": "3:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 1918, "loss": 0.2098, "learning_rate": 3.059903921054818e-06, "epoch": 0.45663647618427056, "percentage": 45.67, "elapsed_time": "2:32:38", "remaining_time": "3:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 1918, "loss": 0.1967, "learning_rate": 3.0557019521806667e-06, "epoch": 0.4571577507004626, "percentage": 45.72, "elapsed_time": "2:32:49", "remaining_time": "3:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 1918, "loss": 0.1978, "learning_rate": 3.0514983311742426e-06, "epoch": 0.4576790252166547, "percentage": 45.78, "elapsed_time": "2:33:00", "remaining_time": "3:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 1918, "loss": 0.2004, "learning_rate": 3.04729307053314e-06, "epoch": 0.4582002997328468, "percentage": 45.83, "elapsed_time": "2:33:10", "remaining_time": "3:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1918, "loss": 0.2061, "learning_rate": 3.0430861827598277e-06, "epoch": 0.4587215742490389, "percentage": 45.88, "elapsed_time": "2:33:21", "remaining_time": "3:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 1918, "loss": 0.1846, "learning_rate": 3.0388776803616138e-06, "epoch": 0.45924284876523097, "percentage": 45.93, "elapsed_time": "2:33:31", "remaining_time": "3:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 1918, "loss": 0.186, "learning_rate": 3.034667575850607e-06, "epoch": 0.4597641232814231, "percentage": 45.99, "elapsed_time": "2:33:41", "remaining_time": "3:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 1918, "loss": 0.2038, "learning_rate": 3.0304558817436767e-06, "epoch": 0.4602853977976152, "percentage": 46.04, "elapsed_time": "2:33:51", "remaining_time": "3:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 1918, "loss": 0.1934, "learning_rate": 3.02624261056242e-06, "epoch": 0.4608066723138073, "percentage": 46.09, "elapsed_time": "2:34:01", "remaining_time": "3:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1918, "loss": 0.1846, "learning_rate": 3.0220277748331223e-06, "epoch": 0.46132794682999934, "percentage": 46.14, "elapsed_time": "2:34:13", "remaining_time": "3:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 1918, "loss": 0.1889, "learning_rate": 3.017811387086721e-06, "epoch": 0.46184922134619144, "percentage": 46.19, "elapsed_time": "2:34:21", "remaining_time": "2:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 1918, "loss": 0.176, "learning_rate": 3.013593459858767e-06, "epoch": 0.46237049586238355, "percentage": 46.25, "elapsed_time": "2:34:32", "remaining_time": "2:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 1918, "loss": 0.1887, "learning_rate": 3.0093740056893882e-06, "epoch": 0.4628917703785756, "percentage": 46.3, "elapsed_time": "2:34:42", "remaining_time": "2:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 1918, "loss": 0.1909, "learning_rate": 3.005153037123253e-06, "epoch": 0.4634130448947677, "percentage": 46.35, "elapsed_time": "2:34:54", "remaining_time": "2:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1918, "loss": 0.1968, "learning_rate": 3.000930566709531e-06, "epoch": 0.4639343194109598, "percentage": 46.4, "elapsed_time": "2:35:04", "remaining_time": "2:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 1918, "loss": 0.1984, "learning_rate": 2.996706607001858e-06, "epoch": 0.4644555939271519, "percentage": 46.45, "elapsed_time": "2:35:14", "remaining_time": "2:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 1918, "loss": 0.1898, "learning_rate": 2.9924811705582966e-06, "epoch": 0.46497686844334396, "percentage": 46.51, "elapsed_time": "2:35:26", "remaining_time": "2:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 1918, "loss": 0.2047, "learning_rate": 2.988254269941302e-06, "epoch": 0.46549814295953607, "percentage": 46.56, "elapsed_time": "2:35:36", "remaining_time": "2:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 1918, "loss": 0.1903, "learning_rate": 2.984025917717678e-06, "epoch": 0.46601941747572817, "percentage": 46.61, "elapsed_time": "2:35:46", "remaining_time": "2:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1918, "loss": 0.1996, "learning_rate": 2.979796126458548e-06, "epoch": 0.4665406919919202, "percentage": 46.66, "elapsed_time": "2:35:57", "remaining_time": "2:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 1918, "loss": 0.1927, "learning_rate": 2.975564908739313e-06, "epoch": 0.4670619665081123, "percentage": 46.72, "elapsed_time": "2:36:08", "remaining_time": "2:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 1918, "loss": 0.1947, "learning_rate": 2.9713322771396147e-06, "epoch": 0.46758324102430443, "percentage": 46.77, "elapsed_time": "2:36:17", "remaining_time": "2:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 1918, "loss": 0.1938, "learning_rate": 2.967098244243297e-06, "epoch": 0.46810451554049654, "percentage": 46.82, "elapsed_time": "2:36:27", "remaining_time": "2:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 1918, "loss": 0.2085, "learning_rate": 2.962862822638372e-06, "epoch": 0.4686257900566886, "percentage": 46.87, "elapsed_time": "2:36:37", "remaining_time": "2:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1918, "loss": 0.177, "learning_rate": 2.95862602491698e-06, "epoch": 0.4691470645728807, "percentage": 46.92, "elapsed_time": "2:36:48", "remaining_time": "2:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 1918, "loss": 0.2002, "learning_rate": 2.9543878636753514e-06, "epoch": 0.4696683390890728, "percentage": 46.98, "elapsed_time": "2:36:59", "remaining_time": "2:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 1918, "loss": 0.207, "learning_rate": 2.950148351513771e-06, "epoch": 0.4701896136052649, "percentage": 47.03, "elapsed_time": "2:37:11", "remaining_time": "2:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 1918, "loss": 0.1902, "learning_rate": 2.9459075010365406e-06, "epoch": 0.47071088812145695, "percentage": 47.08, "elapsed_time": "2:37:21", "remaining_time": "2:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 1918, "loss": 0.1977, "learning_rate": 2.9416653248519404e-06, "epoch": 0.47123216263764905, "percentage": 47.13, "elapsed_time": "2:37:32", "remaining_time": "2:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1918, "loss": 0.1864, "learning_rate": 2.9374218355721925e-06, "epoch": 0.47175343715384116, "percentage": 47.18, "elapsed_time": "2:37:43", "remaining_time": "2:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 1918, "loss": 0.1872, "learning_rate": 2.933177045813421e-06, "epoch": 0.4722747116700332, "percentage": 47.24, "elapsed_time": "2:37:54", "remaining_time": "2:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 1918, "loss": 0.2047, "learning_rate": 2.9289309681956194e-06, "epoch": 0.4727959861862253, "percentage": 47.29, "elapsed_time": "2:38:04", "remaining_time": "2:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 1918, "loss": 0.1969, "learning_rate": 2.924683615342607e-06, "epoch": 0.4733172607024174, "percentage": 47.34, "elapsed_time": "2:38:14", "remaining_time": "2:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 1918, "loss": 0.2129, "learning_rate": 2.920434999881998e-06, "epoch": 0.4738385352186095, "percentage": 47.39, "elapsed_time": "2:38:26", "remaining_time": "2:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1918, "loss": 0.1817, "learning_rate": 2.9161851344451563e-06, "epoch": 0.4743598097348016, "percentage": 47.45, "elapsed_time": "2:38:36", "remaining_time": "2:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 1918, "loss": 0.1979, "learning_rate": 2.9119340316671663e-06, "epoch": 0.4748810842509937, "percentage": 47.5, "elapsed_time": "2:38:47", "remaining_time": "2:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 1918, "loss": 0.1922, "learning_rate": 2.9076817041867863e-06, "epoch": 0.4754023587671858, "percentage": 47.55, "elapsed_time": "2:38:57", "remaining_time": "2:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 1918, "loss": 0.1732, "learning_rate": 2.9034281646464197e-06, "epoch": 0.47592363328337783, "percentage": 47.6, "elapsed_time": "2:39:08", "remaining_time": "2:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 1918, "loss": 0.2053, "learning_rate": 2.8991734256920723e-06, "epoch": 0.47644490779956994, "percentage": 47.65, "elapsed_time": "2:39:17", "remaining_time": "2:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1918, "loss": 0.1949, "learning_rate": 2.894917499973315e-06, "epoch": 0.47696618231576204, "percentage": 47.71, "elapsed_time": "2:39:28", "remaining_time": "2:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 1918, "loss": 0.1928, "learning_rate": 2.890660400143248e-06, "epoch": 0.47748745683195415, "percentage": 47.76, "elapsed_time": "2:39:38", "remaining_time": "2:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 1918, "loss": 0.2108, "learning_rate": 2.8864021388584606e-06, "epoch": 0.4780087313481462, "percentage": 47.81, "elapsed_time": "2:39:49", "remaining_time": "2:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 1918, "loss": 0.2022, "learning_rate": 2.882142728778997e-06, "epoch": 0.4785300058643383, "percentage": 47.86, "elapsed_time": "2:40:00", "remaining_time": "2:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 1918, "loss": 0.1911, "learning_rate": 2.877882182568317e-06, "epoch": 0.4790512803805304, "percentage": 47.91, "elapsed_time": "2:40:11", "remaining_time": "2:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1918, "loss": 0.1821, "learning_rate": 2.873620512893257e-06, "epoch": 0.4795725548967225, "percentage": 47.97, "elapsed_time": "2:40:22", "remaining_time": "2:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 1918, "loss": 0.1901, "learning_rate": 2.8693577324239925e-06, "epoch": 0.48009382941291456, "percentage": 48.02, "elapsed_time": "2:40:31", "remaining_time": "2:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 1918, "loss": 0.1941, "learning_rate": 2.865093853834004e-06, "epoch": 0.48061510392910667, "percentage": 48.07, "elapsed_time": "2:40:43", "remaining_time": "2:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 1918, "loss": 0.2062, "learning_rate": 2.8608288898000356e-06, "epoch": 0.4811363784452988, "percentage": 48.12, "elapsed_time": "2:40:53", "remaining_time": "2:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 1918, "loss": 0.1969, "learning_rate": 2.8565628530020584e-06, "epoch": 0.4816576529614908, "percentage": 48.18, "elapsed_time": "2:41:03", "remaining_time": "2:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1918, "loss": 0.1889, "learning_rate": 2.8522957561232323e-06, "epoch": 0.48217892747768293, "percentage": 48.23, "elapsed_time": "2:41:13", "remaining_time": "2:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 1918, "loss": 0.1923, "learning_rate": 2.84802761184987e-06, "epoch": 0.48270020199387503, "percentage": 48.28, "elapsed_time": "2:41:24", "remaining_time": "2:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 1918, "loss": 0.2002, "learning_rate": 2.8437584328713976e-06, "epoch": 0.48322147651006714, "percentage": 48.33, "elapsed_time": "2:41:35", "remaining_time": "2:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 1918, "loss": 0.1917, "learning_rate": 2.8394882318803174e-06, "epoch": 0.4837427510262592, "percentage": 48.38, "elapsed_time": "2:41:46", "remaining_time": "2:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 1918, "loss": 0.1932, "learning_rate": 2.835217021572171e-06, "epoch": 0.4842640255424513, "percentage": 48.44, "elapsed_time": "2:41:57", "remaining_time": "2:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1918, "loss": 0.1861, "learning_rate": 2.8309448146454993e-06, "epoch": 0.4847853000586434, "percentage": 48.49, "elapsed_time": "2:42:07", "remaining_time": "2:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 1918, "loss": 0.1877, "learning_rate": 2.8266716238018065e-06, "epoch": 0.48530657457483545, "percentage": 48.54, "elapsed_time": "2:42:18", "remaining_time": "2:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 1918, "loss": 0.2025, "learning_rate": 2.822397461745524e-06, "epoch": 0.48582784909102755, "percentage": 48.59, "elapsed_time": "2:42:29", "remaining_time": "2:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 1918, "loss": 0.2009, "learning_rate": 2.8181223411839686e-06, "epoch": 0.48634912360721966, "percentage": 48.64, "elapsed_time": "2:42:39", "remaining_time": "2:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 1918, "loss": 0.1994, "learning_rate": 2.8138462748273072e-06, "epoch": 0.48687039812341176, "percentage": 48.7, "elapsed_time": "2:42:50", "remaining_time": "2:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1918, "loss": 0.1752, "learning_rate": 2.8095692753885177e-06, "epoch": 0.4873916726396038, "percentage": 48.75, "elapsed_time": "2:43:00", "remaining_time": "2:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 1918, "loss": 0.2082, "learning_rate": 2.805291355583355e-06, "epoch": 0.4879129471557959, "percentage": 48.8, "elapsed_time": "2:43:11", "remaining_time": "2:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 1918, "loss": 0.1888, "learning_rate": 2.8010125281303076e-06, "epoch": 0.488434221671988, "percentage": 48.85, "elapsed_time": "2:43:22", "remaining_time": "2:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 1918, "loss": 0.1876, "learning_rate": 2.7967328057505637e-06, "epoch": 0.4889554961881801, "percentage": 48.91, "elapsed_time": "2:43:31", "remaining_time": "2:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 1918, "loss": 0.194, "learning_rate": 2.792452201167971e-06, "epoch": 0.4894767707043722, "percentage": 48.96, "elapsed_time": "2:43:42", "remaining_time": "2:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1918, "loss": 0.2057, "learning_rate": 2.7881707271090018e-06, "epoch": 0.4899980452205643, "percentage": 49.01, "elapsed_time": "2:43:53", "remaining_time": "2:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 1918, "loss": 0.2023, "learning_rate": 2.7838883963027118e-06, "epoch": 0.4905193197367564, "percentage": 49.06, "elapsed_time": "2:44:04", "remaining_time": "2:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 1918, "loss": 0.2014, "learning_rate": 2.779605221480706e-06, "epoch": 0.49104059425294844, "percentage": 49.11, "elapsed_time": "2:44:14", "remaining_time": "2:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 1918, "loss": 0.1861, "learning_rate": 2.7753212153770947e-06, "epoch": 0.49156186876914054, "percentage": 49.17, "elapsed_time": "2:44:25", "remaining_time": "2:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 1918, "loss": 0.1863, "learning_rate": 2.7710363907284643e-06, "epoch": 0.49208314328533265, "percentage": 49.22, "elapsed_time": "2:44:35", "remaining_time": "2:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1918, "loss": 0.188, "learning_rate": 2.766750760273831e-06, "epoch": 0.49260441780152475, "percentage": 49.27, "elapsed_time": "2:44:46", "remaining_time": "2:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 1918, "loss": 0.1951, "learning_rate": 2.76246433675461e-06, "epoch": 0.4931256923177168, "percentage": 49.32, "elapsed_time": "2:44:57", "remaining_time": "2:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 1918, "loss": 0.203, "learning_rate": 2.7581771329145713e-06, "epoch": 0.4936469668339089, "percentage": 49.37, "elapsed_time": "2:45:07", "remaining_time": "2:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 1918, "loss": 0.2, "learning_rate": 2.7538891614998074e-06, "epoch": 0.494168241350101, "percentage": 49.43, "elapsed_time": "2:45:18", "remaining_time": "2:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 1918, "loss": 0.197, "learning_rate": 2.749600435258691e-06, "epoch": 0.49468951586629306, "percentage": 49.48, "elapsed_time": "2:45:28", "remaining_time": "2:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1918, "loss": 0.1904, "learning_rate": 2.745310966941839e-06, "epoch": 0.49521079038248517, "percentage": 49.53, "elapsed_time": "2:45:38", "remaining_time": "2:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 1918, "loss": 0.1853, "learning_rate": 2.741020769302077e-06, "epoch": 0.49573206489867727, "percentage": 49.58, "elapsed_time": "2:45:48", "remaining_time": "2:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 1918, "loss": 0.1875, "learning_rate": 2.7367298550943954e-06, "epoch": 0.4962533394148694, "percentage": 49.64, "elapsed_time": "2:45:59", "remaining_time": "2:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 1918, "loss": 0.1855, "learning_rate": 2.7324382370759174e-06, "epoch": 0.4967746139310614, "percentage": 49.69, "elapsed_time": "2:46:10", "remaining_time": "2:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 1918, "loss": 0.2108, "learning_rate": 2.7281459280058563e-06, "epoch": 0.49729588844725353, "percentage": 49.74, "elapsed_time": "2:46:20", "remaining_time": "2:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1918, "loss": 0.1819, "learning_rate": 2.7238529406454834e-06, "epoch": 0.49781716296344564, "percentage": 49.79, "elapsed_time": "2:46:30", "remaining_time": "2:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 1918, "loss": 0.1796, "learning_rate": 2.719559287758085e-06, "epoch": 0.49833843747963774, "percentage": 49.84, "elapsed_time": "2:46:41", "remaining_time": "2:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 1918, "loss": 0.1943, "learning_rate": 2.7152649821089245e-06, "epoch": 0.4988597119958298, "percentage": 49.9, "elapsed_time": "2:46:53", "remaining_time": "2:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 1918, "loss": 0.1905, "learning_rate": 2.7109700364652075e-06, "epoch": 0.4993809865120219, "percentage": 49.95, "elapsed_time": "2:47:03", "remaining_time": "2:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 1918, "loss": 0.1858, "learning_rate": 2.7066744635960423e-06, "epoch": 0.499902261028214, "percentage": 50.0, "elapsed_time": "2:47:14", "remaining_time": "2:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1918, "loss": 0.2101, "learning_rate": 2.702378276272402e-06, "epoch": 0.5004235355444061, "percentage": 50.05, "elapsed_time": "2:47:24", "remaining_time": "2:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 1918, "loss": 0.1945, "learning_rate": 2.6980814872670863e-06, "epoch": 0.5009448100605982, "percentage": 50.1, "elapsed_time": "2:47:35", "remaining_time": "2:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 1918, "loss": 0.1931, "learning_rate": 2.6937841093546842e-06, "epoch": 0.5014660845767902, "percentage": 50.16, "elapsed_time": "2:47:46", "remaining_time": "2:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 1918, "loss": 0.2038, "learning_rate": 2.6894861553115337e-06, "epoch": 0.5019873590929823, "percentage": 50.21, "elapsed_time": "2:47:57", "remaining_time": "2:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 1918, "loss": 0.1858, "learning_rate": 2.6851876379156884e-06, "epoch": 0.5025086336091744, "percentage": 50.26, "elapsed_time": "2:48:08", "remaining_time": "2:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1918, "loss": 0.2225, "learning_rate": 2.680888569946874e-06, "epoch": 0.5030299081253665, "percentage": 50.31, "elapsed_time": "2:48:18", "remaining_time": "2:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 1918, "loss": 0.1881, "learning_rate": 2.6765889641864562e-06, "epoch": 0.5035511826415586, "percentage": 50.36, "elapsed_time": "2:48:29", "remaining_time": "2:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 1918, "loss": 0.1936, "learning_rate": 2.6722888334173974e-06, "epoch": 0.5040724571577507, "percentage": 50.42, "elapsed_time": "2:48:40", "remaining_time": "2:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 1918, "loss": 0.2029, "learning_rate": 2.6679881904242198e-06, "epoch": 0.5045937316739428, "percentage": 50.47, "elapsed_time": "2:48:51", "remaining_time": "2:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 1918, "loss": 0.1841, "learning_rate": 2.663687047992972e-06, "epoch": 0.5051150061901348, "percentage": 50.52, "elapsed_time": "2:49:01", "remaining_time": "2:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1918, "loss": 0.1981, "learning_rate": 2.6593854189111857e-06, "epoch": 0.5056362807063269, "percentage": 50.57, "elapsed_time": "2:49:10", "remaining_time": "2:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 1918, "loss": 0.1869, "learning_rate": 2.655083315967838e-06, "epoch": 0.506157555222519, "percentage": 50.63, "elapsed_time": "2:49:21", "remaining_time": "2:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 1918, "loss": 0.1873, "learning_rate": 2.650780751953316e-06, "epoch": 0.5066788297387111, "percentage": 50.68, "elapsed_time": "2:49:32", "remaining_time": "2:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 1918, "loss": 0.1952, "learning_rate": 2.646477739659378e-06, "epoch": 0.5072001042549033, "percentage": 50.73, "elapsed_time": "2:49:43", "remaining_time": "2:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 1918, "loss": 0.1983, "learning_rate": 2.6421742918791155e-06, "epoch": 0.5077213787710954, "percentage": 50.78, "elapsed_time": "2:49:53", "remaining_time": "2:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1918, "loss": 0.1804, "learning_rate": 2.6378704214069133e-06, "epoch": 0.5082426532872875, "percentage": 50.83, "elapsed_time": "2:50:04", "remaining_time": "2:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 1918, "loss": 0.2017, "learning_rate": 2.633566141038413e-06, "epoch": 0.5087639278034795, "percentage": 50.89, "elapsed_time": "2:50:14", "remaining_time": "2:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 1918, "loss": 0.1983, "learning_rate": 2.629261463570476e-06, "epoch": 0.5092852023196716, "percentage": 50.94, "elapsed_time": "2:50:25", "remaining_time": "2:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 1918, "loss": 0.1878, "learning_rate": 2.6249564018011437e-06, "epoch": 0.5098064768358637, "percentage": 50.99, "elapsed_time": "2:50:36", "remaining_time": "2:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 1918, "loss": 0.1957, "learning_rate": 2.6206509685296e-06, "epoch": 0.5103277513520558, "percentage": 51.04, "elapsed_time": "2:50:46", "remaining_time": "2:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1918, "loss": 0.1963, "learning_rate": 2.6163451765561324e-06, "epoch": 0.5108490258682479, "percentage": 51.09, "elapsed_time": "2:50:55", "remaining_time": "2:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 1918, "loss": 0.1999, "learning_rate": 2.6120390386820975e-06, "epoch": 0.51137030038444, "percentage": 51.15, "elapsed_time": "2:51:06", "remaining_time": "2:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 1918, "loss": 0.1931, "learning_rate": 2.607732567709877e-06, "epoch": 0.5118915749006321, "percentage": 51.2, "elapsed_time": "2:51:17", "remaining_time": "2:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 1918, "loss": 0.1997, "learning_rate": 2.6034257764428456e-06, "epoch": 0.5124128494168242, "percentage": 51.25, "elapsed_time": "2:51:27", "remaining_time": "2:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 1918, "loss": 0.1849, "learning_rate": 2.5991186776853277e-06, "epoch": 0.5129341239330162, "percentage": 51.3, "elapsed_time": "2:51:37", "remaining_time": "2:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1918, "loss": 0.1783, "learning_rate": 2.594811284242565e-06, "epoch": 0.5134553984492083, "percentage": 51.36, "elapsed_time": "2:51:46", "remaining_time": "2:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 1918, "loss": 0.1944, "learning_rate": 2.590503608920672e-06, "epoch": 0.5139766729654004, "percentage": 51.41, "elapsed_time": "2:51:56", "remaining_time": "2:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 1918, "loss": 0.1949, "learning_rate": 2.5861956645266036e-06, "epoch": 0.5144979474815925, "percentage": 51.46, "elapsed_time": "2:52:06", "remaining_time": "2:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 1918, "loss": 0.1887, "learning_rate": 2.581887463868114e-06, "epoch": 0.5150192219977846, "percentage": 51.51, "elapsed_time": "2:52:16", "remaining_time": "2:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 1918, "loss": 0.1996, "learning_rate": 2.57757901975372e-06, "epoch": 0.5155404965139767, "percentage": 51.56, "elapsed_time": "2:52:26", "remaining_time": "2:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1918, "loss": 0.2055, "learning_rate": 2.5732703449926595e-06, "epoch": 0.5160617710301688, "percentage": 51.62, "elapsed_time": "2:52:38", "remaining_time": "2:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 1918, "loss": 0.1906, "learning_rate": 2.568961452394859e-06, "epoch": 0.5165830455463608, "percentage": 51.67, "elapsed_time": "2:52:46", "remaining_time": "2:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 1918, "loss": 0.1865, "learning_rate": 2.564652354770892e-06, "epoch": 0.5171043200625529, "percentage": 51.72, "elapsed_time": "2:52:56", "remaining_time": "2:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 1918, "loss": 0.2152, "learning_rate": 2.560343064931941e-06, "epoch": 0.517625594578745, "percentage": 51.77, "elapsed_time": "2:53:06", "remaining_time": "2:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 1918, "loss": 0.1862, "learning_rate": 2.5560335956897603e-06, "epoch": 0.5181468690949371, "percentage": 51.82, "elapsed_time": "2:53:18", "remaining_time": "2:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1918, "loss": 0.1889, "learning_rate": 2.551723959856637e-06, "epoch": 0.5186681436111292, "percentage": 51.88, "elapsed_time": "2:53:28", "remaining_time": "2:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 1918, "loss": 0.1894, "learning_rate": 2.5474141702453536e-06, "epoch": 0.5191894181273213, "percentage": 51.93, "elapsed_time": "2:53:39", "remaining_time": "2:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 1918, "loss": 0.2087, "learning_rate": 2.543104239669152e-06, "epoch": 0.5197106926435134, "percentage": 51.98, "elapsed_time": "2:53:50", "remaining_time": "2:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 1918, "loss": 0.1795, "learning_rate": 2.5387941809416895e-06, "epoch": 0.5202319671597054, "percentage": 52.03, "elapsed_time": "2:54:01", "remaining_time": "2:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 1918, "loss": 0.1873, "learning_rate": 2.5344840068770076e-06, "epoch": 0.5207532416758975, "percentage": 52.09, "elapsed_time": "2:54:10", "remaining_time": "2:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1918, "loss": 0.1946, "learning_rate": 2.530173730289488e-06, "epoch": 0.5212745161920896, "percentage": 52.14, "elapsed_time": "2:54:20", "remaining_time": "2:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1918, "eval_loss": 0.19480524957180023, "epoch": 0.5212745161920896, "percentage": 52.14, "elapsed_time": "2:55:12", "remaining_time": "2:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 1918, "loss": 0.1995, "learning_rate": 2.5258633639938195e-06, "epoch": 0.5217957907082817, "percentage": 52.19, "elapsed_time": "2:55:21", "remaining_time": "2:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 1918, "loss": 0.2085, "learning_rate": 2.521552920804956e-06, "epoch": 0.5223170652244739, "percentage": 52.24, "elapsed_time": "2:55:32", "remaining_time": "2:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 1918, "loss": 0.2047, "learning_rate": 2.5172424135380817e-06, "epoch": 0.522838339740666, "percentage": 52.29, "elapsed_time": "2:55:44", "remaining_time": "2:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 1918, "loss": 0.1905, "learning_rate": 2.51293185500857e-06, "epoch": 0.5233596142568581, "percentage": 52.35, "elapsed_time": "2:55:54", "remaining_time": "2:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1918, "loss": 0.1995, "learning_rate": 2.5086212580319457e-06, "epoch": 0.5238808887730501, "percentage": 52.4, "elapsed_time": "2:56:04", "remaining_time": "2:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 1918, "loss": 0.1931, "learning_rate": 2.50431063542385e-06, "epoch": 0.5244021632892422, "percentage": 52.45, "elapsed_time": "2:56:14", "remaining_time": "2:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 1918, "loss": 0.2001, "learning_rate": 2.5e-06, "epoch": 0.5249234378054343, "percentage": 52.5, "elapsed_time": "2:56:24", "remaining_time": "2:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 1918, "loss": 0.197, "learning_rate": 2.49568936457615e-06, "epoch": 0.5254447123216264, "percentage": 52.55, "elapsed_time": "2:56:35", "remaining_time": "2:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 1918, "loss": 0.1898, "learning_rate": 2.491378741968055e-06, "epoch": 0.5259659868378185, "percentage": 52.61, "elapsed_time": "2:56:46", "remaining_time": "2:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1918, "loss": 0.1935, "learning_rate": 2.487068144991431e-06, "epoch": 0.5264872613540106, "percentage": 52.66, "elapsed_time": "2:56:56", "remaining_time": "2:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 1918, "loss": 0.2068, "learning_rate": 2.4827575864619183e-06, "epoch": 0.5270085358702027, "percentage": 52.71, "elapsed_time": "2:57:07", "remaining_time": "2:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 1918, "loss": 0.1952, "learning_rate": 2.4784470791950442e-06, "epoch": 0.5275298103863947, "percentage": 52.76, "elapsed_time": "2:57:18", "remaining_time": "2:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 1918, "loss": 0.1911, "learning_rate": 2.4741366360061813e-06, "epoch": 0.5280510849025868, "percentage": 52.82, "elapsed_time": "2:57:28", "remaining_time": "2:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 1918, "loss": 0.1986, "learning_rate": 2.4698262697105128e-06, "epoch": 0.5285723594187789, "percentage": 52.87, "elapsed_time": "2:57:38", "remaining_time": "2:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1918, "loss": 0.1794, "learning_rate": 2.4655159931229932e-06, "epoch": 0.529093633934971, "percentage": 52.92, "elapsed_time": "2:57:49", "remaining_time": "2:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 1918, "loss": 0.2025, "learning_rate": 2.461205819058311e-06, "epoch": 0.5296149084511631, "percentage": 52.97, "elapsed_time": "2:57:58", "remaining_time": "2:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 1918, "loss": 0.1891, "learning_rate": 2.4568957603308494e-06, "epoch": 0.5301361829673552, "percentage": 53.02, "elapsed_time": "2:58:08", "remaining_time": "2:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 1918, "loss": 0.1957, "learning_rate": 2.452585829754647e-06, "epoch": 0.5306574574835473, "percentage": 53.08, "elapsed_time": "2:58:18", "remaining_time": "2:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 1918, "loss": 0.212, "learning_rate": 2.448276040143364e-06, "epoch": 0.5311787319997394, "percentage": 53.13, "elapsed_time": "2:58:29", "remaining_time": "2:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1918, "loss": 0.2078, "learning_rate": 2.4439664043102414e-06, "epoch": 0.5317000065159314, "percentage": 53.18, "elapsed_time": "2:58:39", "remaining_time": "2:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 1918, "loss": 0.1905, "learning_rate": 2.43965693506806e-06, "epoch": 0.5322212810321235, "percentage": 53.23, "elapsed_time": "2:58:49", "remaining_time": "2:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 1918, "loss": 0.1882, "learning_rate": 2.4353476452291086e-06, "epoch": 0.5327425555483156, "percentage": 53.28, "elapsed_time": "2:59:00", "remaining_time": "2:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 1918, "loss": 0.1753, "learning_rate": 2.431038547605142e-06, "epoch": 0.5332638300645077, "percentage": 53.34, "elapsed_time": "2:59:10", "remaining_time": "2:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 1918, "loss": 0.1985, "learning_rate": 2.4267296550073413e-06, "epoch": 0.5337851045806998, "percentage": 53.39, "elapsed_time": "2:59:20", "remaining_time": "2:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1918, "loss": 0.1889, "learning_rate": 2.4224209802462818e-06, "epoch": 0.5343063790968919, "percentage": 53.44, "elapsed_time": "2:59:31", "remaining_time": "2:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 1918, "loss": 0.1883, "learning_rate": 2.4181125361318868e-06, "epoch": 0.534827653613084, "percentage": 53.49, "elapsed_time": "2:59:42", "remaining_time": "2:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 1918, "loss": 0.1869, "learning_rate": 2.413804335473397e-06, "epoch": 0.535348928129276, "percentage": 53.55, "elapsed_time": "2:59:52", "remaining_time": "2:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 1918, "loss": 0.1856, "learning_rate": 2.409496391079329e-06, "epoch": 0.5358702026454681, "percentage": 53.6, "elapsed_time": "3:00:02", "remaining_time": "2:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 1918, "loss": 0.1971, "learning_rate": 2.4051887157574356e-06, "epoch": 0.5363914771616602, "percentage": 53.65, "elapsed_time": "3:00:13", "remaining_time": "2:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 1918, "loss": 0.1774, "learning_rate": 2.4008813223146723e-06, "epoch": 0.5369127516778524, "percentage": 53.7, "elapsed_time": "3:00:23", "remaining_time": "2:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 1918, "loss": 0.2078, "learning_rate": 2.3965742235571557e-06, "epoch": 0.5374340261940445, "percentage": 53.75, "elapsed_time": "3:00:32", "remaining_time": "2:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 1918, "loss": 0.2026, "learning_rate": 2.3922674322901236e-06, "epoch": 0.5379553007102366, "percentage": 53.81, "elapsed_time": "3:00:42", "remaining_time": "2:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 1918, "loss": 0.2027, "learning_rate": 2.387960961317903e-06, "epoch": 0.5384765752264287, "percentage": 53.86, "elapsed_time": "3:00:52", "remaining_time": "2:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 1918, "loss": 0.1992, "learning_rate": 2.383654823443868e-06, "epoch": 0.5389978497426207, "percentage": 53.91, "elapsed_time": "3:01:01", "remaining_time": "2:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 1918, "loss": 0.1914, "learning_rate": 2.3793490314704005e-06, "epoch": 0.5395191242588128, "percentage": 53.96, "elapsed_time": "3:01:11", "remaining_time": "2:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 1918, "loss": 0.2115, "learning_rate": 2.3750435981988576e-06, "epoch": 0.5400403987750049, "percentage": 54.01, "elapsed_time": "3:01:21", "remaining_time": "2:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 1918, "loss": 0.2009, "learning_rate": 2.3707385364295245e-06, "epoch": 0.540561673291197, "percentage": 54.07, "elapsed_time": "3:01:32", "remaining_time": "2:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 1918, "loss": 0.195, "learning_rate": 2.366433858961587e-06, "epoch": 0.5410829478073891, "percentage": 54.12, "elapsed_time": "3:01:43", "remaining_time": "2:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 1918, "loss": 0.1926, "learning_rate": 2.362129578593088e-06, "epoch": 0.5416042223235812, "percentage": 54.17, "elapsed_time": "3:01:52", "remaining_time": "2:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 1918, "loss": 0.1947, "learning_rate": 2.3578257081208853e-06, "epoch": 0.5421254968397733, "percentage": 54.22, "elapsed_time": "3:02:03", "remaining_time": "2:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 1918, "loss": 0.2107, "learning_rate": 2.3535222603406223e-06, "epoch": 0.5426467713559653, "percentage": 54.28, "elapsed_time": "3:02:13", "remaining_time": "2:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 1918, "loss": 0.1857, "learning_rate": 2.3492192480466845e-06, "epoch": 0.5431680458721574, "percentage": 54.33, "elapsed_time": "3:02:25", "remaining_time": "2:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 1918, "loss": 0.1784, "learning_rate": 2.344916684032163e-06, "epoch": 0.5436893203883495, "percentage": 54.38, "elapsed_time": "3:02:36", "remaining_time": "2:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 1918, "loss": 0.1993, "learning_rate": 2.3406145810888143e-06, "epoch": 0.5442105949045416, "percentage": 54.43, "elapsed_time": "3:02:47", "remaining_time": "2:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 1918, "loss": 0.1858, "learning_rate": 2.3363129520070286e-06, "epoch": 0.5447318694207337, "percentage": 54.48, "elapsed_time": "3:02:59", "remaining_time": "2:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 1918, "loss": 0.2105, "learning_rate": 2.3320118095757806e-06, "epoch": 0.5452531439369258, "percentage": 54.54, "elapsed_time": "3:03:08", "remaining_time": "2:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 1918, "loss": 0.1985, "learning_rate": 2.327711166582604e-06, "epoch": 0.5457744184531179, "percentage": 54.59, "elapsed_time": "3:03:19", "remaining_time": "2:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 1918, "loss": 0.1802, "learning_rate": 2.3234110358135446e-06, "epoch": 0.5462956929693099, "percentage": 54.64, "elapsed_time": "3:03:30", "remaining_time": "2:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 1918, "loss": 0.19, "learning_rate": 2.319111430053126e-06, "epoch": 0.546816967485502, "percentage": 54.69, "elapsed_time": "3:03:41", "remaining_time": "2:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1918, "loss": 0.1903, "learning_rate": 2.3148123620843132e-06, "epoch": 0.5473382420016941, "percentage": 54.74, "elapsed_time": "3:03:50", "remaining_time": "2:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 1918, "loss": 0.1858, "learning_rate": 2.310513844688467e-06, "epoch": 0.5478595165178862, "percentage": 54.8, "elapsed_time": "3:03:59", "remaining_time": "2:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 1918, "loss": 0.1864, "learning_rate": 2.306215890645316e-06, "epoch": 0.5483807910340783, "percentage": 54.85, "elapsed_time": "3:04:09", "remaining_time": "2:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 1918, "loss": 0.1871, "learning_rate": 2.3019185127329145e-06, "epoch": 0.5489020655502704, "percentage": 54.9, "elapsed_time": "3:04:20", "remaining_time": "2:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 1918, "loss": 0.1896, "learning_rate": 2.2976217237275983e-06, "epoch": 0.5494233400664625, "percentage": 54.95, "elapsed_time": "3:04:30", "remaining_time": "2:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 1918, "loss": 0.2015, "learning_rate": 2.293325536403958e-06, "epoch": 0.5499446145826546, "percentage": 55.01, "elapsed_time": "3:04:40", "remaining_time": "2:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 1918, "loss": 0.1978, "learning_rate": 2.2890299635347933e-06, "epoch": 0.5504658890988466, "percentage": 55.06, "elapsed_time": "3:04:51", "remaining_time": "2:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 1918, "loss": 0.199, "learning_rate": 2.2847350178910763e-06, "epoch": 0.5509871636150387, "percentage": 55.11, "elapsed_time": "3:05:01", "remaining_time": "2:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 1918, "loss": 0.1743, "learning_rate": 2.2804407122419165e-06, "epoch": 0.5515084381312308, "percentage": 55.16, "elapsed_time": "3:05:11", "remaining_time": "2:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 1918, "loss": 0.1915, "learning_rate": 2.276147059354517e-06, "epoch": 0.552029712647423, "percentage": 55.21, "elapsed_time": "3:05:23", "remaining_time": "2:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 1918, "loss": 0.1851, "learning_rate": 2.271854071994144e-06, "epoch": 0.5525509871636151, "percentage": 55.27, "elapsed_time": "3:05:33", "remaining_time": "2:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 1918, "loss": 0.2026, "learning_rate": 2.2675617629240842e-06, "epoch": 0.5530722616798072, "percentage": 55.32, "elapsed_time": "3:05:44", "remaining_time": "2:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 1918, "loss": 0.1985, "learning_rate": 2.2632701449056054e-06, "epoch": 0.5535935361959993, "percentage": 55.37, "elapsed_time": "3:05:55", "remaining_time": "2:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 1918, "loss": 0.184, "learning_rate": 2.258979230697923e-06, "epoch": 0.5541148107121913, "percentage": 55.42, "elapsed_time": "3:06:04", "remaining_time": "2:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 1918, "loss": 0.1861, "learning_rate": 2.2546890330581616e-06, "epoch": 0.5546360852283834, "percentage": 55.47, "elapsed_time": "3:06:15", "remaining_time": "2:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 1918, "loss": 0.1878, "learning_rate": 2.25039956474131e-06, "epoch": 0.5551573597445755, "percentage": 55.53, "elapsed_time": "3:06:25", "remaining_time": "2:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 1918, "loss": 0.1914, "learning_rate": 2.246110838500194e-06, "epoch": 0.5556786342607676, "percentage": 55.58, "elapsed_time": "3:06:36", "remaining_time": "2:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 1918, "loss": 0.1935, "learning_rate": 2.241822867085429e-06, "epoch": 0.5561999087769597, "percentage": 55.63, "elapsed_time": "3:06:46", "remaining_time": "2:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 1918, "loss": 0.1893, "learning_rate": 2.2375356632453906e-06, "epoch": 0.5567211832931518, "percentage": 55.68, "elapsed_time": "3:06:56", "remaining_time": "2:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 1918, "loss": 0.1951, "learning_rate": 2.2332492397261695e-06, "epoch": 0.5572424578093439, "percentage": 55.74, "elapsed_time": "3:07:06", "remaining_time": "2:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 1918, "loss": 0.1834, "learning_rate": 2.2289636092715365e-06, "epoch": 0.5577637323255359, "percentage": 55.79, "elapsed_time": "3:07:18", "remaining_time": "2:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 1918, "loss": 0.1834, "learning_rate": 2.2246787846229057e-06, "epoch": 0.558285006841728, "percentage": 55.84, "elapsed_time": "3:07:29", "remaining_time": "2:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 1918, "loss": 0.1878, "learning_rate": 2.2203947785192954e-06, "epoch": 0.5588062813579201, "percentage": 55.89, "elapsed_time": "3:07:39", "remaining_time": "2:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 1918, "loss": 0.1943, "learning_rate": 2.2161116036972886e-06, "epoch": 0.5593275558741122, "percentage": 55.94, "elapsed_time": "3:07:50", "remaining_time": "2:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 1918, "loss": 0.2069, "learning_rate": 2.2118292728909986e-06, "epoch": 0.5598488303903043, "percentage": 56.0, "elapsed_time": "3:08:01", "remaining_time": "2:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 1918, "loss": 0.1849, "learning_rate": 2.2075477988320295e-06, "epoch": 0.5603701049064964, "percentage": 56.05, "elapsed_time": "3:08:11", "remaining_time": "2:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 1918, "loss": 0.1844, "learning_rate": 2.2032671942494367e-06, "epoch": 0.5608913794226885, "percentage": 56.1, "elapsed_time": "3:08:20", "remaining_time": "2:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 1918, "loss": 0.1926, "learning_rate": 2.1989874718696936e-06, "epoch": 0.5614126539388805, "percentage": 56.15, "elapsed_time": "3:08:29", "remaining_time": "2:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 1918, "loss": 0.1971, "learning_rate": 2.194708644416646e-06, "epoch": 0.5619339284550726, "percentage": 56.2, "elapsed_time": "3:08:41", "remaining_time": "2:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 1918, "loss": 0.1917, "learning_rate": 2.1904307246114827e-06, "epoch": 0.5624552029712647, "percentage": 56.26, "elapsed_time": "3:08:50", "remaining_time": "2:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 1918, "loss": 0.2003, "learning_rate": 2.1861537251726944e-06, "epoch": 0.5629764774874568, "percentage": 56.31, "elapsed_time": "3:09:02", "remaining_time": "2:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 1918, "loss": 0.1872, "learning_rate": 2.1818776588160323e-06, "epoch": 0.5634977520036489, "percentage": 56.36, "elapsed_time": "3:09:11", "remaining_time": "2:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 1918, "loss": 0.2082, "learning_rate": 2.1776025382544765e-06, "epoch": 0.564019026519841, "percentage": 56.41, "elapsed_time": "3:09:21", "remaining_time": "2:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 1918, "loss": 0.1894, "learning_rate": 2.173328376198194e-06, "epoch": 0.5645403010360331, "percentage": 56.47, "elapsed_time": "3:09:31", "remaining_time": "2:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 1918, "loss": 0.2155, "learning_rate": 2.1690551853545016e-06, "epoch": 0.5650615755522251, "percentage": 56.52, "elapsed_time": "3:09:41", "remaining_time": "2:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 1918, "loss": 0.1908, "learning_rate": 2.1647829784278294e-06, "epoch": 0.5655828500684172, "percentage": 56.57, "elapsed_time": "3:09:52", "remaining_time": "2:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 1918, "loss": 0.1878, "learning_rate": 2.1605117681196834e-06, "epoch": 0.5661041245846093, "percentage": 56.62, "elapsed_time": "3:10:02", "remaining_time": "2:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 1918, "loss": 0.2054, "learning_rate": 2.1562415671286032e-06, "epoch": 0.5666253991008015, "percentage": 56.67, "elapsed_time": "3:10:13", "remaining_time": "2:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 1918, "loss": 0.2041, "learning_rate": 2.151972388150131e-06, "epoch": 0.5671466736169936, "percentage": 56.73, "elapsed_time": "3:10:23", "remaining_time": "2:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 1918, "loss": 0.2039, "learning_rate": 2.1477042438767685e-06, "epoch": 0.5676679481331857, "percentage": 56.78, "elapsed_time": "3:10:33", "remaining_time": "2:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 1918, "loss": 0.1968, "learning_rate": 2.1434371469979424e-06, "epoch": 0.5681892226493778, "percentage": 56.83, "elapsed_time": "3:10:44", "remaining_time": "2:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 1918, "loss": 0.2044, "learning_rate": 2.1391711101999656e-06, "epoch": 0.5687104971655699, "percentage": 56.88, "elapsed_time": "3:10:55", "remaining_time": "2:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 1918, "loss": 0.1994, "learning_rate": 2.1349061461659966e-06, "epoch": 0.5692317716817619, "percentage": 56.93, "elapsed_time": "3:11:06", "remaining_time": "2:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 1918, "loss": 0.1848, "learning_rate": 2.130642267576008e-06, "epoch": 0.569753046197954, "percentage": 56.99, "elapsed_time": "3:11:17", "remaining_time": "2:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 1918, "loss": 0.1999, "learning_rate": 2.1263794871067443e-06, "epoch": 0.5702743207141461, "percentage": 57.04, "elapsed_time": "3:11:27", "remaining_time": "2:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 1918, "loss": 0.1693, "learning_rate": 2.1221178174316833e-06, "epoch": 0.5707955952303382, "percentage": 57.09, "elapsed_time": "3:11:37", "remaining_time": "2:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 1918, "loss": 0.1859, "learning_rate": 2.117857271221003e-06, "epoch": 0.5713168697465303, "percentage": 57.14, "elapsed_time": "3:11:47", "remaining_time": "2:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 1918, "loss": 0.1982, "learning_rate": 2.11359786114154e-06, "epoch": 0.5718381442627224, "percentage": 57.19, "elapsed_time": "3:11:58", "remaining_time": "2:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 1918, "loss": 0.1798, "learning_rate": 2.1093395998567527e-06, "epoch": 0.5723594187789145, "percentage": 57.25, "elapsed_time": "3:12:08", "remaining_time": "2:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 1918, "loss": 0.1765, "learning_rate": 2.1050825000266862e-06, "epoch": 0.5728806932951065, "percentage": 57.3, "elapsed_time": "3:12:18", "remaining_time": "2:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 1918, "loss": 0.1958, "learning_rate": 2.1008265743079286e-06, "epoch": 0.5734019678112986, "percentage": 57.35, "elapsed_time": "3:12:27", "remaining_time": "2:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 1918, "loss": 0.2055, "learning_rate": 2.0965718353535807e-06, "epoch": 0.5739232423274907, "percentage": 57.4, "elapsed_time": "3:12:38", "remaining_time": "2:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 1918, "loss": 0.2047, "learning_rate": 2.0923182958132146e-06, "epoch": 0.5744445168436828, "percentage": 57.46, "elapsed_time": "3:12:48", "remaining_time": "2:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 1918, "loss": 0.187, "learning_rate": 2.0880659683328346e-06, "epoch": 0.5749657913598749, "percentage": 57.51, "elapsed_time": "3:12:59", "remaining_time": "2:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 1918, "loss": 0.2004, "learning_rate": 2.0838148655548433e-06, "epoch": 0.575487065876067, "percentage": 57.56, "elapsed_time": "3:13:11", "remaining_time": "2:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 1918, "loss": 0.191, "learning_rate": 2.0795650001180028e-06, "epoch": 0.5760083403922591, "percentage": 57.61, "elapsed_time": "3:13:22", "remaining_time": "2:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 1918, "loss": 0.1997, "learning_rate": 2.0753163846573933e-06, "epoch": 0.5765296149084511, "percentage": 57.66, "elapsed_time": "3:13:33", "remaining_time": "2:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 1918, "loss": 0.1913, "learning_rate": 2.0710690318043814e-06, "epoch": 0.5770508894246432, "percentage": 57.72, "elapsed_time": "3:13:43", "remaining_time": "2:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 1918, "loss": 0.1857, "learning_rate": 2.0668229541865796e-06, "epoch": 0.5775721639408353, "percentage": 57.77, "elapsed_time": "3:13:54", "remaining_time": "2:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 1918, "loss": 0.1943, "learning_rate": 2.0625781644278083e-06, "epoch": 0.5780934384570274, "percentage": 57.82, "elapsed_time": "3:14:04", "remaining_time": "2:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 1918, "loss": 0.1885, "learning_rate": 2.058334675148061e-06, "epoch": 0.5786147129732195, "percentage": 57.87, "elapsed_time": "3:14:14", "remaining_time": "2:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 1918, "loss": 0.186, "learning_rate": 2.05409249896346e-06, "epoch": 0.5791359874894116, "percentage": 57.92, "elapsed_time": "3:14:24", "remaining_time": "2:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 1918, "loss": 0.1935, "learning_rate": 2.049851648486229e-06, "epoch": 0.5796572620056037, "percentage": 57.98, "elapsed_time": "3:14:35", "remaining_time": "2:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 1918, "loss": 0.1774, "learning_rate": 2.04561213632465e-06, "epoch": 0.5801785365217957, "percentage": 58.03, "elapsed_time": "3:14:45", "remaining_time": "2:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 1918, "loss": 0.1978, "learning_rate": 2.041373975083021e-06, "epoch": 0.5806998110379878, "percentage": 58.08, "elapsed_time": "3:14:56", "remaining_time": "2:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 1918, "loss": 0.2117, "learning_rate": 2.037137177361628e-06, "epoch": 0.58122108555418, "percentage": 58.13, "elapsed_time": "3:15:06", "remaining_time": "2:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 1918, "loss": 0.1997, "learning_rate": 2.0329017557567034e-06, "epoch": 0.581742360070372, "percentage": 58.19, "elapsed_time": "3:15:16", "remaining_time": "2:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 1918, "loss": 0.195, "learning_rate": 2.028667722860386e-06, "epoch": 0.5822636345865642, "percentage": 58.24, "elapsed_time": "3:15:27", "remaining_time": "2:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 1918, "loss": 0.1965, "learning_rate": 2.024435091260687e-06, "epoch": 0.5827849091027563, "percentage": 58.29, "elapsed_time": "3:15:38", "remaining_time": "2:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 1918, "loss": 0.2055, "learning_rate": 2.0202038735414532e-06, "epoch": 0.5833061836189484, "percentage": 58.34, "elapsed_time": "3:15:49", "remaining_time": "2:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1918, "loss": 0.1887, "learning_rate": 2.0159740822823233e-06, "epoch": 0.5838274581351404, "percentage": 58.39, "elapsed_time": "3:16:01", "remaining_time": "2:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 1918, "loss": 0.1761, "learning_rate": 2.0117457300586996e-06, "epoch": 0.5843487326513325, "percentage": 58.45, "elapsed_time": "3:16:10", "remaining_time": "2:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 1918, "loss": 0.1849, "learning_rate": 2.007518829441704e-06, "epoch": 0.5848700071675246, "percentage": 58.5, "elapsed_time": "3:16:21", "remaining_time": "2:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 1918, "loss": 0.1974, "learning_rate": 2.0032933929981425e-06, "epoch": 0.5853912816837167, "percentage": 58.55, "elapsed_time": "3:16:32", "remaining_time": "2:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 1918, "loss": 0.1903, "learning_rate": 1.9990694332904705e-06, "epoch": 0.5859125561999088, "percentage": 58.6, "elapsed_time": "3:16:43", "remaining_time": "2:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 1918, "loss": 0.197, "learning_rate": 1.9948469628767475e-06, "epoch": 0.5864338307161009, "percentage": 58.65, "elapsed_time": "3:16:53", "remaining_time": "2:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 1918, "loss": 0.1956, "learning_rate": 1.990625994310612e-06, "epoch": 0.586955105232293, "percentage": 58.71, "elapsed_time": "3:17:03", "remaining_time": "2:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 1918, "loss": 0.1961, "learning_rate": 1.986406540141234e-06, "epoch": 0.5874763797484851, "percentage": 58.76, "elapsed_time": "3:17:14", "remaining_time": "2:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 1918, "loss": 0.2008, "learning_rate": 1.98218861291328e-06, "epoch": 0.5879976542646771, "percentage": 58.81, "elapsed_time": "3:17:25", "remaining_time": "2:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 1918, "loss": 0.1744, "learning_rate": 1.977972225166878e-06, "epoch": 0.5885189287808692, "percentage": 58.86, "elapsed_time": "3:17:34", "remaining_time": "2:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 1918, "loss": 0.1786, "learning_rate": 1.973757389437581e-06, "epoch": 0.5890402032970613, "percentage": 58.92, "elapsed_time": "3:17:45", "remaining_time": "2:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 1918, "loss": 0.201, "learning_rate": 1.9695441182563237e-06, "epoch": 0.5895614778132534, "percentage": 58.97, "elapsed_time": "3:17:58", "remaining_time": "2:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 1918, "loss": 0.1978, "learning_rate": 1.965332424149394e-06, "epoch": 0.5900827523294455, "percentage": 59.02, "elapsed_time": "3:18:09", "remaining_time": "2:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 1918, "loss": 0.1875, "learning_rate": 1.9611223196383866e-06, "epoch": 0.5906040268456376, "percentage": 59.07, "elapsed_time": "3:18:19", "remaining_time": "2:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 1918, "loss": 0.199, "learning_rate": 1.956913817240173e-06, "epoch": 0.5911253013618297, "percentage": 59.12, "elapsed_time": "3:18:29", "remaining_time": "2:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 1918, "loss": 0.1784, "learning_rate": 1.9527069294668617e-06, "epoch": 0.5916465758780217, "percentage": 59.18, "elapsed_time": "3:18:38", "remaining_time": "2:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 1918, "loss": 0.1849, "learning_rate": 1.9485016688257578e-06, "epoch": 0.5921678503942138, "percentage": 59.23, "elapsed_time": "3:18:49", "remaining_time": "2:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 1918, "loss": 0.1965, "learning_rate": 1.9442980478193332e-06, "epoch": 0.5926891249104059, "percentage": 59.28, "elapsed_time": "3:18:58", "remaining_time": "2:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 1918, "loss": 0.1944, "learning_rate": 1.9400960789451827e-06, "epoch": 0.593210399426598, "percentage": 59.33, "elapsed_time": "3:19:10", "remaining_time": "2:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 1918, "loss": 0.1932, "learning_rate": 1.935895774695988e-06, "epoch": 0.5937316739427901, "percentage": 59.38, "elapsed_time": "3:19:19", "remaining_time": "2:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 1918, "loss": 0.187, "learning_rate": 1.9316971475594835e-06, "epoch": 0.5942529484589822, "percentage": 59.44, "elapsed_time": "3:19:29", "remaining_time": "2:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 1918, "loss": 0.1755, "learning_rate": 1.9275002100184186e-06, "epoch": 0.5947742229751743, "percentage": 59.49, "elapsed_time": "3:19:40", "remaining_time": "2:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 1918, "loss": 0.1822, "learning_rate": 1.9233049745505167e-06, "epoch": 0.5952954974913663, "percentage": 59.54, "elapsed_time": "3:19:50", "remaining_time": "2:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 1918, "loss": 0.2018, "learning_rate": 1.919111453628442e-06, "epoch": 0.5958167720075584, "percentage": 59.59, "elapsed_time": "3:20:02", "remaining_time": "2:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 1918, "loss": 0.1943, "learning_rate": 1.914919659719762e-06, "epoch": 0.5963380465237506, "percentage": 59.65, "elapsed_time": "3:20:13", "remaining_time": "2:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 1918, "loss": 0.1993, "learning_rate": 1.9107296052869086e-06, "epoch": 0.5968593210399427, "percentage": 59.7, "elapsed_time": "3:20:24", "remaining_time": "2:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 1918, "loss": 0.2039, "learning_rate": 1.9065413027871437e-06, "epoch": 0.5973805955561348, "percentage": 59.75, "elapsed_time": "3:20:34", "remaining_time": "2:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 1918, "loss": 0.1835, "learning_rate": 1.902354764672518e-06, "epoch": 0.5979018700723269, "percentage": 59.8, "elapsed_time": "3:20:44", "remaining_time": "2:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 1918, "loss": 0.1916, "learning_rate": 1.8981700033898387e-06, "epoch": 0.598423144588519, "percentage": 59.85, "elapsed_time": "3:20:54", "remaining_time": "2:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 1918, "loss": 0.1709, "learning_rate": 1.8939870313806302e-06, "epoch": 0.598944419104711, "percentage": 59.91, "elapsed_time": "3:21:04", "remaining_time": "2:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 1918, "loss": 0.1976, "learning_rate": 1.8898058610810963e-06, "epoch": 0.5994656936209031, "percentage": 59.96, "elapsed_time": "3:21:15", "remaining_time": "2:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 1918, "loss": 0.1763, "learning_rate": 1.8856265049220852e-06, "epoch": 0.5999869681370952, "percentage": 60.01, "elapsed_time": "3:21:24", "remaining_time": "2:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 1918, "loss": 0.1905, "learning_rate": 1.8814489753290517e-06, "epoch": 0.6005082426532873, "percentage": 60.06, "elapsed_time": "3:21:35", "remaining_time": "2:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 1918, "loss": 0.1805, "learning_rate": 1.8772732847220182e-06, "epoch": 0.6010295171694794, "percentage": 60.11, "elapsed_time": "3:21:45", "remaining_time": "2:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 1918, "loss": 0.1988, "learning_rate": 1.873099445515542e-06, "epoch": 0.6015507916856715, "percentage": 60.17, "elapsed_time": "3:21:55", "remaining_time": "2:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 1918, "loss": 0.1873, "learning_rate": 1.868927470118675e-06, "epoch": 0.6020720662018636, "percentage": 60.22, "elapsed_time": "3:22:06", "remaining_time": "2:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 1918, "loss": 0.19, "learning_rate": 1.8647573709349275e-06, "epoch": 0.6025933407180556, "percentage": 60.27, "elapsed_time": "3:22:16", "remaining_time": "2:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 1918, "loss": 0.1855, "learning_rate": 1.860589160362234e-06, "epoch": 0.6031146152342477, "percentage": 60.32, "elapsed_time": "3:22:27", "remaining_time": "2:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 1918, "loss": 0.1885, "learning_rate": 1.8564228507929099e-06, "epoch": 0.6036358897504398, "percentage": 60.38, "elapsed_time": "3:22:39", "remaining_time": "2:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.852258454613623e-06, "epoch": 0.6041571642666319, "percentage": 60.43, "elapsed_time": "3:22:49", "remaining_time": "2:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 1918, "loss": 0.1871, "learning_rate": 1.8480959842053508e-06, "epoch": 0.604678438782824, "percentage": 60.48, "elapsed_time": "3:23:00", "remaining_time": "2:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 1918, "loss": 0.1863, "learning_rate": 1.843935451943344e-06, "epoch": 0.6051997132990161, "percentage": 60.53, "elapsed_time": "3:23:11", "remaining_time": "2:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 1918, "loss": 0.1895, "learning_rate": 1.839776870197093e-06, "epoch": 0.6057209878152082, "percentage": 60.58, "elapsed_time": "3:23:20", "remaining_time": "2:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 1918, "loss": 0.1851, "learning_rate": 1.8356202513302896e-06, "epoch": 0.6062422623314003, "percentage": 60.64, "elapsed_time": "3:23:31", "remaining_time": "2:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 1918, "loss": 0.1845, "learning_rate": 1.831465607700787e-06, "epoch": 0.6067635368475923, "percentage": 60.69, "elapsed_time": "3:23:41", "remaining_time": "2:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 1918, "loss": 0.1938, "learning_rate": 1.8273129516605698e-06, "epoch": 0.6072848113637844, "percentage": 60.74, "elapsed_time": "3:23:51", "remaining_time": "2:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 1918, "loss": 0.1871, "learning_rate": 1.8231622955557094e-06, "epoch": 0.6078060858799765, "percentage": 60.79, "elapsed_time": "3:24:01", "remaining_time": "2:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 1918, "loss": 0.183, "learning_rate": 1.819013651726334e-06, "epoch": 0.6083273603961686, "percentage": 60.84, "elapsed_time": "3:24:11", "remaining_time": "2:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 1918, "loss": 0.192, "learning_rate": 1.8148670325065893e-06, "epoch": 0.6088486349123607, "percentage": 60.9, "elapsed_time": "3:24:22", "remaining_time": "2:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 1918, "loss": 0.1932, "learning_rate": 1.8107224502245997e-06, "epoch": 0.6093699094285528, "percentage": 60.95, "elapsed_time": "3:24:32", "remaining_time": "2:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 1918, "loss": 0.1843, "learning_rate": 1.806579917202435e-06, "epoch": 0.609891183944745, "percentage": 61.0, "elapsed_time": "3:24:42", "remaining_time": "2:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 1918, "loss": 0.1998, "learning_rate": 1.802439445756073e-06, "epoch": 0.610412458460937, "percentage": 61.05, "elapsed_time": "3:24:52", "remaining_time": "2:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 1918, "loss": 0.2012, "learning_rate": 1.7983010481953605e-06, "epoch": 0.610933732977129, "percentage": 61.11, "elapsed_time": "3:25:03", "remaining_time": "2:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 1918, "loss": 0.1767, "learning_rate": 1.7941647368239806e-06, "epoch": 0.6114550074933212, "percentage": 61.16, "elapsed_time": "3:25:13", "remaining_time": "2:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 1918, "loss": 0.1962, "learning_rate": 1.7900305239394134e-06, "epoch": 0.6119762820095133, "percentage": 61.21, "elapsed_time": "3:25:24", "remaining_time": "2:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 1918, "loss": 0.1991, "learning_rate": 1.785898421832898e-06, "epoch": 0.6124975565257054, "percentage": 61.26, "elapsed_time": "3:25:34", "remaining_time": "2:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 1918, "loss": 0.175, "learning_rate": 1.7817684427894016e-06, "epoch": 0.6130188310418975, "percentage": 61.31, "elapsed_time": "3:25:45", "remaining_time": "2:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 1918, "loss": 0.2054, "learning_rate": 1.7776405990875761e-06, "epoch": 0.6135401055580896, "percentage": 61.37, "elapsed_time": "3:25:54", "remaining_time": "2:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 1918, "loss": 0.1742, "learning_rate": 1.7735149029997273e-06, "epoch": 0.6140613800742816, "percentage": 61.42, "elapsed_time": "3:26:04", "remaining_time": "2:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 1918, "loss": 0.1904, "learning_rate": 1.7693913667917757e-06, "epoch": 0.6145826545904737, "percentage": 61.47, "elapsed_time": "3:26:14", "remaining_time": "2:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 1918, "loss": 0.19, "learning_rate": 1.7652700027232184e-06, "epoch": 0.6151039291066658, "percentage": 61.52, "elapsed_time": "3:26:24", "remaining_time": "2:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 1918, "loss": 0.1918, "learning_rate": 1.7611508230470963e-06, "epoch": 0.6156252036228579, "percentage": 61.57, "elapsed_time": "3:26:35", "remaining_time": "2:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 1918, "loss": 0.1811, "learning_rate": 1.7570338400099569e-06, "epoch": 0.61614647813905, "percentage": 61.63, "elapsed_time": "3:26:46", "remaining_time": "2:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 1918, "loss": 0.1946, "learning_rate": 1.7529190658518142e-06, "epoch": 0.6166677526552421, "percentage": 61.68, "elapsed_time": "3:26:56", "remaining_time": "2:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 1918, "loss": 0.184, "learning_rate": 1.7488065128061187e-06, "epoch": 0.6171890271714342, "percentage": 61.73, "elapsed_time": "3:27:06", "remaining_time": "2:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 1918, "loss": 0.1832, "learning_rate": 1.7446961930997126e-06, "epoch": 0.6177103016876262, "percentage": 61.78, "elapsed_time": "3:27:17", "remaining_time": "2:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 1918, "loss": 0.2049, "learning_rate": 1.7405881189528024e-06, "epoch": 0.6182315762038183, "percentage": 61.84, "elapsed_time": "3:27:28", "remaining_time": "2:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 1918, "loss": 0.195, "learning_rate": 1.7364823025789184e-06, "epoch": 0.6187528507200104, "percentage": 61.89, "elapsed_time": "3:27:37", "remaining_time": "2:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 1918, "loss": 0.1893, "learning_rate": 1.732378756184875e-06, "epoch": 0.6192741252362025, "percentage": 61.94, "elapsed_time": "3:27:48", "remaining_time": "2:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 1918, "loss": 0.1851, "learning_rate": 1.7282774919707406e-06, "epoch": 0.6197953997523946, "percentage": 61.99, "elapsed_time": "3:27:59", "remaining_time": "2:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 1918, "loss": 0.1955, "learning_rate": 1.7241785221297984e-06, "epoch": 0.6203166742685867, "percentage": 62.04, "elapsed_time": "3:28:09", "remaining_time": "2:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 1918, "loss": 0.1835, "learning_rate": 1.7200818588485088e-06, "epoch": 0.6208379487847788, "percentage": 62.1, "elapsed_time": "3:28:20", "remaining_time": "2:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 1918, "loss": 0.192, "learning_rate": 1.715987514306476e-06, "epoch": 0.6213592233009708, "percentage": 62.15, "elapsed_time": "3:28:31", "remaining_time": "2:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 1918, "loss": 0.1832, "learning_rate": 1.7118955006764116e-06, "epoch": 0.6218804978171629, "percentage": 62.2, "elapsed_time": "3:28:42", "remaining_time": "2:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 1918, "loss": 0.1851, "learning_rate": 1.707805830124093e-06, "epoch": 0.622401772333355, "percentage": 62.25, "elapsed_time": "3:28:51", "remaining_time": "2:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 1918, "loss": 0.1854, "learning_rate": 1.703718514808336e-06, "epoch": 0.6229230468495471, "percentage": 62.3, "elapsed_time": "3:29:02", "remaining_time": "2:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 1918, "loss": 0.1872, "learning_rate": 1.6996335668809515e-06, "epoch": 0.6234443213657392, "percentage": 62.36, "elapsed_time": "3:29:12", "remaining_time": "2:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 1918, "loss": 0.2012, "learning_rate": 1.6955509984867136e-06, "epoch": 0.6239655958819313, "percentage": 62.41, "elapsed_time": "3:29:23", "remaining_time": "2:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 1918, "loss": 0.1918, "learning_rate": 1.691470821763322e-06, "epoch": 0.6244868703981235, "percentage": 62.46, "elapsed_time": "3:29:34", "remaining_time": "2:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 1918, "loss": 0.2038, "learning_rate": 1.6873930488413628e-06, "epoch": 0.6250081449143156, "percentage": 62.51, "elapsed_time": "3:29:44", "remaining_time": "2:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 1918, "loss": 0.172, "learning_rate": 1.6833176918442796e-06, "epoch": 0.6255294194305075, "percentage": 62.57, "elapsed_time": "3:29:54", "remaining_time": "2:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 1918, "loss": 0.1931, "learning_rate": 1.6792447628883318e-06, "epoch": 0.6260506939466997, "percentage": 62.62, "elapsed_time": "3:30:06", "remaining_time": "2:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 1918, "loss": 0.1859, "learning_rate": 1.6751742740825583e-06, "epoch": 0.6265719684628918, "percentage": 62.67, "elapsed_time": "3:30:15", "remaining_time": "2:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 1918, "loss": 0.1886, "learning_rate": 1.6711062375287451e-06, "epoch": 0.6270932429790839, "percentage": 62.72, "elapsed_time": "3:30:26", "remaining_time": "2:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 1918, "loss": 0.1879, "learning_rate": 1.6670406653213883e-06, "epoch": 0.627614517495276, "percentage": 62.77, "elapsed_time": "3:30:36", "remaining_time": "2:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 1918, "loss": 0.1888, "learning_rate": 1.6629775695476551e-06, "epoch": 0.6281357920114681, "percentage": 62.83, "elapsed_time": "3:30:47", "remaining_time": "2:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 1918, "loss": 0.1768, "learning_rate": 1.6589169622873524e-06, "epoch": 0.6286570665276602, "percentage": 62.88, "elapsed_time": "3:30:56", "remaining_time": "2:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 1918, "loss": 0.1854, "learning_rate": 1.654858855612886e-06, "epoch": 0.6291783410438522, "percentage": 62.93, "elapsed_time": "3:31:05", "remaining_time": "2:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 1918, "loss": 0.1941, "learning_rate": 1.6508032615892294e-06, "epoch": 0.6296996155600443, "percentage": 62.98, "elapsed_time": "3:31:16", "remaining_time": "2:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 1918, "loss": 0.2016, "learning_rate": 1.6467501922738862e-06, "epoch": 0.6302208900762364, "percentage": 63.03, "elapsed_time": "3:31:26", "remaining_time": "2:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 1918, "loss": 0.2032, "learning_rate": 1.6426996597168517e-06, "epoch": 0.6307421645924285, "percentage": 63.09, "elapsed_time": "3:31:36", "remaining_time": "2:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 1918, "loss": 0.2042, "learning_rate": 1.6386516759605813e-06, "epoch": 0.6312634391086206, "percentage": 63.14, "elapsed_time": "3:31:46", "remaining_time": "2:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 1918, "loss": 0.1806, "learning_rate": 1.6346062530399525e-06, "epoch": 0.6317847136248127, "percentage": 63.19, "elapsed_time": "3:31:56", "remaining_time": "2:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 1918, "loss": 0.1953, "learning_rate": 1.6305634029822267e-06, "epoch": 0.6323059881410048, "percentage": 63.24, "elapsed_time": "3:32:06", "remaining_time": "2:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 1918, "loss": 0.1896, "learning_rate": 1.6265231378070197e-06, "epoch": 0.6328272626571968, "percentage": 63.3, "elapsed_time": "3:32:16", "remaining_time": "2:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 1918, "loss": 0.1931, "learning_rate": 1.6224854695262616e-06, "epoch": 0.6333485371733889, "percentage": 63.35, "elapsed_time": "3:32:27", "remaining_time": "2:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 1918, "loss": 0.1796, "learning_rate": 1.6184504101441584e-06, "epoch": 0.633869811689581, "percentage": 63.4, "elapsed_time": "3:32:37", "remaining_time": "2:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 1918, "loss": 0.1785, "learning_rate": 1.614417971657164e-06, "epoch": 0.6343910862057731, "percentage": 63.45, "elapsed_time": "3:32:49", "remaining_time": "2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 1918, "loss": 0.1989, "learning_rate": 1.6103881660539369e-06, "epoch": 0.6349123607219652, "percentage": 63.5, "elapsed_time": "3:32:58", "remaining_time": "2:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 1918, "loss": 0.1953, "learning_rate": 1.6063610053153106e-06, "epoch": 0.6354336352381573, "percentage": 63.56, "elapsed_time": "3:33:09", "remaining_time": "2:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 1918, "loss": 0.1887, "learning_rate": 1.6023365014142544e-06, "epoch": 0.6359549097543494, "percentage": 63.61, "elapsed_time": "3:33:18", "remaining_time": "2:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 1918, "loss": 0.1912, "learning_rate": 1.5983146663158368e-06, "epoch": 0.6364761842705414, "percentage": 63.66, "elapsed_time": "3:33:29", "remaining_time": "2:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 1918, "loss": 0.1931, "learning_rate": 1.5942955119771942e-06, "epoch": 0.6369974587867335, "percentage": 63.71, "elapsed_time": "3:33:40", "remaining_time": "2:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 1918, "loss": 0.2011, "learning_rate": 1.5902790503474928e-06, "epoch": 0.6375187333029256, "percentage": 63.76, "elapsed_time": "3:33:51", "remaining_time": "2:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 1918, "loss": 0.1898, "learning_rate": 1.586265293367891e-06, "epoch": 0.6380400078191177, "percentage": 63.82, "elapsed_time": "3:34:02", "remaining_time": "2:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 1918, "loss": 0.193, "learning_rate": 1.5822542529715084e-06, "epoch": 0.6385612823353098, "percentage": 63.87, "elapsed_time": "3:34:12", "remaining_time": "2:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 1918, "loss": 0.1713, "learning_rate": 1.578245941083389e-06, "epoch": 0.639082556851502, "percentage": 63.92, "elapsed_time": "3:34:23", "remaining_time": "2:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 1918, "loss": 0.1879, "learning_rate": 1.57424036962046e-06, "epoch": 0.639603831367694, "percentage": 63.97, "elapsed_time": "3:34:33", "remaining_time": "2:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 1918, "loss": 0.1802, "learning_rate": 1.5702375504915062e-06, "epoch": 0.640125105883886, "percentage": 64.03, "elapsed_time": "3:34:45", "remaining_time": "2:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 1918, "loss": 0.1995, "learning_rate": 1.5662374955971268e-06, "epoch": 0.6406463804000782, "percentage": 64.08, "elapsed_time": "3:34:54", "remaining_time": "2:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.562240216829704e-06, "epoch": 0.6411676549162703, "percentage": 64.13, "elapsed_time": "3:35:04", "remaining_time": "2:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 1918, "loss": 0.2073, "learning_rate": 1.5582457260733664e-06, "epoch": 0.6416889294324624, "percentage": 64.18, "elapsed_time": "3:35:16", "remaining_time": "2:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 1918, "loss": 0.1994, "learning_rate": 1.5542540352039525e-06, "epoch": 0.6422102039486545, "percentage": 64.23, "elapsed_time": "3:35:28", "remaining_time": "1:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 1918, "loss": 0.1987, "learning_rate": 1.550265156088978e-06, "epoch": 0.6427314784648466, "percentage": 64.29, "elapsed_time": "3:35:37", "remaining_time": "1:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 1918, "loss": 0.1968, "learning_rate": 1.5462791005875994e-06, "epoch": 0.6432527529810387, "percentage": 64.34, "elapsed_time": "3:35:47", "remaining_time": "1:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 1918, "loss": 0.1856, "learning_rate": 1.542295880550575e-06, "epoch": 0.6437740274972308, "percentage": 64.39, "elapsed_time": "3:35:57", "remaining_time": "1:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 1918, "loss": 0.1789, "learning_rate": 1.5383155078202377e-06, "epoch": 0.6442953020134228, "percentage": 64.44, "elapsed_time": "3:36:08", "remaining_time": "1:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 1918, "loss": 0.1833, "learning_rate": 1.534337994230453e-06, "epoch": 0.6448165765296149, "percentage": 64.49, "elapsed_time": "3:36:19", "remaining_time": "1:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 1918, "loss": 0.2029, "learning_rate": 1.5303633516065852e-06, "epoch": 0.645337851045807, "percentage": 64.55, "elapsed_time": "3:36:30", "remaining_time": "1:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 1918, "loss": 0.1895, "learning_rate": 1.5263915917654654e-06, "epoch": 0.6458591255619991, "percentage": 64.6, "elapsed_time": "3:36:41", "remaining_time": "1:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 1918, "loss": 0.1843, "learning_rate": 1.5224227265153512e-06, "epoch": 0.6463804000781912, "percentage": 64.65, "elapsed_time": "3:36:51", "remaining_time": "1:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 1918, "loss": 0.177, "learning_rate": 1.5184567676558965e-06, "epoch": 0.6469016745943833, "percentage": 64.7, "elapsed_time": "3:37:02", "remaining_time": "1:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 1918, "loss": 0.1902, "learning_rate": 1.5144937269781142e-06, "epoch": 0.6474229491105754, "percentage": 64.75, "elapsed_time": "3:37:12", "remaining_time": "1:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 1918, "loss": 0.1879, "learning_rate": 1.5105336162643403e-06, "epoch": 0.6479442236267674, "percentage": 64.81, "elapsed_time": "3:37:22", "remaining_time": "1:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 1918, "loss": 0.1991, "learning_rate": 1.5065764472882e-06, "epoch": 0.6484654981429595, "percentage": 64.86, "elapsed_time": "3:37:31", "remaining_time": "1:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 1918, "loss": 0.1776, "learning_rate": 1.5026222318145745e-06, "epoch": 0.6489867726591516, "percentage": 64.91, "elapsed_time": "3:37:42", "remaining_time": "1:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 1918, "loss": 0.1811, "learning_rate": 1.4986709815995604e-06, "epoch": 0.6495080471753437, "percentage": 64.96, "elapsed_time": "3:37:51", "remaining_time": "1:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 1918, "loss": 0.1829, "learning_rate": 1.494722708390442e-06, "epoch": 0.6500293216915358, "percentage": 65.02, "elapsed_time": "3:38:02", "remaining_time": "1:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 1918, "loss": 0.2026, "learning_rate": 1.4907774239256517e-06, "epoch": 0.6505505962077279, "percentage": 65.07, "elapsed_time": "3:38:13", "remaining_time": "1:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 1918, "loss": 0.1875, "learning_rate": 1.486835139934734e-06, "epoch": 0.65107187072392, "percentage": 65.12, "elapsed_time": "3:38:23", "remaining_time": "1:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 1918, "loss": 0.1806, "learning_rate": 1.4828958681383163e-06, "epoch": 0.651593145240112, "percentage": 65.17, "elapsed_time": "3:38:32", "remaining_time": "1:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 1918, "loss": 0.1954, "learning_rate": 1.4789596202480678e-06, "epoch": 0.6521144197563041, "percentage": 65.22, "elapsed_time": "3:38:43", "remaining_time": "1:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 1918, "loss": 0.1919, "learning_rate": 1.475026407966669e-06, "epoch": 0.6526356942724962, "percentage": 65.28, "elapsed_time": "3:38:54", "remaining_time": "1:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 1918, "loss": 0.1794, "learning_rate": 1.4710962429877763e-06, "epoch": 0.6531569687886883, "percentage": 65.33, "elapsed_time": "3:39:05", "remaining_time": "1:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 1918, "loss": 0.1858, "learning_rate": 1.4671691369959826e-06, "epoch": 0.6536782433048804, "percentage": 65.38, "elapsed_time": "3:39:15", "remaining_time": "1:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 1918, "loss": 0.1879, "learning_rate": 1.4632451016667899e-06, "epoch": 0.6541995178210726, "percentage": 65.43, "elapsed_time": "3:39:26", "remaining_time": "1:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 1918, "loss": 0.17, "learning_rate": 1.4593241486665705e-06, "epoch": 0.6547207923372647, "percentage": 65.48, "elapsed_time": "3:39:37", "remaining_time": "1:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 1918, "loss": 0.1882, "learning_rate": 1.4554062896525295e-06, "epoch": 0.6552420668534567, "percentage": 65.54, "elapsed_time": "3:39:47", "remaining_time": "1:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 1918, "loss": 0.196, "learning_rate": 1.4514915362726773e-06, "epoch": 0.6557633413696488, "percentage": 65.59, "elapsed_time": "3:39:57", "remaining_time": "1:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 1918, "loss": 0.1737, "learning_rate": 1.447579900165792e-06, "epoch": 0.6562846158858409, "percentage": 65.64, "elapsed_time": "3:40:06", "remaining_time": "1:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.4436713929613771e-06, "epoch": 0.656805890402033, "percentage": 65.69, "elapsed_time": "3:40:16", "remaining_time": "1:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 1918, "loss": 0.1874, "learning_rate": 1.4397660262796411e-06, "epoch": 0.6573271649182251, "percentage": 65.75, "elapsed_time": "3:40:26", "remaining_time": "1:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 1918, "loss": 0.1735, "learning_rate": 1.4358638117314521e-06, "epoch": 0.6578484394344172, "percentage": 65.8, "elapsed_time": "3:40:37", "remaining_time": "1:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 1918, "loss": 0.1877, "learning_rate": 1.4319647609183058e-06, "epoch": 0.6583697139506093, "percentage": 65.85, "elapsed_time": "3:40:48", "remaining_time": "1:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 1918, "loss": 0.1832, "learning_rate": 1.428068885432296e-06, "epoch": 0.6588909884668013, "percentage": 65.9, "elapsed_time": "3:40:58", "remaining_time": "1:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 1918, "loss": 0.1707, "learning_rate": 1.4241761968560703e-06, "epoch": 0.6594122629829934, "percentage": 65.95, "elapsed_time": "3:41:08", "remaining_time": "1:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 1918, "loss": 0.1935, "learning_rate": 1.4202867067628068e-06, "epoch": 0.6599335374991855, "percentage": 66.01, "elapsed_time": "3:41:17", "remaining_time": "1:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 1918, "loss": 0.1972, "learning_rate": 1.4164004267161718e-06, "epoch": 0.6604548120153776, "percentage": 66.06, "elapsed_time": "3:41:28", "remaining_time": "1:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 1918, "loss": 0.2, "learning_rate": 1.4125173682702869e-06, "epoch": 0.6609760865315697, "percentage": 66.11, "elapsed_time": "3:41:39", "remaining_time": "1:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 1918, "loss": 0.184, "learning_rate": 1.4086375429696987e-06, "epoch": 0.6614973610477618, "percentage": 66.16, "elapsed_time": "3:41:48", "remaining_time": "1:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 1918, "loss": 0.1728, "learning_rate": 1.4047609623493396e-06, "epoch": 0.6620186355639539, "percentage": 66.21, "elapsed_time": "3:41:58", "remaining_time": "1:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 1918, "loss": 0.1812, "learning_rate": 1.400887637934495e-06, "epoch": 0.662539910080146, "percentage": 66.27, "elapsed_time": "3:42:07", "remaining_time": "1:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 1918, "loss": 0.1807, "learning_rate": 1.3970175812407705e-06, "epoch": 0.663061184596338, "percentage": 66.32, "elapsed_time": "3:42:17", "remaining_time": "1:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 1918, "loss": 0.1776, "learning_rate": 1.393150803774055e-06, "epoch": 0.6635824591125301, "percentage": 66.37, "elapsed_time": "3:42:27", "remaining_time": "1:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 1918, "loss": 0.192, "learning_rate": 1.3892873170304913e-06, "epoch": 0.6641037336287222, "percentage": 66.42, "elapsed_time": "3:42:39", "remaining_time": "1:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 1918, "loss": 0.2011, "learning_rate": 1.3854271324964353e-06, "epoch": 0.6646250081449143, "percentage": 66.48, "elapsed_time": "3:42:50", "remaining_time": "1:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 1918, "loss": 0.1862, "learning_rate": 1.3815702616484262e-06, "epoch": 0.6651462826611064, "percentage": 66.53, "elapsed_time": "3:43:02", "remaining_time": "1:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 1918, "loss": 0.1731, "learning_rate": 1.3777167159531532e-06, "epoch": 0.6656675571772985, "percentage": 66.58, "elapsed_time": "3:43:13", "remaining_time": "1:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 1918, "loss": 0.1947, "learning_rate": 1.3738665068674176e-06, "epoch": 0.6661888316934906, "percentage": 66.63, "elapsed_time": "3:43:23", "remaining_time": "1:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 1918, "loss": 0.1804, "learning_rate": 1.3700196458381012e-06, "epoch": 0.6667101062096826, "percentage": 66.68, "elapsed_time": "3:43:35", "remaining_time": "1:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 1918, "loss": 0.1943, "learning_rate": 1.3661761443021316e-06, "epoch": 0.6672313807258747, "percentage": 66.74, "elapsed_time": "3:43:43", "remaining_time": "1:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 1918, "loss": 0.1842, "learning_rate": 1.36233601368645e-06, "epoch": 0.6677526552420668, "percentage": 66.79, "elapsed_time": "3:43:54", "remaining_time": "1:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 1918, "loss": 0.1867, "learning_rate": 1.3584992654079742e-06, "epoch": 0.6682739297582589, "percentage": 66.84, "elapsed_time": "3:44:04", "remaining_time": "1:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 1918, "loss": 0.178, "learning_rate": 1.3546659108735666e-06, "epoch": 0.668795204274451, "percentage": 66.89, "elapsed_time": "3:44:13", "remaining_time": "1:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 1918, "loss": 0.1867, "learning_rate": 1.3508359614799998e-06, "epoch": 0.6693164787906432, "percentage": 66.94, "elapsed_time": "3:44:24", "remaining_time": "1:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 1918, "loss": 0.2016, "learning_rate": 1.3470094286139213e-06, "epoch": 0.6698377533068353, "percentage": 67.0, "elapsed_time": "3:44:33", "remaining_time": "1:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 1918, "loss": 0.1878, "learning_rate": 1.3431863236518242e-06, "epoch": 0.6703590278230273, "percentage": 67.05, "elapsed_time": "3:44:43", "remaining_time": "1:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 1918, "loss": 0.1778, "learning_rate": 1.3393666579600078e-06, "epoch": 0.6708803023392194, "percentage": 67.1, "elapsed_time": "3:44:53", "remaining_time": "1:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 1918, "loss": 0.1897, "learning_rate": 1.3355504428945464e-06, "epoch": 0.6714015768554115, "percentage": 67.15, "elapsed_time": "3:45:03", "remaining_time": "1:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 1918, "loss": 0.1864, "learning_rate": 1.3317376898012573e-06, "epoch": 0.6719228513716036, "percentage": 67.21, "elapsed_time": "3:45:13", "remaining_time": "1:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 1918, "loss": 0.2057, "learning_rate": 1.3279284100156633e-06, "epoch": 0.6724441258877957, "percentage": 67.26, "elapsed_time": "3:45:22", "remaining_time": "1:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 1918, "loss": 0.1848, "learning_rate": 1.32412261486296e-06, "epoch": 0.6729654004039878, "percentage": 67.31, "elapsed_time": "3:45:33", "remaining_time": "1:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 1918, "loss": 0.1712, "learning_rate": 1.3203203156579875e-06, "epoch": 0.6734866749201799, "percentage": 67.36, "elapsed_time": "3:45:43", "remaining_time": "1:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 1918, "loss": 0.1836, "learning_rate": 1.316521523705185e-06, "epoch": 0.6740079494363719, "percentage": 67.41, "elapsed_time": "3:45:54", "remaining_time": "1:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 1918, "loss": 0.1837, "learning_rate": 1.3127262502985722e-06, "epoch": 0.674529223952564, "percentage": 67.47, "elapsed_time": "3:46:05", "remaining_time": "1:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 1918, "loss": 0.1881, "learning_rate": 1.3089345067217025e-06, "epoch": 0.6750504984687561, "percentage": 67.52, "elapsed_time": "3:46:16", "remaining_time": "1:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 1918, "loss": 0.1729, "learning_rate": 1.3051463042476358e-06, "epoch": 0.6755717729849482, "percentage": 67.57, "elapsed_time": "3:46:25", "remaining_time": "1:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 1918, "loss": 0.1734, "learning_rate": 1.301361654138909e-06, "epoch": 0.6760930475011403, "percentage": 67.62, "elapsed_time": "3:46:34", "remaining_time": "1:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 1918, "loss": 0.1936, "learning_rate": 1.297580567647489e-06, "epoch": 0.6766143220173324, "percentage": 67.67, "elapsed_time": "3:46:45", "remaining_time": "1:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 1918, "loss": 0.1824, "learning_rate": 1.2938030560147558e-06, "epoch": 0.6771355965335245, "percentage": 67.73, "elapsed_time": "3:46:55", "remaining_time": "1:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 1918, "loss": 0.1937, "learning_rate": 1.2900291304714568e-06, "epoch": 0.6776568710497165, "percentage": 67.78, "elapsed_time": "3:47:07", "remaining_time": "1:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 1918, "loss": 0.1999, "learning_rate": 1.2862588022376782e-06, "epoch": 0.6781781455659086, "percentage": 67.83, "elapsed_time": "3:47:17", "remaining_time": "1:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 1918, "loss": 0.1801, "learning_rate": 1.2824920825228132e-06, "epoch": 0.6786994200821007, "percentage": 67.88, "elapsed_time": "3:47:28", "remaining_time": "1:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 1918, "loss": 0.2058, "learning_rate": 1.278728982525525e-06, "epoch": 0.6792206945982928, "percentage": 67.94, "elapsed_time": "3:47:38", "remaining_time": "1:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 1918, "loss": 0.1842, "learning_rate": 1.2749695134337149e-06, "epoch": 0.6797419691144849, "percentage": 67.99, "elapsed_time": "3:47:48", "remaining_time": "1:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 1918, "loss": 0.1608, "learning_rate": 1.2712136864244917e-06, "epoch": 0.680263243630677, "percentage": 68.04, "elapsed_time": "3:47:58", "remaining_time": "1:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 1918, "loss": 0.1855, "learning_rate": 1.2674615126641313e-06, "epoch": 0.6807845181468691, "percentage": 68.09, "elapsed_time": "3:48:08", "remaining_time": "1:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 1918, "loss": 0.1778, "learning_rate": 1.2637130033080541e-06, "epoch": 0.6813057926630612, "percentage": 68.14, "elapsed_time": "3:48:20", "remaining_time": "1:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 1918, "loss": 0.1908, "learning_rate": 1.2599681695007822e-06, "epoch": 0.6818270671792532, "percentage": 68.2, "elapsed_time": "3:48:30", "remaining_time": "1:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 1918, "loss": 0.1896, "learning_rate": 1.2562270223759104e-06, "epoch": 0.6823483416954453, "percentage": 68.25, "elapsed_time": "3:48:40", "remaining_time": "1:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 1918, "loss": 0.188, "learning_rate": 1.2524895730560755e-06, "epoch": 0.6828696162116374, "percentage": 68.3, "elapsed_time": "3:48:51", "remaining_time": "1:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 1918, "loss": 0.1936, "learning_rate": 1.2487558326529177e-06, "epoch": 0.6833908907278295, "percentage": 68.35, "elapsed_time": "3:49:01", "remaining_time": "1:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 1918, "loss": 0.1765, "learning_rate": 1.2450258122670508e-06, "epoch": 0.6839121652440217, "percentage": 68.4, "elapsed_time": "3:49:12", "remaining_time": "1:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 1918, "loss": 0.1826, "learning_rate": 1.2412995229880295e-06, "epoch": 0.6844334397602138, "percentage": 68.46, "elapsed_time": "3:49:23", "remaining_time": "1:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 1918, "loss": 0.1991, "learning_rate": 1.2375769758943148e-06, "epoch": 0.6849547142764059, "percentage": 68.51, "elapsed_time": "3:49:33", "remaining_time": "1:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 1918, "loss": 0.1942, "learning_rate": 1.2338581820532442e-06, "epoch": 0.6854759887925979, "percentage": 68.56, "elapsed_time": "3:49:43", "remaining_time": "1:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 1918, "loss": 0.1787, "learning_rate": 1.2301431525209942e-06, "epoch": 0.68599726330879, "percentage": 68.61, "elapsed_time": "3:49:55", "remaining_time": "1:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 1918, "loss": 0.1861, "learning_rate": 1.2264318983425498e-06, "epoch": 0.6865185378249821, "percentage": 68.67, "elapsed_time": "3:50:05", "remaining_time": "1:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 1918, "loss": 0.1753, "learning_rate": 1.222724430551674e-06, "epoch": 0.6870398123411742, "percentage": 68.72, "elapsed_time": "3:50:14", "remaining_time": "1:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 1918, "loss": 0.1778, "learning_rate": 1.2190207601708707e-06, "epoch": 0.6875610868573663, "percentage": 68.77, "elapsed_time": "3:50:24", "remaining_time": "1:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 1918, "loss": 0.1705, "learning_rate": 1.215320898211354e-06, "epoch": 0.6880823613735584, "percentage": 68.82, "elapsed_time": "3:50:33", "remaining_time": "1:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 1918, "loss": 0.1853, "learning_rate": 1.2116248556730151e-06, "epoch": 0.6886036358897505, "percentage": 68.87, "elapsed_time": "3:50:44", "remaining_time": "1:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 1918, "loss": 0.1869, "learning_rate": 1.207932643544392e-06, "epoch": 0.6891249104059425, "percentage": 68.93, "elapsed_time": "3:50:55", "remaining_time": "1:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 1918, "loss": 0.1817, "learning_rate": 1.2042442728026325e-06, "epoch": 0.6896461849221346, "percentage": 68.98, "elapsed_time": "3:51:05", "remaining_time": "1:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 1918, "loss": 0.2027, "learning_rate": 1.200559754413464e-06, "epoch": 0.6901674594383267, "percentage": 69.03, "elapsed_time": "3:51:15", "remaining_time": "1:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 1918, "loss": 0.1875, "learning_rate": 1.1968790993311613e-06, "epoch": 0.6906887339545188, "percentage": 69.08, "elapsed_time": "3:51:25", "remaining_time": "1:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 1918, "loss": 0.1863, "learning_rate": 1.193202318498512e-06, "epoch": 0.6912100084707109, "percentage": 69.13, "elapsed_time": "3:51:35", "remaining_time": "1:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 1918, "loss": 0.1888, "learning_rate": 1.1895294228467886e-06, "epoch": 0.691731282986903, "percentage": 69.19, "elapsed_time": "3:51:44", "remaining_time": "1:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 1918, "loss": 0.1849, "learning_rate": 1.1858604232957096e-06, "epoch": 0.6922525575030951, "percentage": 69.24, "elapsed_time": "3:51:55", "remaining_time": "1:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 1918, "loss": 0.1911, "learning_rate": 1.18219533075341e-06, "epoch": 0.6927738320192871, "percentage": 69.29, "elapsed_time": "3:52:04", "remaining_time": "1:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 1918, "loss": 0.1748, "learning_rate": 1.1785341561164135e-06, "epoch": 0.6932951065354792, "percentage": 69.34, "elapsed_time": "3:52:15", "remaining_time": "1:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 1918, "loss": 0.1812, "learning_rate": 1.1748769102695882e-06, "epoch": 0.6938163810516713, "percentage": 69.4, "elapsed_time": "3:52:25", "remaining_time": "1:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 1918, "loss": 0.1847, "learning_rate": 1.1712236040861278e-06, "epoch": 0.6943376555678634, "percentage": 69.45, "elapsed_time": "3:52:37", "remaining_time": "1:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 1918, "loss": 0.1868, "learning_rate": 1.1675742484275132e-06, "epoch": 0.6948589300840555, "percentage": 69.5, "elapsed_time": "3:52:47", "remaining_time": "1:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 1918, "loss": 0.1892, "learning_rate": 1.1639288541434745e-06, "epoch": 0.6953802046002476, "percentage": 69.55, "elapsed_time": "3:52:58", "remaining_time": "1:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 1918, "loss": 0.1736, "learning_rate": 1.160287432071971e-06, "epoch": 0.6959014791164397, "percentage": 69.6, "elapsed_time": "3:53:08", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 1918, "loss": 0.1714, "learning_rate": 1.1566499930391484e-06, "epoch": 0.6964227536326317, "percentage": 69.66, "elapsed_time": "3:53:18", "remaining_time": "1:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 1918, "loss": 0.1859, "learning_rate": 1.153016547859311e-06, "epoch": 0.6969440281488238, "percentage": 69.71, "elapsed_time": "3:53:27", "remaining_time": "1:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.1493871073348926e-06, "epoch": 0.6974653026650159, "percentage": 69.76, "elapsed_time": "3:53:36", "remaining_time": "1:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 1918, "loss": 0.1862, "learning_rate": 1.1457616822564145e-06, "epoch": 0.697986577181208, "percentage": 69.81, "elapsed_time": "3:53:47", "remaining_time": "1:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 1918, "loss": 0.1773, "learning_rate": 1.1421402834024662e-06, "epoch": 0.6985078516974002, "percentage": 69.86, "elapsed_time": "3:53:57", "remaining_time": "1:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 1918, "loss": 0.1854, "learning_rate": 1.1385229215396638e-06, "epoch": 0.6990291262135923, "percentage": 69.92, "elapsed_time": "3:54:06", "remaining_time": "1:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 1918, "loss": 0.1813, "learning_rate": 1.1349096074226205e-06, "epoch": 0.6995504007297844, "percentage": 69.97, "elapsed_time": "3:54:17", "remaining_time": "1:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 1918, "loss": 0.1893, "learning_rate": 1.1313003517939189e-06, "epoch": 0.7000716752459765, "percentage": 70.02, "elapsed_time": "3:54:27", "remaining_time": "1:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 1918, "loss": 0.1781, "learning_rate": 1.127695165384072e-06, "epoch": 0.7005929497621685, "percentage": 70.07, "elapsed_time": "3:54:39", "remaining_time": "1:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 1918, "loss": 0.1937, "learning_rate": 1.1240940589114953e-06, "epoch": 0.7011142242783606, "percentage": 70.13, "elapsed_time": "3:54:50", "remaining_time": "1:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 1918, "loss": 0.188, "learning_rate": 1.1204970430824782e-06, "epoch": 0.7016354987945527, "percentage": 70.18, "elapsed_time": "3:55:01", "remaining_time": "1:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 1918, "loss": 0.1978, "learning_rate": 1.1169041285911411e-06, "epoch": 0.7021567733107448, "percentage": 70.23, "elapsed_time": "3:55:12", "remaining_time": "1:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 1918, "loss": 0.1869, "learning_rate": 1.113315326119418e-06, "epoch": 0.7026780478269369, "percentage": 70.28, "elapsed_time": "3:55:22", "remaining_time": "1:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 1918, "loss": 0.1939, "learning_rate": 1.1097306463370142e-06, "epoch": 0.703199322343129, "percentage": 70.33, "elapsed_time": "3:55:33", "remaining_time": "1:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 1918, "loss": 0.1764, "learning_rate": 1.1061500999013771e-06, "epoch": 0.7037205968593211, "percentage": 70.39, "elapsed_time": "3:55:43", "remaining_time": "1:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 1918, "loss": 0.1818, "learning_rate": 1.1025736974576693e-06, "epoch": 0.7042418713755131, "percentage": 70.44, "elapsed_time": "3:55:53", "remaining_time": "1:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 1918, "loss": 0.1705, "learning_rate": 1.0990014496387296e-06, "epoch": 0.7047631458917052, "percentage": 70.49, "elapsed_time": "3:56:04", "remaining_time": "1:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 1918, "loss": 0.1925, "learning_rate": 1.0954333670650461e-06, "epoch": 0.7052844204078973, "percentage": 70.54, "elapsed_time": "3:56:15", "remaining_time": "1:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 1918, "loss": 0.1837, "learning_rate": 1.0918694603447221e-06, "epoch": 0.7058056949240894, "percentage": 70.59, "elapsed_time": "3:56:26", "remaining_time": "1:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 1918, "loss": 0.1962, "learning_rate": 1.0883097400734494e-06, "epoch": 0.7063269694402815, "percentage": 70.65, "elapsed_time": "3:56:38", "remaining_time": "1:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 1918, "loss": 0.1801, "learning_rate": 1.0847542168344695e-06, "epoch": 0.7068482439564736, "percentage": 70.7, "elapsed_time": "3:56:49", "remaining_time": "1:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 1918, "loss": 0.1976, "learning_rate": 1.0812029011985472e-06, "epoch": 0.7073695184726657, "percentage": 70.75, "elapsed_time": "3:56:59", "remaining_time": "1:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 1918, "loss": 0.1817, "learning_rate": 1.0776558037239385e-06, "epoch": 0.7078907929888577, "percentage": 70.8, "elapsed_time": "3:57:09", "remaining_time": "1:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 1918, "loss": 0.1893, "learning_rate": 1.0741129349563567e-06, "epoch": 0.7084120675050498, "percentage": 70.86, "elapsed_time": "3:57:18", "remaining_time": "1:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 1918, "loss": 0.1691, "learning_rate": 1.0705743054289464e-06, "epoch": 0.7089333420212419, "percentage": 70.91, "elapsed_time": "3:57:28", "remaining_time": "1:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 1918, "loss": 0.1811, "learning_rate": 1.0670399256622455e-06, "epoch": 0.709454616537434, "percentage": 70.96, "elapsed_time": "3:57:39", "remaining_time": "1:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 1918, "loss": 0.1951, "learning_rate": 1.0635098061641572e-06, "epoch": 0.7099758910536261, "percentage": 71.01, "elapsed_time": "3:57:51", "remaining_time": "1:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 1918, "loss": 0.1877, "learning_rate": 1.0599839574299217e-06, "epoch": 0.7104971655698182, "percentage": 71.06, "elapsed_time": "3:58:01", "remaining_time": "1:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 1918, "loss": 0.1644, "learning_rate": 1.056462389942079e-06, "epoch": 0.7110184400860103, "percentage": 71.12, "elapsed_time": "3:58:12", "remaining_time": "1:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 1918, "loss": 0.1759, "learning_rate": 1.052945114170441e-06, "epoch": 0.7115397146022023, "percentage": 71.17, "elapsed_time": "3:58:23", "remaining_time": "1:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 1918, "loss": 0.1829, "learning_rate": 1.0494321405720627e-06, "epoch": 0.7120609891183944, "percentage": 71.22, "elapsed_time": "3:58:32", "remaining_time": "1:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 1918, "loss": 0.1684, "learning_rate": 1.045923479591204e-06, "epoch": 0.7125822636345865, "percentage": 71.27, "elapsed_time": "3:58:42", "remaining_time": "1:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 1918, "loss": 0.1912, "learning_rate": 1.042419141659308e-06, "epoch": 0.7131035381507786, "percentage": 71.32, "elapsed_time": "3:58:54", "remaining_time": "1:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 1918, "loss": 0.1941, "learning_rate": 1.038919137194962e-06, "epoch": 0.7136248126669708, "percentage": 71.38, "elapsed_time": "3:59:05", "remaining_time": "1:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 1918, "loss": 0.1791, "learning_rate": 1.0354234766038696e-06, "epoch": 0.7141460871831629, "percentage": 71.43, "elapsed_time": "3:59:16", "remaining_time": "1:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 1918, "loss": 0.1962, "learning_rate": 1.0319321702788234e-06, "epoch": 0.714667361699355, "percentage": 71.48, "elapsed_time": "3:59:27", "remaining_time": "1:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 1918, "loss": 0.1905, "learning_rate": 1.028445228599665e-06, "epoch": 0.715188636215547, "percentage": 71.53, "elapsed_time": "3:59:39", "remaining_time": "1:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 1918, "loss": 0.1848, "learning_rate": 1.0249626619332642e-06, "epoch": 0.7157099107317391, "percentage": 71.58, "elapsed_time": "3:59:49", "remaining_time": "1:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 1918, "loss": 0.1794, "learning_rate": 1.0214844806334817e-06, "epoch": 0.7162311852479312, "percentage": 71.64, "elapsed_time": "3:59:59", "remaining_time": "1:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 1918, "loss": 0.1918, "learning_rate": 1.0180106950411397e-06, "epoch": 0.7167524597641233, "percentage": 71.69, "elapsed_time": "4:00:08", "remaining_time": "1:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 1918, "loss": 0.1701, "learning_rate": 1.0145413154839945e-06, "epoch": 0.7172737342803154, "percentage": 71.74, "elapsed_time": "4:00:18", "remaining_time": "1:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 1918, "loss": 0.1876, "learning_rate": 1.0110763522767e-06, "epoch": 0.7177950087965075, "percentage": 71.79, "elapsed_time": "4:00:27", "remaining_time": "1:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 1918, "loss": 0.1768, "learning_rate": 1.0076158157207801e-06, "epoch": 0.7183162833126996, "percentage": 71.85, "elapsed_time": "4:00:37", "remaining_time": "1:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 1918, "loss": 0.1765, "learning_rate": 1.0041597161046025e-06, "epoch": 0.7188375578288917, "percentage": 71.9, "elapsed_time": "4:00:47", "remaining_time": "1:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 1918, "loss": 0.192, "learning_rate": 1.0007080637033359e-06, "epoch": 0.7193588323450837, "percentage": 71.95, "elapsed_time": "4:00:57", "remaining_time": "1:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 1918, "loss": 0.1785, "learning_rate": 9.972608687789346e-07, "epoch": 0.7198801068612758, "percentage": 72.0, "elapsed_time": "4:01:07", "remaining_time": "1:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 1918, "loss": 0.1815, "learning_rate": 9.938181415800966e-07, "epoch": 0.7204013813774679, "percentage": 72.05, "elapsed_time": "4:01:17", "remaining_time": "1:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 1918, "loss": 0.1688, "learning_rate": 9.903798923422369e-07, "epoch": 0.72092265589366, "percentage": 72.11, "elapsed_time": "4:01:27", "remaining_time": "1:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 1918, "loss": 0.1782, "learning_rate": 9.869461312874603e-07, "epoch": 0.7214439304098521, "percentage": 72.16, "elapsed_time": "4:01:38", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 1918, "loss": 0.1847, "learning_rate": 9.835168686245252e-07, "epoch": 0.7219652049260442, "percentage": 72.21, "elapsed_time": "4:01:48", "remaining_time": "1:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 1918, "loss": 0.1933, "learning_rate": 9.800921145488171e-07, "epoch": 0.7224864794422363, "percentage": 72.26, "elapsed_time": "4:01:58", "remaining_time": "1:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 1918, "loss": 0.1772, "learning_rate": 9.766718792423159e-07, "epoch": 0.7230077539584283, "percentage": 72.31, "elapsed_time": "4:02:08", "remaining_time": "1:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 1918, "loss": 0.1914, "learning_rate": 9.732561728735698e-07, "epoch": 0.7235290284746204, "percentage": 72.37, "elapsed_time": "4:02:19", "remaining_time": "1:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 1918, "loss": 0.1804, "learning_rate": 9.698450055976596e-07, "epoch": 0.7240503029908125, "percentage": 72.42, "elapsed_time": "4:02:29", "remaining_time": "1:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 1918, "loss": 0.1887, "learning_rate": 9.664383875561726e-07, "epoch": 0.7245715775070046, "percentage": 72.47, "elapsed_time": "4:02:39", "remaining_time": "1:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 1918, "loss": 0.1806, "learning_rate": 9.630363288771689e-07, "epoch": 0.7250928520231967, "percentage": 72.52, "elapsed_time": "4:02:49", "remaining_time": "1:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 1918, "loss": 0.1752, "learning_rate": 9.596388396751567e-07, "epoch": 0.7256141265393888, "percentage": 72.58, "elapsed_time": "4:02:59", "remaining_time": "1:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 1918, "loss": 0.1963, "learning_rate": 9.562459300510562e-07, "epoch": 0.7261354010555809, "percentage": 72.63, "elapsed_time": "4:03:09", "remaining_time": "1:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 1918, "loss": 0.1914, "learning_rate": 9.528576100921736e-07, "epoch": 0.7266566755717729, "percentage": 72.68, "elapsed_time": "4:03:20", "remaining_time": "1:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 1918, "loss": 0.1888, "learning_rate": 9.494738898721681e-07, "epoch": 0.727177950087965, "percentage": 72.73, "elapsed_time": "4:03:29", "remaining_time": "1:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 1918, "loss": 0.199, "learning_rate": 9.460947794510264e-07, "epoch": 0.7276992246041571, "percentage": 72.78, "elapsed_time": "4:03:39", "remaining_time": "1:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 1918, "loss": 0.1906, "learning_rate": 9.427202888750278e-07, "epoch": 0.7282204991203493, "percentage": 72.84, "elapsed_time": "4:03:49", "remaining_time": "1:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 1918, "loss": 0.1728, "learning_rate": 9.393504281767163e-07, "epoch": 0.7287417736365414, "percentage": 72.89, "elapsed_time": "4:04:00", "remaining_time": "1:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 1918, "loss": 0.1757, "learning_rate": 9.359852073748746e-07, "epoch": 0.7292630481527335, "percentage": 72.94, "elapsed_time": "4:04:11", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 1918, "loss": 0.1774, "learning_rate": 9.326246364744845e-07, "epoch": 0.7297843226689256, "percentage": 72.99, "elapsed_time": "4:04:21", "remaining_time": "1:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 1918, "loss": 0.1655, "learning_rate": 9.292687254667096e-07, "epoch": 0.7303055971851176, "percentage": 73.04, "elapsed_time": "4:04:32", "remaining_time": "1:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 1918, "loss": 0.1858, "learning_rate": 9.259174843288557e-07, "epoch": 0.7308268717013097, "percentage": 73.1, "elapsed_time": "4:04:43", "remaining_time": "1:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 1918, "loss": 0.1643, "learning_rate": 9.225709230243455e-07, "epoch": 0.7313481462175018, "percentage": 73.15, "elapsed_time": "4:04:53", "remaining_time": "1:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 1918, "loss": 0.1656, "learning_rate": 9.192290515026903e-07, "epoch": 0.7318694207336939, "percentage": 73.2, "elapsed_time": "4:05:03", "remaining_time": "1:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 1918, "loss": 0.1882, "learning_rate": 9.158918796994543e-07, "epoch": 0.732390695249886, "percentage": 73.25, "elapsed_time": "4:05:13", "remaining_time": "1:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 1918, "loss": 0.1671, "learning_rate": 9.125594175362326e-07, "epoch": 0.7329119697660781, "percentage": 73.31, "elapsed_time": "4:05:23", "remaining_time": "1:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 1918, "loss": 0.1761, "learning_rate": 9.092316749206198e-07, "epoch": 0.7334332442822702, "percentage": 73.36, "elapsed_time": "4:05:34", "remaining_time": "1:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 1918, "loss": 0.199, "learning_rate": 9.059086617461723e-07, "epoch": 0.7339545187984622, "percentage": 73.41, "elapsed_time": "4:05:44", "remaining_time": "1:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 1918, "loss": 0.1887, "learning_rate": 9.025903878923934e-07, "epoch": 0.7344757933146543, "percentage": 73.46, "elapsed_time": "4:05:54", "remaining_time": "1:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 1918, "loss": 0.211, "learning_rate": 8.992768632246907e-07, "epoch": 0.7349970678308464, "percentage": 73.51, "elapsed_time": "4:06:05", "remaining_time": "1:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 1918, "loss": 0.1875, "learning_rate": 8.959680975943541e-07, "epoch": 0.7355183423470385, "percentage": 73.57, "elapsed_time": "4:06:16", "remaining_time": "1:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 1918, "loss": 0.1819, "learning_rate": 8.926641008385268e-07, "epoch": 0.7360396168632306, "percentage": 73.62, "elapsed_time": "4:06:27", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 1918, "loss": 0.1946, "learning_rate": 8.893648827801685e-07, "epoch": 0.7365608913794227, "percentage": 73.67, "elapsed_time": "4:06:37", "remaining_time": "1:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 1918, "loss": 0.1786, "learning_rate": 8.860704532280373e-07, "epoch": 0.7370821658956148, "percentage": 73.72, "elapsed_time": "4:06:49", "remaining_time": "1:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 1918, "loss": 0.1729, "learning_rate": 8.827808219766513e-07, "epoch": 0.7376034404118069, "percentage": 73.77, "elapsed_time": "4:06:59", "remaining_time": "1:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 1918, "loss": 0.1749, "learning_rate": 8.794959988062632e-07, "epoch": 0.7381247149279989, "percentage": 73.83, "elapsed_time": "4:07:10", "remaining_time": "1:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 1918, "loss": 0.1777, "learning_rate": 8.762159934828337e-07, "epoch": 0.738645989444191, "percentage": 73.88, "elapsed_time": "4:07:19", "remaining_time": "1:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 1918, "loss": 0.1918, "learning_rate": 8.729408157579968e-07, "epoch": 0.7391672639603831, "percentage": 73.93, "elapsed_time": "4:07:30", "remaining_time": "1:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 1918, "loss": 0.1819, "learning_rate": 8.696704753690344e-07, "epoch": 0.7396885384765752, "percentage": 73.98, "elapsed_time": "4:07:40", "remaining_time": "1:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 1918, "loss": 0.1968, "learning_rate": 8.664049820388492e-07, "epoch": 0.7402098129927673, "percentage": 74.04, "elapsed_time": "4:07:49", "remaining_time": "1:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 1918, "loss": 0.1915, "learning_rate": 8.631443454759283e-07, "epoch": 0.7407310875089594, "percentage": 74.09, "elapsed_time": "4:08:00", "remaining_time": "1:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 1918, "loss": 0.1858, "learning_rate": 8.598885753743247e-07, "epoch": 0.7412523620251515, "percentage": 74.14, "elapsed_time": "4:08:10", "remaining_time": "1:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 1918, "loss": 0.1759, "learning_rate": 8.566376814136201e-07, "epoch": 0.7417736365413435, "percentage": 74.19, "elapsed_time": "4:08:20", "remaining_time": "1:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 1918, "loss": 0.1965, "learning_rate": 8.533916732588996e-07, "epoch": 0.7422949110575356, "percentage": 74.24, "elapsed_time": "4:08:31", "remaining_time": "1:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 1918, "loss": 0.1918, "learning_rate": 8.501505605607236e-07, "epoch": 0.7428161855737277, "percentage": 74.3, "elapsed_time": "4:08:41", "remaining_time": "1:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 1918, "loss": 0.1882, "learning_rate": 8.469143529550968e-07, "epoch": 0.7433374600899199, "percentage": 74.35, "elapsed_time": "4:08:50", "remaining_time": "1:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 1918, "loss": 0.1785, "learning_rate": 8.436830600634416e-07, "epoch": 0.743858734606112, "percentage": 74.4, "elapsed_time": "4:09:01", "remaining_time": "1:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 1918, "loss": 0.1726, "learning_rate": 8.404566914925672e-07, "epoch": 0.7443800091223041, "percentage": 74.45, "elapsed_time": "4:09:10", "remaining_time": "1:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 1918, "loss": 0.1942, "learning_rate": 8.372352568346453e-07, "epoch": 0.7449012836384962, "percentage": 74.5, "elapsed_time": "4:09:21", "remaining_time": "1:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 1918, "loss": 0.1898, "learning_rate": 8.340187656671767e-07, "epoch": 0.7454225581546882, "percentage": 74.56, "elapsed_time": "4:09:31", "remaining_time": "1:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 1918, "loss": 0.1793, "learning_rate": 8.308072275529652e-07, "epoch": 0.7459438326708803, "percentage": 74.61, "elapsed_time": "4:09:41", "remaining_time": "1:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 1918, "loss": 0.195, "learning_rate": 8.27600652040089e-07, "epoch": 0.7464651071870724, "percentage": 74.66, "elapsed_time": "4:09:53", "remaining_time": "1:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 1918, "loss": 0.1837, "learning_rate": 8.243990486618717e-07, "epoch": 0.7469863817032645, "percentage": 74.71, "elapsed_time": "4:10:03", "remaining_time": "1:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 1918, "loss": 0.1723, "learning_rate": 8.212024269368565e-07, "epoch": 0.7475076562194566, "percentage": 74.77, "elapsed_time": "4:10:14", "remaining_time": "1:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 1918, "loss": 0.1743, "learning_rate": 8.180107963687741e-07, "epoch": 0.7480289307356487, "percentage": 74.82, "elapsed_time": "4:10:25", "remaining_time": "1:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 1918, "loss": 0.1703, "learning_rate": 8.148241664465157e-07, "epoch": 0.7485502052518408, "percentage": 74.87, "elapsed_time": "4:10:36", "remaining_time": "1:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 1918, "loss": 0.1702, "learning_rate": 8.116425466441077e-07, "epoch": 0.7490714797680328, "percentage": 74.92, "elapsed_time": "4:10:47", "remaining_time": "1:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 1918, "loss": 0.1754, "learning_rate": 8.084659464206787e-07, "epoch": 0.7495927542842249, "percentage": 74.97, "elapsed_time": "4:10:57", "remaining_time": "1:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 1918, "loss": 0.1951, "learning_rate": 8.052943752204339e-07, "epoch": 0.750114028800417, "percentage": 75.03, "elapsed_time": "4:11:08", "remaining_time": "1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 1918, "loss": 0.182, "learning_rate": 8.021278424726308e-07, "epoch": 0.7506353033166091, "percentage": 75.08, "elapsed_time": "4:11:18", "remaining_time": "1:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 1918, "loss": 0.183, "learning_rate": 7.989663575915407e-07, "epoch": 0.7511565778328012, "percentage": 75.13, "elapsed_time": "4:11:29", "remaining_time": "1:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 1918, "loss": 0.1816, "learning_rate": 7.958099299764332e-07, "epoch": 0.7516778523489933, "percentage": 75.18, "elapsed_time": "4:11:39", "remaining_time": "1:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 1918, "loss": 0.1849, "learning_rate": 7.926585690115396e-07, "epoch": 0.7521991268651854, "percentage": 75.23, "elapsed_time": "4:11:50", "remaining_time": "1:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 1918, "loss": 0.1891, "learning_rate": 7.895122840660272e-07, "epoch": 0.7527204013813774, "percentage": 75.29, "elapsed_time": "4:12:01", "remaining_time": "1:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 1918, "loss": 0.1813, "learning_rate": 7.863710844939759e-07, "epoch": 0.7532416758975695, "percentage": 75.34, "elapsed_time": "4:12:11", "remaining_time": "1:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 1918, "loss": 0.196, "learning_rate": 7.8323497963434e-07, "epoch": 0.7537629504137616, "percentage": 75.39, "elapsed_time": "4:12:23", "remaining_time": "1:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 1918, "loss": 0.1818, "learning_rate": 7.801039788109332e-07, "epoch": 0.7542842249299537, "percentage": 75.44, "elapsed_time": "4:12:34", "remaining_time": "1:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 1918, "loss": 0.1862, "learning_rate": 7.769780913323916e-07, "epoch": 0.7548054994461458, "percentage": 75.5, "elapsed_time": "4:12:44", "remaining_time": "1:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 1918, "loss": 0.1837, "learning_rate": 7.738573264921481e-07, "epoch": 0.7553267739623379, "percentage": 75.55, "elapsed_time": "4:12:56", "remaining_time": "1:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 1918, "loss": 0.1841, "learning_rate": 7.707416935684092e-07, "epoch": 0.75584804847853, "percentage": 75.6, "elapsed_time": "4:13:06", "remaining_time": "1:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 1918, "loss": 0.182, "learning_rate": 7.676312018241211e-07, "epoch": 0.7563693229947221, "percentage": 75.65, "elapsed_time": "4:13:17", "remaining_time": "1:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 1918, "loss": 0.1822, "learning_rate": 7.645258605069444e-07, "epoch": 0.7568905975109141, "percentage": 75.7, "elapsed_time": "4:13:28", "remaining_time": "1:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 1918, "loss": 0.1748, "learning_rate": 7.614256788492316e-07, "epoch": 0.7574118720271062, "percentage": 75.76, "elapsed_time": "4:13:39", "remaining_time": "1:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 1918, "loss": 0.1759, "learning_rate": 7.583306660679888e-07, "epoch": 0.7579331465432984, "percentage": 75.81, "elapsed_time": "4:13:48", "remaining_time": "1:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 1918, "loss": 0.1874, "learning_rate": 7.552408313648602e-07, "epoch": 0.7584544210594905, "percentage": 75.86, "elapsed_time": "4:14:00", "remaining_time": "1:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 1918, "loss": 0.1733, "learning_rate": 7.521561839260927e-07, "epoch": 0.7589756955756826, "percentage": 75.91, "elapsed_time": "4:14:09", "remaining_time": "1:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 1918, "loss": 0.1912, "learning_rate": 7.49076732922511e-07, "epoch": 0.7594969700918747, "percentage": 75.96, "elapsed_time": "4:14:20", "remaining_time": "1:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 1918, "loss": 0.1791, "learning_rate": 7.460024875094926e-07, "epoch": 0.7600182446080668, "percentage": 76.02, "elapsed_time": "4:14:31", "remaining_time": "1:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 1918, "loss": 0.1951, "learning_rate": 7.429334568269364e-07, "epoch": 0.7605395191242588, "percentage": 76.07, "elapsed_time": "4:14:42", "remaining_time": "1:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 1918, "loss": 0.1678, "learning_rate": 7.398696499992386e-07, "epoch": 0.7610607936404509, "percentage": 76.12, "elapsed_time": "4:14:53", "remaining_time": "1:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 1918, "loss": 0.1872, "learning_rate": 7.368110761352631e-07, "epoch": 0.761582068156643, "percentage": 76.17, "elapsed_time": "4:15:03", "remaining_time": "1:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 1918, "loss": 0.1775, "learning_rate": 7.337577443283192e-07, "epoch": 0.7621033426728351, "percentage": 76.23, "elapsed_time": "4:15:14", "remaining_time": "1:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 1918, "loss": 0.1801, "learning_rate": 7.307096636561281e-07, "epoch": 0.7626246171890272, "percentage": 76.28, "elapsed_time": "4:15:25", "remaining_time": "1:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 1918, "loss": 0.1828, "learning_rate": 7.276668431808004e-07, "epoch": 0.7631458917052193, "percentage": 76.33, "elapsed_time": "4:15:35", "remaining_time": "1:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 1918, "loss": 0.1752, "learning_rate": 7.246292919488068e-07, "epoch": 0.7636671662214114, "percentage": 76.38, "elapsed_time": "4:15:44", "remaining_time": "1:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 1918, "loss": 0.1814, "learning_rate": 7.215970189909546e-07, "epoch": 0.7641884407376034, "percentage": 76.43, "elapsed_time": "4:15:54", "remaining_time": "1:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 1918, "loss": 0.2006, "learning_rate": 7.185700333223564e-07, "epoch": 0.7647097152537955, "percentage": 76.49, "elapsed_time": "4:16:05", "remaining_time": "1:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 1918, "loss": 0.1843, "learning_rate": 7.155483439424058e-07, "epoch": 0.7652309897699876, "percentage": 76.54, "elapsed_time": "4:16:16", "remaining_time": "1:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 1918, "loss": 0.1867, "learning_rate": 7.1253195983475e-07, "epoch": 0.7657522642861797, "percentage": 76.59, "elapsed_time": "4:16:25", "remaining_time": "1:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 1918, "loss": 0.1819, "learning_rate": 7.09520889967265e-07, "epoch": 0.7662735388023718, "percentage": 76.64, "elapsed_time": "4:16:36", "remaining_time": "1:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 1918, "loss": 0.1841, "learning_rate": 7.065151432920258e-07, "epoch": 0.7667948133185639, "percentage": 76.69, "elapsed_time": "4:16:46", "remaining_time": "1:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 1918, "loss": 0.1995, "learning_rate": 7.035147287452803e-07, "epoch": 0.767316087834756, "percentage": 76.75, "elapsed_time": "4:16:57", "remaining_time": "1:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 1918, "loss": 0.1871, "learning_rate": 7.005196552474275e-07, "epoch": 0.767837362350948, "percentage": 76.8, "elapsed_time": "4:17:07", "remaining_time": "1:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 1918, "loss": 0.1922, "learning_rate": 6.975299317029813e-07, "epoch": 0.7683586368671401, "percentage": 76.85, "elapsed_time": "4:17:19", "remaining_time": "1:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 1918, "loss": 0.191, "learning_rate": 6.945455670005558e-07, "epoch": 0.7688799113833322, "percentage": 76.9, "elapsed_time": "4:17:29", "remaining_time": "1:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 1918, "loss": 0.1786, "learning_rate": 6.915665700128291e-07, "epoch": 0.7694011858995243, "percentage": 76.96, "elapsed_time": "4:17:39", "remaining_time": "1:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 1918, "loss": 0.188, "learning_rate": 6.885929495965216e-07, "epoch": 0.7699224604157164, "percentage": 77.01, "elapsed_time": "4:17:50", "remaining_time": "1:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 1918, "loss": 0.1857, "learning_rate": 6.856247145923708e-07, "epoch": 0.7704437349319085, "percentage": 77.06, "elapsed_time": "4:18:00", "remaining_time": "1:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 1918, "loss": 0.176, "learning_rate": 6.82661873825101e-07, "epoch": 0.7709650094481006, "percentage": 77.11, "elapsed_time": "4:18:10", "remaining_time": "1:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 1918, "loss": 0.195, "learning_rate": 6.797044361033986e-07, "epoch": 0.7714862839642926, "percentage": 77.16, "elapsed_time": "4:18:21", "remaining_time": "1:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 1918, "loss": 0.1812, "learning_rate": 6.767524102198903e-07, "epoch": 0.7720075584804847, "percentage": 77.22, "elapsed_time": "4:18:32", "remaining_time": "1:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 1918, "loss": 0.2003, "learning_rate": 6.738058049511067e-07, "epoch": 0.7725288329966769, "percentage": 77.27, "elapsed_time": "4:18:42", "remaining_time": "1:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 1918, "loss": 0.1962, "learning_rate": 6.708646290574694e-07, "epoch": 0.773050107512869, "percentage": 77.32, "elapsed_time": "4:18:53", "remaining_time": "1:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 1918, "loss": 0.1913, "learning_rate": 6.679288912832538e-07, "epoch": 0.7735713820290611, "percentage": 77.37, "elapsed_time": "4:19:03", "remaining_time": "1:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 1918, "loss": 0.1768, "learning_rate": 6.649986003565678e-07, "epoch": 0.7740926565452532, "percentage": 77.42, "elapsed_time": "4:19:13", "remaining_time": "1:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 1918, "loss": 0.1678, "learning_rate": 6.620737649893291e-07, "epoch": 0.7746139310614453, "percentage": 77.48, "elapsed_time": "4:19:23", "remaining_time": "1:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 1918, "loss": 0.1949, "learning_rate": 6.591543938772302e-07, "epoch": 0.7751352055776374, "percentage": 77.53, "elapsed_time": "4:19:33", "remaining_time": "1:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 1918, "loss": 0.1736, "learning_rate": 6.562404956997229e-07, "epoch": 0.7756564800938294, "percentage": 77.58, "elapsed_time": "4:19:43", "remaining_time": "1:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 1918, "loss": 0.1779, "learning_rate": 6.533320791199848e-07, "epoch": 0.7761777546100215, "percentage": 77.63, "elapsed_time": "4:19:54", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 1918, "loss": 0.1834, "learning_rate": 6.504291527848972e-07, "epoch": 0.7766990291262136, "percentage": 77.69, "elapsed_time": "4:20:03", "remaining_time": "1:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 1918, "loss": 0.1854, "learning_rate": 6.475317253250196e-07, "epoch": 0.7772203036424057, "percentage": 77.74, "elapsed_time": "4:20:13", "remaining_time": "1:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 1918, "loss": 0.1679, "learning_rate": 6.446398053545619e-07, "epoch": 0.7777415781585978, "percentage": 77.79, "elapsed_time": "4:20:23", "remaining_time": "1:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 1918, "loss": 0.182, "learning_rate": 6.417534014713594e-07, "epoch": 0.7782628526747899, "percentage": 77.84, "elapsed_time": "4:20:33", "remaining_time": "1:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 1918, "loss": 0.1922, "learning_rate": 6.388725222568498e-07, "epoch": 0.778784127190982, "percentage": 77.89, "elapsed_time": "4:20:44", "remaining_time": "1:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 1918, "loss": 0.182, "learning_rate": 6.359971762760442e-07, "epoch": 0.779305401707174, "percentage": 77.95, "elapsed_time": "4:20:55", "remaining_time": "1:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 1918, "loss": 0.1754, "learning_rate": 6.331273720775028e-07, "epoch": 0.7798266762233661, "percentage": 78.0, "elapsed_time": "4:21:05", "remaining_time": "1:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 1918, "loss": 0.1863, "learning_rate": 6.302631181933106e-07, "epoch": 0.7803479507395582, "percentage": 78.05, "elapsed_time": "4:21:15", "remaining_time": "1:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 1918, "loss": 0.1845, "learning_rate": 6.274044231390503e-07, "epoch": 0.7808692252557503, "percentage": 78.1, "elapsed_time": "4:21:28", "remaining_time": "1:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 1918, "loss": 0.187, "learning_rate": 6.245512954137795e-07, "epoch": 0.7813904997719424, "percentage": 78.15, "elapsed_time": "4:21:37", "remaining_time": "1:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 1918, "loss": 0.1811, "learning_rate": 6.217037435000028e-07, "epoch": 0.7819117742881345, "percentage": 78.21, "elapsed_time": "4:21:48", "remaining_time": "1:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 1918, "eval_loss": 0.18243278563022614, "epoch": 0.7819117742881345, "percentage": 78.21, "elapsed_time": "4:22:40", "remaining_time": "1:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 1918, "loss": 0.1843, "learning_rate": 6.18861775863647e-07, "epoch": 0.7824330488043266, "percentage": 78.26, "elapsed_time": "4:22:50", "remaining_time": "1:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 1918, "loss": 0.1844, "learning_rate": 6.16025400954037e-07, "epoch": 0.7829543233205186, "percentage": 78.31, "elapsed_time": "4:23:00", "remaining_time": "1:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 1918, "loss": 0.1747, "learning_rate": 6.131946272038719e-07, "epoch": 0.7834755978367107, "percentage": 78.36, "elapsed_time": "4:23:10", "remaining_time": "1:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 1918, "loss": 0.1889, "learning_rate": 6.103694630291954e-07, "epoch": 0.7839968723529028, "percentage": 78.42, "elapsed_time": "4:23:19", "remaining_time": "1:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 1918, "loss": 0.1693, "learning_rate": 6.07549916829375e-07, "epoch": 0.7845181468690949, "percentage": 78.47, "elapsed_time": "4:23:30", "remaining_time": "1:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 1918, "loss": 0.1752, "learning_rate": 6.047359969870773e-07, "epoch": 0.785039421385287, "percentage": 78.52, "elapsed_time": "4:23:40", "remaining_time": "1:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 1918, "loss": 0.1932, "learning_rate": 6.019277118682371e-07, "epoch": 0.7855606959014791, "percentage": 78.57, "elapsed_time": "4:23:49", "remaining_time": "1:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 1918, "loss": 0.185, "learning_rate": 5.991250698220416e-07, "epoch": 0.7860819704176712, "percentage": 78.62, "elapsed_time": "4:24:00", "remaining_time": "1:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 1918, "loss": 0.1962, "learning_rate": 5.963280791808984e-07, "epoch": 0.7866032449338632, "percentage": 78.68, "elapsed_time": "4:24:10", "remaining_time": "1:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 1918, "loss": 0.1802, "learning_rate": 5.935367482604124e-07, "epoch": 0.7871245194500553, "percentage": 78.73, "elapsed_time": "4:24:22", "remaining_time": "1:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 1918, "loss": 0.1857, "learning_rate": 5.907510853593642e-07, "epoch": 0.7876457939662475, "percentage": 78.78, "elapsed_time": "4:24:34", "remaining_time": "1:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 1918, "loss": 0.1887, "learning_rate": 5.879710987596818e-07, "epoch": 0.7881670684824396, "percentage": 78.83, "elapsed_time": "4:24:44", "remaining_time": "1:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 1918, "loss": 0.1718, "learning_rate": 5.851967967264164e-07, "epoch": 0.7886883429986317, "percentage": 78.88, "elapsed_time": "4:24:56", "remaining_time": "1:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 1918, "loss": 0.1747, "learning_rate": 5.824281875077212e-07, "epoch": 0.7892096175148238, "percentage": 78.94, "elapsed_time": "4:25:06", "remaining_time": "1:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 1918, "loss": 0.1698, "learning_rate": 5.796652793348203e-07, "epoch": 0.7897308920310159, "percentage": 78.99, "elapsed_time": "4:25:17", "remaining_time": "1:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 1918, "loss": 0.1823, "learning_rate": 5.769080804219929e-07, "epoch": 0.7902521665472079, "percentage": 79.04, "elapsed_time": "4:25:27", "remaining_time": "1:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 1918, "loss": 0.1914, "learning_rate": 5.741565989665413e-07, "epoch": 0.7907734410634, "percentage": 79.09, "elapsed_time": "4:25:38", "remaining_time": "1:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 1918, "loss": 0.1919, "learning_rate": 5.714108431487692e-07, "epoch": 0.7912947155795921, "percentage": 79.14, "elapsed_time": "4:25:48", "remaining_time": "1:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 1918, "loss": 0.1886, "learning_rate": 5.68670821131961e-07, "epoch": 0.7918159900957842, "percentage": 79.2, "elapsed_time": "4:25:58", "remaining_time": "1:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 1918, "loss": 0.1932, "learning_rate": 5.659365410623491e-07, "epoch": 0.7923372646119763, "percentage": 79.25, "elapsed_time": "4:26:10", "remaining_time": "1:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 1918, "loss": 0.1841, "learning_rate": 5.63208011069099e-07, "epoch": 0.7928585391281684, "percentage": 79.3, "elapsed_time": "4:26:20", "remaining_time": "1:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 1918, "loss": 0.179, "learning_rate": 5.604852392642813e-07, "epoch": 0.7933798136443605, "percentage": 79.35, "elapsed_time": "4:26:30", "remaining_time": "1:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 1918, "loss": 0.1882, "learning_rate": 5.577682337428417e-07, "epoch": 0.7939010881605526, "percentage": 79.41, "elapsed_time": "4:26:39", "remaining_time": "1:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 1918, "loss": 0.185, "learning_rate": 5.550570025825888e-07, "epoch": 0.7944223626767446, "percentage": 79.46, "elapsed_time": "4:26:50", "remaining_time": "1:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 1918, "loss": 0.1885, "learning_rate": 5.523515538441604e-07, "epoch": 0.7949436371929367, "percentage": 79.51, "elapsed_time": "4:27:01", "remaining_time": "1:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 1918, "loss": 0.1642, "learning_rate": 5.496518955710023e-07, "epoch": 0.7954649117091288, "percentage": 79.56, "elapsed_time": "4:27:11", "remaining_time": "1:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 1918, "loss": 0.1834, "learning_rate": 5.469580357893484e-07, "epoch": 0.7959861862253209, "percentage": 79.61, "elapsed_time": "4:27:22", "remaining_time": "1:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 1918, "loss": 0.1781, "learning_rate": 5.442699825081885e-07, "epoch": 0.796507460741513, "percentage": 79.67, "elapsed_time": "4:27:31", "remaining_time": "1:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 1918, "loss": 0.1871, "learning_rate": 5.415877437192535e-07, "epoch": 0.7970287352577051, "percentage": 79.72, "elapsed_time": "4:27:41", "remaining_time": "1:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 1918, "loss": 0.1916, "learning_rate": 5.389113273969857e-07, "epoch": 0.7975500097738972, "percentage": 79.77, "elapsed_time": "4:27:51", "remaining_time": "1:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 1918, "loss": 0.1715, "learning_rate": 5.36240741498516e-07, "epoch": 0.7980712842900892, "percentage": 79.82, "elapsed_time": "4:28:01", "remaining_time": "1:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 1918, "loss": 0.1677, "learning_rate": 5.33575993963644e-07, "epoch": 0.7985925588062813, "percentage": 79.87, "elapsed_time": "4:28:11", "remaining_time": "1:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 1918, "loss": 0.173, "learning_rate": 5.309170927148088e-07, "epoch": 0.7991138333224734, "percentage": 79.93, "elapsed_time": "4:28:21", "remaining_time": "1:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 1918, "loss": 0.19, "learning_rate": 5.282640456570692e-07, "epoch": 0.7996351078386655, "percentage": 79.98, "elapsed_time": "4:28:32", "remaining_time": "1:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 1918, "loss": 0.1826, "learning_rate": 5.256168606780784e-07, "epoch": 0.8001563823548576, "percentage": 80.03, "elapsed_time": "4:28:43", "remaining_time": "1:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 1918, "loss": 0.1661, "learning_rate": 5.229755456480635e-07, "epoch": 0.8006776568710497, "percentage": 80.08, "elapsed_time": "4:28:53", "remaining_time": "1:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 1918, "loss": 0.1888, "learning_rate": 5.203401084197973e-07, "epoch": 0.8011989313872419, "percentage": 80.14, "elapsed_time": "4:29:03", "remaining_time": "1:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 1918, "loss": 0.1745, "learning_rate": 5.177105568285793e-07, "epoch": 0.8017202059034338, "percentage": 80.19, "elapsed_time": "4:29:13", "remaining_time": "1:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 1918, "loss": 0.1841, "learning_rate": 5.150868986922092e-07, "epoch": 0.802241480419626, "percentage": 80.24, "elapsed_time": "4:29:23", "remaining_time": "1:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 1918, "loss": 0.1698, "learning_rate": 5.124691418109673e-07, "epoch": 0.8027627549358181, "percentage": 80.29, "elapsed_time": "4:29:33", "remaining_time": "1:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 1918, "loss": 0.1911, "learning_rate": 5.09857293967587e-07, "epoch": 0.8032840294520102, "percentage": 80.34, "elapsed_time": "4:29:44", "remaining_time": "1:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 1918, "loss": 0.1792, "learning_rate": 5.072513629272352e-07, "epoch": 0.8038053039682023, "percentage": 80.4, "elapsed_time": "4:29:54", "remaining_time": "1:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 1918, "loss": 0.1918, "learning_rate": 5.046513564374861e-07, "epoch": 0.8043265784843944, "percentage": 80.45, "elapsed_time": "4:30:03", "remaining_time": "1:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 1918, "loss": 0.2082, "learning_rate": 5.020572822283027e-07, "epoch": 0.8048478530005865, "percentage": 80.5, "elapsed_time": "4:30:14", "remaining_time": "1:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 1918, "loss": 0.1778, "learning_rate": 4.994691480120086e-07, "epoch": 0.8053691275167785, "percentage": 80.55, "elapsed_time": "4:30:25", "remaining_time": "1:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 1918, "loss": 0.1616, "learning_rate": 4.968869614832681e-07, "epoch": 0.8058904020329706, "percentage": 80.6, "elapsed_time": "4:30:35", "remaining_time": "1:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 1918, "loss": 0.1946, "learning_rate": 4.943107303190639e-07, "epoch": 0.8064116765491627, "percentage": 80.66, "elapsed_time": "4:30:45", "remaining_time": "1:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 1918, "loss": 0.1729, "learning_rate": 4.917404621786703e-07, "epoch": 0.8069329510653548, "percentage": 80.71, "elapsed_time": "4:30:55", "remaining_time": "1:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 1918, "loss": 0.1881, "learning_rate": 4.891761647036364e-07, "epoch": 0.8074542255815469, "percentage": 80.76, "elapsed_time": "4:31:06", "remaining_time": "1:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 1918, "loss": 0.1739, "learning_rate": 4.866178455177584e-07, "epoch": 0.807975500097739, "percentage": 80.81, "elapsed_time": "4:31:16", "remaining_time": "1:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 1918, "loss": 0.1649, "learning_rate": 4.840655122270582e-07, "epoch": 0.8084967746139311, "percentage": 80.87, "elapsed_time": "4:31:26", "remaining_time": "1:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 1918, "loss": 0.1782, "learning_rate": 4.815191724197634e-07, "epoch": 0.8090180491301231, "percentage": 80.92, "elapsed_time": "4:31:37", "remaining_time": "1:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 1918, "loss": 0.171, "learning_rate": 4.78978833666281e-07, "epoch": 0.8095393236463152, "percentage": 80.97, "elapsed_time": "4:31:48", "remaining_time": "1:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 1918, "loss": 0.1779, "learning_rate": 4.7644450351917617e-07, "epoch": 0.8100605981625073, "percentage": 81.02, "elapsed_time": "4:31:58", "remaining_time": "1:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 1918, "loss": 0.1831, "learning_rate": 4.7391618951315277e-07, "epoch": 0.8105818726786994, "percentage": 81.07, "elapsed_time": "4:32:09", "remaining_time": "1:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 1918, "loss": 0.1961, "learning_rate": 4.713938991650241e-07, "epoch": 0.8111031471948915, "percentage": 81.13, "elapsed_time": "4:32:19", "remaining_time": "1:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 1918, "loss": 0.1789, "learning_rate": 4.688776399736991e-07, "epoch": 0.8116244217110836, "percentage": 81.18, "elapsed_time": "4:32:29", "remaining_time": "1:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 1918, "loss": 0.1812, "learning_rate": 4.6636741942015314e-07, "epoch": 0.8121456962272757, "percentage": 81.23, "elapsed_time": "4:32:39", "remaining_time": "1:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 1918, "loss": 0.174, "learning_rate": 4.6386324496740855e-07, "epoch": 0.8126669707434678, "percentage": 81.28, "elapsed_time": "4:32:49", "remaining_time": "1:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 1918, "loss": 0.1804, "learning_rate": 4.6136512406051495e-07, "epoch": 0.8131882452596598, "percentage": 81.33, "elapsed_time": "4:32:59", "remaining_time": "1:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 1918, "loss": 0.1897, "learning_rate": 4.5887306412651933e-07, "epoch": 0.8137095197758519, "percentage": 81.39, "elapsed_time": "4:33:10", "remaining_time": "1:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 1918, "loss": 0.186, "learning_rate": 4.563870725744543e-07, "epoch": 0.814230794292044, "percentage": 81.44, "elapsed_time": "4:33:22", "remaining_time": "1:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 1918, "loss": 0.1911, "learning_rate": 4.539071567953077e-07, "epoch": 0.8147520688082361, "percentage": 81.49, "elapsed_time": "4:33:33", "remaining_time": "1:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 1918, "loss": 0.1864, "learning_rate": 4.514333241620045e-07, "epoch": 0.8152733433244282, "percentage": 81.54, "elapsed_time": "4:33:44", "remaining_time": "1:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 1918, "loss": 0.1849, "learning_rate": 4.4896558202938505e-07, "epoch": 0.8157946178406204, "percentage": 81.6, "elapsed_time": "4:33:53", "remaining_time": "1:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 1918, "loss": 0.1726, "learning_rate": 4.4650393773418123e-07, "epoch": 0.8163158923568125, "percentage": 81.65, "elapsed_time": "4:34:04", "remaining_time": "1:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 1918, "loss": 0.1772, "learning_rate": 4.440483985949953e-07, "epoch": 0.8168371668730044, "percentage": 81.7, "elapsed_time": "4:34:14", "remaining_time": "1:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 1918, "loss": 0.1784, "learning_rate": 4.4159897191228096e-07, "epoch": 0.8173584413891966, "percentage": 81.75, "elapsed_time": "4:34:25", "remaining_time": "1:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 1918, "loss": 0.1889, "learning_rate": 4.3915566496831654e-07, "epoch": 0.8178797159053887, "percentage": 81.8, "elapsed_time": "4:34:36", "remaining_time": "1:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 1918, "loss": 0.1879, "learning_rate": 4.367184850271872e-07, "epoch": 0.8184009904215808, "percentage": 81.86, "elapsed_time": "4:34:46", "remaining_time": "1:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 1918, "loss": 0.1717, "learning_rate": 4.3428743933476207e-07, "epoch": 0.8189222649377729, "percentage": 81.91, "elapsed_time": "4:34:55", "remaining_time": "1:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 1918, "loss": 0.1798, "learning_rate": 4.3186253511867227e-07, "epoch": 0.819443539453965, "percentage": 81.96, "elapsed_time": "4:35:06", "remaining_time": "1:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 1918, "loss": 0.1855, "learning_rate": 4.294437795882919e-07, "epoch": 0.8199648139701571, "percentage": 82.01, "elapsed_time": "4:35:17", "remaining_time": "1:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 1918, "loss": 0.1857, "learning_rate": 4.2703117993471295e-07, "epoch": 0.8204860884863491, "percentage": 82.06, "elapsed_time": "4:35:26", "remaining_time": "1:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 1918, "loss": 0.1813, "learning_rate": 4.2462474333072544e-07, "epoch": 0.8210073630025412, "percentage": 82.12, "elapsed_time": "4:35:36", "remaining_time": "1:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 1918, "loss": 0.1835, "learning_rate": 4.222244769307965e-07, "epoch": 0.8215286375187333, "percentage": 82.17, "elapsed_time": "4:35:47", "remaining_time": "0:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 1918, "loss": 0.1791, "learning_rate": 4.198303878710508e-07, "epoch": 0.8220499120349254, "percentage": 82.22, "elapsed_time": "4:35:58", "remaining_time": "0:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 1918, "loss": 0.1799, "learning_rate": 4.174424832692453e-07, "epoch": 0.8225711865511175, "percentage": 82.27, "elapsed_time": "4:36:08", "remaining_time": "0:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 1918, "loss": 0.1864, "learning_rate": 4.1506077022475e-07, "epoch": 0.8230924610673096, "percentage": 82.33, "elapsed_time": "4:36:17", "remaining_time": "0:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 1918, "loss": 0.1797, "learning_rate": 4.1268525581853015e-07, "epoch": 0.8236137355835017, "percentage": 82.38, "elapsed_time": "4:36:28", "remaining_time": "0:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 1918, "loss": 0.1792, "learning_rate": 4.1031594711311686e-07, "epoch": 0.8241350100996937, "percentage": 82.43, "elapsed_time": "4:36:39", "remaining_time": "0:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 1918, "loss": 0.1886, "learning_rate": 4.079528511525968e-07, "epoch": 0.8246562846158858, "percentage": 82.48, "elapsed_time": "4:36:49", "remaining_time": "0:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 1918, "loss": 0.1861, "learning_rate": 4.0559597496258263e-07, "epoch": 0.8251775591320779, "percentage": 82.53, "elapsed_time": "4:36:59", "remaining_time": "0:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 1918, "loss": 0.1828, "learning_rate": 4.032453255501956e-07, "epoch": 0.82569883364827, "percentage": 82.59, "elapsed_time": "4:37:08", "remaining_time": "0:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 1918, "loss": 0.1763, "learning_rate": 4.0090090990404563e-07, "epoch": 0.8262201081644621, "percentage": 82.64, "elapsed_time": "4:37:17", "remaining_time": "0:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 1918, "loss": 0.1872, "learning_rate": 3.9856273499420837e-07, "epoch": 0.8267413826806542, "percentage": 82.69, "elapsed_time": "4:37:27", "remaining_time": "0:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 1918, "loss": 0.1806, "learning_rate": 3.962308077722049e-07, "epoch": 0.8272626571968463, "percentage": 82.74, "elapsed_time": "4:37:37", "remaining_time": "0:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 1918, "loss": 0.1691, "learning_rate": 3.9390513517098413e-07, "epoch": 0.8277839317130383, "percentage": 82.79, "elapsed_time": "4:37:47", "remaining_time": "0:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 1918, "loss": 0.153, "learning_rate": 3.9158572410489537e-07, "epoch": 0.8283052062292304, "percentage": 82.85, "elapsed_time": "4:37:56", "remaining_time": "0:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 1918, "loss": 0.1703, "learning_rate": 3.8927258146967626e-07, "epoch": 0.8288264807454225, "percentage": 82.9, "elapsed_time": "4:38:07", "remaining_time": "0:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 1918, "loss": 0.1929, "learning_rate": 3.8696571414242546e-07, "epoch": 0.8293477552616146, "percentage": 82.95, "elapsed_time": "4:38:17", "remaining_time": "0:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 1918, "loss": 0.1699, "learning_rate": 3.846651289815856e-07, "epoch": 0.8298690297778067, "percentage": 83.0, "elapsed_time": "4:38:26", "remaining_time": "0:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 1918, "loss": 0.183, "learning_rate": 3.823708328269232e-07, "epoch": 0.8303903042939988, "percentage": 83.06, "elapsed_time": "4:38:36", "remaining_time": "0:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 1918, "loss": 0.1776, "learning_rate": 3.800828324995043e-07, "epoch": 0.830911578810191, "percentage": 83.11, "elapsed_time": "4:38:46", "remaining_time": "0:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 1918, "loss": 0.1698, "learning_rate": 3.7780113480167967e-07, "epoch": 0.8314328533263831, "percentage": 83.16, "elapsed_time": "4:38:55", "remaining_time": "0:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 1918, "loss": 0.187, "learning_rate": 3.7552574651706253e-07, "epoch": 0.831954127842575, "percentage": 83.21, "elapsed_time": "4:39:06", "remaining_time": "0:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 1918, "loss": 0.189, "learning_rate": 3.7325667441050457e-07, "epoch": 0.8324754023587672, "percentage": 83.26, "elapsed_time": "4:39:16", "remaining_time": "0:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 1918, "loss": 0.1814, "learning_rate": 3.7099392522808253e-07, "epoch": 0.8329966768749593, "percentage": 83.32, "elapsed_time": "4:39:26", "remaining_time": "0:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 1918, "loss": 0.1837, "learning_rate": 3.6873750569707297e-07, "epoch": 0.8335179513911514, "percentage": 83.37, "elapsed_time": "4:39:36", "remaining_time": "0:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 1918, "loss": 0.1926, "learning_rate": 3.664874225259338e-07, "epoch": 0.8340392259073435, "percentage": 83.42, "elapsed_time": "4:39:45", "remaining_time": "0:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 1918, "loss": 0.1805, "learning_rate": 3.6424368240428666e-07, "epoch": 0.8345605004235356, "percentage": 83.47, "elapsed_time": "4:39:56", "remaining_time": "0:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 1918, "loss": 0.1822, "learning_rate": 3.62006292002893e-07, "epoch": 0.8350817749397277, "percentage": 83.52, "elapsed_time": "4:40:06", "remaining_time": "0:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 1918, "loss": 0.1773, "learning_rate": 3.597752579736363e-07, "epoch": 0.8356030494559197, "percentage": 83.58, "elapsed_time": "4:40:17", "remaining_time": "0:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 1918, "loss": 0.1773, "learning_rate": 3.57550586949503e-07, "epoch": 0.8361243239721118, "percentage": 83.63, "elapsed_time": "4:40:29", "remaining_time": "0:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 1918, "loss": 0.1749, "learning_rate": 3.5533228554456095e-07, "epoch": 0.8366455984883039, "percentage": 83.68, "elapsed_time": "4:40:38", "remaining_time": "0:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 1918, "loss": 0.1668, "learning_rate": 3.5312036035394263e-07, "epoch": 0.837166873004496, "percentage": 83.73, "elapsed_time": "4:40:49", "remaining_time": "0:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 1918, "loss": 0.1908, "learning_rate": 3.5091481795382216e-07, "epoch": 0.8376881475206881, "percentage": 83.79, "elapsed_time": "4:41:00", "remaining_time": "0:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 1918, "loss": 0.175, "learning_rate": 3.487156649013973e-07, "epoch": 0.8382094220368802, "percentage": 83.84, "elapsed_time": "4:41:10", "remaining_time": "0:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 1918, "loss": 0.2001, "learning_rate": 3.4652290773487003e-07, "epoch": 0.8387306965530723, "percentage": 83.89, "elapsed_time": "4:41:21", "remaining_time": "0:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 1918, "loss": 0.1861, "learning_rate": 3.44336552973428e-07, "epoch": 0.8392519710692643, "percentage": 83.94, "elapsed_time": "4:41:32", "remaining_time": "0:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 1918, "loss": 0.1882, "learning_rate": 3.4215660711722276e-07, "epoch": 0.8397732455854564, "percentage": 83.99, "elapsed_time": "4:41:43", "remaining_time": "0:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 1918, "loss": 0.2053, "learning_rate": 3.399830766473525e-07, "epoch": 0.8402945201016485, "percentage": 84.05, "elapsed_time": "4:41:54", "remaining_time": "0:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 1918, "loss": 0.1869, "learning_rate": 3.378159680258428e-07, "epoch": 0.8408157946178406, "percentage": 84.1, "elapsed_time": "4:42:04", "remaining_time": "0:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 1918, "loss": 0.1716, "learning_rate": 3.356552876956257e-07, "epoch": 0.8413370691340327, "percentage": 84.15, "elapsed_time": "4:42:15", "remaining_time": "0:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 1918, "loss": 0.1794, "learning_rate": 3.3350104208052153e-07, "epoch": 0.8418583436502248, "percentage": 84.2, "elapsed_time": "4:42:25", "remaining_time": "0:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 1918, "loss": 0.179, "learning_rate": 3.3135323758522047e-07, "epoch": 0.8423796181664169, "percentage": 84.25, "elapsed_time": "4:42:36", "remaining_time": "0:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 1918, "loss": 0.1666, "learning_rate": 3.292118805952621e-07, "epoch": 0.8429008926826089, "percentage": 84.31, "elapsed_time": "4:42:47", "remaining_time": "0:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 1918, "loss": 0.1817, "learning_rate": 3.2707697747701913e-07, "epoch": 0.843422167198801, "percentage": 84.36, "elapsed_time": "4:42:58", "remaining_time": "0:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 1918, "loss": 0.1818, "learning_rate": 3.249485345776743e-07, "epoch": 0.8439434417149931, "percentage": 84.41, "elapsed_time": "4:43:10", "remaining_time": "0:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 1918, "loss": 0.1842, "learning_rate": 3.228265582252041e-07, "epoch": 0.8444647162311852, "percentage": 84.46, "elapsed_time": "4:43:20", "remaining_time": "0:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 1918, "loss": 0.1842, "learning_rate": 3.2071105472836207e-07, "epoch": 0.8449859907473773, "percentage": 84.52, "elapsed_time": "4:43:30", "remaining_time": "0:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 1918, "loss": 0.1678, "learning_rate": 3.186020303766532e-07, "epoch": 0.8455072652635695, "percentage": 84.57, "elapsed_time": "4:43:40", "remaining_time": "0:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 1918, "loss": 0.1692, "learning_rate": 3.164994914403241e-07, "epoch": 0.8460285397797616, "percentage": 84.62, "elapsed_time": "4:43:50", "remaining_time": "0:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 1918, "loss": 0.1798, "learning_rate": 3.1440344417033754e-07, "epoch": 0.8465498142959537, "percentage": 84.67, "elapsed_time": "4:44:02", "remaining_time": "0:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 1918, "loss": 0.1724, "learning_rate": 3.123138947983556e-07, "epoch": 0.8470710888121457, "percentage": 84.72, "elapsed_time": "4:44:12", "remaining_time": "0:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 1918, "loss": 0.173, "learning_rate": 3.102308495367243e-07, "epoch": 0.8475923633283378, "percentage": 84.78, "elapsed_time": "4:44:23", "remaining_time": "0:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 1918, "loss": 0.1792, "learning_rate": 3.081543145784499e-07, "epoch": 0.8481136378445299, "percentage": 84.83, "elapsed_time": "4:44:33", "remaining_time": "0:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 1918, "loss": 0.1919, "learning_rate": 3.060842960971844e-07, "epoch": 0.848634912360722, "percentage": 84.88, "elapsed_time": "4:44:44", "remaining_time": "0:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 1918, "loss": 0.1862, "learning_rate": 3.0402080024720724e-07, "epoch": 0.8491561868769141, "percentage": 84.93, "elapsed_time": "4:44:54", "remaining_time": "0:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 1918, "loss": 0.1857, "learning_rate": 3.0196383316340226e-07, "epoch": 0.8496774613931062, "percentage": 84.98, "elapsed_time": "4:45:04", "remaining_time": "0:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 1918, "loss": 0.1734, "learning_rate": 2.9991340096124644e-07, "epoch": 0.8501987359092983, "percentage": 85.04, "elapsed_time": "4:45:15", "remaining_time": "0:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 1918, "loss": 0.2025, "learning_rate": 2.978695097367862e-07, "epoch": 0.8507200104254903, "percentage": 85.09, "elapsed_time": "4:45:26", "remaining_time": "0:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 1918, "loss": 0.1762, "learning_rate": 2.958321655666219e-07, "epoch": 0.8512412849416824, "percentage": 85.14, "elapsed_time": "4:45:37", "remaining_time": "0:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 1918, "loss": 0.1817, "learning_rate": 2.938013745078899e-07, "epoch": 0.8517625594578745, "percentage": 85.19, "elapsed_time": "4:45:47", "remaining_time": "0:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 1918, "loss": 0.1582, "learning_rate": 2.917771425982413e-07, "epoch": 0.8522838339740666, "percentage": 85.25, "elapsed_time": "4:45:56", "remaining_time": "0:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 1918, "loss": 0.1726, "learning_rate": 2.897594758558298e-07, "epoch": 0.8528051084902587, "percentage": 85.3, "elapsed_time": "4:46:07", "remaining_time": "0:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 1918, "loss": 0.1754, "learning_rate": 2.8774838027928854e-07, "epoch": 0.8533263830064508, "percentage": 85.35, "elapsed_time": "4:46:18", "remaining_time": "0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 1918, "loss": 0.1734, "learning_rate": 2.857438618477135e-07, "epoch": 0.8538476575226429, "percentage": 85.4, "elapsed_time": "4:46:28", "remaining_time": "0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 1918, "loss": 0.1781, "learning_rate": 2.837459265206491e-07, "epoch": 0.8543689320388349, "percentage": 85.45, "elapsed_time": "4:46:39", "remaining_time": "0:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 1918, "loss": 0.2084, "learning_rate": 2.817545802380653e-07, "epoch": 0.854890206555027, "percentage": 85.51, "elapsed_time": "4:46:49", "remaining_time": "0:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 1918, "loss": 0.1814, "learning_rate": 2.797698289203432e-07, "epoch": 0.8554114810712191, "percentage": 85.56, "elapsed_time": "4:47:00", "remaining_time": "0:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 1918, "loss": 0.1742, "learning_rate": 2.7779167846825797e-07, "epoch": 0.8559327555874112, "percentage": 85.61, "elapsed_time": "4:47:10", "remaining_time": "0:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 1918, "loss": 0.1826, "learning_rate": 2.7582013476295826e-07, "epoch": 0.8564540301036033, "percentage": 85.66, "elapsed_time": "4:47:20", "remaining_time": "0:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 1918, "loss": 0.1838, "learning_rate": 2.738552036659517e-07, "epoch": 0.8569753046197954, "percentage": 85.71, "elapsed_time": "4:47:29", "remaining_time": "0:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 1918, "loss": 0.1674, "learning_rate": 2.718968910190853e-07, "epoch": 0.8574965791359875, "percentage": 85.77, "elapsed_time": "4:47:40", "remaining_time": "0:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 1918, "loss": 0.1753, "learning_rate": 2.6994520264452957e-07, "epoch": 0.8580178536521795, "percentage": 85.82, "elapsed_time": "4:47:49", "remaining_time": "0:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 1918, "loss": 0.1621, "learning_rate": 2.6800014434476137e-07, "epoch": 0.8585391281683716, "percentage": 85.87, "elapsed_time": "4:48:00", "remaining_time": "0:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 1918, "loss": 0.1722, "learning_rate": 2.6606172190254467e-07, "epoch": 0.8590604026845637, "percentage": 85.92, "elapsed_time": "4:48:11", "remaining_time": "0:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 1918, "loss": 0.1856, "learning_rate": 2.6412994108091586e-07, "epoch": 0.8595816772007558, "percentage": 85.97, "elapsed_time": "4:48:22", "remaining_time": "0:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 1918, "loss": 0.1905, "learning_rate": 2.6220480762316396e-07, "epoch": 0.860102951716948, "percentage": 86.03, "elapsed_time": "4:48:32", "remaining_time": "0:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 1918, "loss": 0.192, "learning_rate": 2.6028632725281723e-07, "epoch": 0.86062422623314, "percentage": 86.08, "elapsed_time": "4:48:42", "remaining_time": "0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 1918, "loss": 0.2076, "learning_rate": 2.58374505673622e-07, "epoch": 0.8611455007493322, "percentage": 86.13, "elapsed_time": "4:48:52", "remaining_time": "0:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 1918, "loss": 0.1964, "learning_rate": 2.56469348569528e-07, "epoch": 0.8616667752655242, "percentage": 86.18, "elapsed_time": "4:49:03", "remaining_time": "0:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 1918, "loss": 0.1753, "learning_rate": 2.5457086160467187e-07, "epoch": 0.8621880497817163, "percentage": 86.24, "elapsed_time": "4:49:13", "remaining_time": "0:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 1918, "loss": 0.176, "learning_rate": 2.526790504233592e-07, "epoch": 0.8627093242979084, "percentage": 86.29, "elapsed_time": "4:49:23", "remaining_time": "0:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 1918, "loss": 0.1791, "learning_rate": 2.507939206500479e-07, "epoch": 0.8632305988141005, "percentage": 86.34, "elapsed_time": "4:49:33", "remaining_time": "0:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 1918, "loss": 0.1931, "learning_rate": 2.4891547788933185e-07, "epoch": 0.8637518733302926, "percentage": 86.39, "elapsed_time": "4:49:45", "remaining_time": "0:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 1918, "loss": 0.1797, "learning_rate": 2.4704372772592326e-07, "epoch": 0.8642731478464847, "percentage": 86.44, "elapsed_time": "4:49:55", "remaining_time": "0:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 1918, "loss": 0.1743, "learning_rate": 2.4517867572463884e-07, "epoch": 0.8647944223626768, "percentage": 86.5, "elapsed_time": "4:50:05", "remaining_time": "0:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 1918, "loss": 0.1689, "learning_rate": 2.433203274303794e-07, "epoch": 0.8653156968788689, "percentage": 86.55, "elapsed_time": "4:50:15", "remaining_time": "0:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 1918, "loss": 0.1753, "learning_rate": 2.414686883681158e-07, "epoch": 0.8658369713950609, "percentage": 86.6, "elapsed_time": "4:50:25", "remaining_time": "0:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 1918, "loss": 0.1825, "learning_rate": 2.3962376404287365e-07, "epoch": 0.866358245911253, "percentage": 86.65, "elapsed_time": "4:50:35", "remaining_time": "0:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 1918, "loss": 0.1866, "learning_rate": 2.3778555993971164e-07, "epoch": 0.8668795204274451, "percentage": 86.7, "elapsed_time": "4:50:45", "remaining_time": "0:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 1918, "loss": 0.1811, "learning_rate": 2.359540815237124e-07, "epoch": 0.8674007949436372, "percentage": 86.76, "elapsed_time": "4:50:56", "remaining_time": "0:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 1918, "loss": 0.1909, "learning_rate": 2.3412933423996114e-07, "epoch": 0.8679220694598293, "percentage": 86.81, "elapsed_time": "4:51:06", "remaining_time": "0:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 1918, "loss": 0.1809, "learning_rate": 2.3231132351353075e-07, "epoch": 0.8684433439760214, "percentage": 86.86, "elapsed_time": "4:51:17", "remaining_time": "0:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 1918, "loss": 0.1878, "learning_rate": 2.305000547494679e-07, "epoch": 0.8689646184922135, "percentage": 86.91, "elapsed_time": "4:51:27", "remaining_time": "0:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 1918, "loss": 0.1852, "learning_rate": 2.2869553333277145e-07, "epoch": 0.8694858930084055, "percentage": 86.97, "elapsed_time": "4:51:38", "remaining_time": "0:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 1918, "loss": 0.1733, "learning_rate": 2.2689776462838348e-07, "epoch": 0.8700071675245976, "percentage": 87.02, "elapsed_time": "4:51:49", "remaining_time": "0:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 1918, "loss": 0.1897, "learning_rate": 2.251067539811691e-07, "epoch": 0.8705284420407897, "percentage": 87.07, "elapsed_time": "4:51:59", "remaining_time": "0:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 1918, "loss": 0.1735, "learning_rate": 2.233225067158995e-07, "epoch": 0.8710497165569818, "percentage": 87.12, "elapsed_time": "4:52:08", "remaining_time": "0:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 1918, "loss": 0.1938, "learning_rate": 2.2154502813724026e-07, "epoch": 0.8715709910731739, "percentage": 87.17, "elapsed_time": "4:52:19", "remaining_time": "0:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 1918, "loss": 0.1958, "learning_rate": 2.1977432352973226e-07, "epoch": 0.872092265589366, "percentage": 87.23, "elapsed_time": "4:52:29", "remaining_time": "0:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 1918, "loss": 0.184, "learning_rate": 2.1801039815777637e-07, "epoch": 0.8726135401055581, "percentage": 87.28, "elapsed_time": "4:52:40", "remaining_time": "0:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 1918, "loss": 0.1737, "learning_rate": 2.1625325726562009e-07, "epoch": 0.8731348146217501, "percentage": 87.33, "elapsed_time": "4:52:50", "remaining_time": "0:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 1918, "loss": 0.1892, "learning_rate": 2.1450290607733903e-07, "epoch": 0.8736560891379422, "percentage": 87.38, "elapsed_time": "4:53:01", "remaining_time": "0:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 1918, "loss": 0.1625, "learning_rate": 2.127593497968225e-07, "epoch": 0.8741773636541343, "percentage": 87.43, "elapsed_time": "4:53:11", "remaining_time": "0:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 1918, "loss": 0.1869, "learning_rate": 2.1102259360775895e-07, "epoch": 0.8746986381703264, "percentage": 87.49, "elapsed_time": "4:53:22", "remaining_time": "0:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 1918, "loss": 0.1876, "learning_rate": 2.0929264267361888e-07, "epoch": 0.8752199126865186, "percentage": 87.54, "elapsed_time": "4:53:33", "remaining_time": "0:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 1918, "loss": 0.1662, "learning_rate": 2.07569502137642e-07, "epoch": 0.8757411872027107, "percentage": 87.59, "elapsed_time": "4:53:44", "remaining_time": "0:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 1918, "loss": 0.1799, "learning_rate": 2.0585317712281866e-07, "epoch": 0.8762624617189028, "percentage": 87.64, "elapsed_time": "4:53:54", "remaining_time": "0:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 1918, "loss": 0.1897, "learning_rate": 2.0414367273187713e-07, "epoch": 0.8767837362350948, "percentage": 87.7, "elapsed_time": "4:54:05", "remaining_time": "0:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 1918, "loss": 0.1916, "learning_rate": 2.0244099404726686e-07, "epoch": 0.8773050107512869, "percentage": 87.75, "elapsed_time": "4:54:15", "remaining_time": "0:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 1918, "loss": 0.1784, "learning_rate": 2.007451461311455e-07, "epoch": 0.877826285267479, "percentage": 87.8, "elapsed_time": "4:54:24", "remaining_time": "0:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 1918, "loss": 0.1858, "learning_rate": 1.990561340253608e-07, "epoch": 0.8783475597836711, "percentage": 87.85, "elapsed_time": "4:54:34", "remaining_time": "0:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 1918, "loss": 0.1876, "learning_rate": 1.9737396275143816e-07, "epoch": 0.8788688342998632, "percentage": 87.9, "elapsed_time": "4:54:45", "remaining_time": "0:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 1918, "loss": 0.1865, "learning_rate": 1.9569863731056544e-07, "epoch": 0.8793901088160553, "percentage": 87.96, "elapsed_time": "4:54:56", "remaining_time": "0:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 1918, "loss": 0.1725, "learning_rate": 1.940301626835761e-07, "epoch": 0.8799113833322474, "percentage": 88.01, "elapsed_time": "4:55:08", "remaining_time": "0:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 1918, "loss": 0.1896, "learning_rate": 1.9236854383093668e-07, "epoch": 0.8804326578484394, "percentage": 88.06, "elapsed_time": "4:55:17", "remaining_time": "0:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 1918, "loss": 0.1713, "learning_rate": 1.9071378569273047e-07, "epoch": 0.8809539323646315, "percentage": 88.11, "elapsed_time": "4:55:28", "remaining_time": "0:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 1918, "loss": 0.1791, "learning_rate": 1.8906589318864384e-07, "epoch": 0.8814752068808236, "percentage": 88.16, "elapsed_time": "4:55:38", "remaining_time": "0:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.8742487121795188e-07, "epoch": 0.8819964813970157, "percentage": 88.22, "elapsed_time": "4:55:49", "remaining_time": "0:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 1918, "loss": 0.1829, "learning_rate": 1.8579072465950197e-07, "epoch": 0.8825177559132078, "percentage": 88.27, "elapsed_time": "4:55:59", "remaining_time": "0:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 1918, "loss": 0.1887, "learning_rate": 1.8416345837170114e-07, "epoch": 0.8830390304293999, "percentage": 88.32, "elapsed_time": "4:56:11", "remaining_time": "0:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 1918, "loss": 0.1876, "learning_rate": 1.8254307719250214e-07, "epoch": 0.883560304945592, "percentage": 88.37, "elapsed_time": "4:56:21", "remaining_time": "0:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 1918, "loss": 0.178, "learning_rate": 1.8092958593938476e-07, "epoch": 0.8840815794617841, "percentage": 88.43, "elapsed_time": "4:56:32", "remaining_time": "0:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 1918, "loss": 0.1771, "learning_rate": 1.793229894093479e-07, "epoch": 0.8846028539779761, "percentage": 88.48, "elapsed_time": "4:56:41", "remaining_time": "0:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 1918, "loss": 0.1782, "learning_rate": 1.7772329237889158e-07, "epoch": 0.8851241284941682, "percentage": 88.53, "elapsed_time": "4:56:52", "remaining_time": "0:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 1918, "loss": 0.1761, "learning_rate": 1.7613049960400057e-07, "epoch": 0.8856454030103603, "percentage": 88.58, "elapsed_time": "4:57:03", "remaining_time": "0:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 1918, "loss": 0.1656, "learning_rate": 1.7454461582013665e-07, "epoch": 0.8861666775265524, "percentage": 88.63, "elapsed_time": "4:57:13", "remaining_time": "0:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 1918, "loss": 0.1829, "learning_rate": 1.7296564574221796e-07, "epoch": 0.8866879520427445, "percentage": 88.69, "elapsed_time": "4:57:23", "remaining_time": "0:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 1918, "loss": 0.174, "learning_rate": 1.7139359406460888e-07, "epoch": 0.8872092265589366, "percentage": 88.74, "elapsed_time": "4:57:34", "remaining_time": "0:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 1918, "loss": 0.1709, "learning_rate": 1.698284654611057e-07, "epoch": 0.8877305010751287, "percentage": 88.79, "elapsed_time": "4:57:44", "remaining_time": "0:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 1918, "loss": 0.1808, "learning_rate": 1.6827026458492018e-07, "epoch": 0.8882517755913207, "percentage": 88.84, "elapsed_time": "4:57:53", "remaining_time": "0:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 1918, "loss": 0.1835, "learning_rate": 1.6671899606866966e-07, "epoch": 0.8887730501075128, "percentage": 88.89, "elapsed_time": "4:58:03", "remaining_time": "0:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 1918, "loss": 0.1679, "learning_rate": 1.651746645243596e-07, "epoch": 0.889294324623705, "percentage": 88.95, "elapsed_time": "4:58:11", "remaining_time": "0:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 1918, "loss": 0.1767, "learning_rate": 1.6363727454337202e-07, "epoch": 0.889815599139897, "percentage": 89.0, "elapsed_time": "4:58:22", "remaining_time": "0:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 1918, "loss": 0.1799, "learning_rate": 1.6210683069645212e-07, "epoch": 0.8903368736560892, "percentage": 89.05, "elapsed_time": "4:58:32", "remaining_time": "0:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 1918, "loss": 0.1651, "learning_rate": 1.6058333753369265e-07, "epoch": 0.8908581481722813, "percentage": 89.1, "elapsed_time": "4:58:43", "remaining_time": "0:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 1918, "loss": 0.1893, "learning_rate": 1.5906679958452215e-07, "epoch": 0.8913794226884734, "percentage": 89.16, "elapsed_time": "4:58:54", "remaining_time": "0:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 1918, "loss": 0.178, "learning_rate": 1.5755722135769036e-07, "epoch": 0.8919006972046654, "percentage": 89.21, "elapsed_time": "4:59:04", "remaining_time": "0:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 1918, "loss": 0.1841, "learning_rate": 1.5605460734125582e-07, "epoch": 0.8924219717208575, "percentage": 89.26, "elapsed_time": "4:59:14", "remaining_time": "0:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 1918, "loss": 0.1772, "learning_rate": 1.545589620025731e-07, "epoch": 0.8929432462370496, "percentage": 89.31, "elapsed_time": "4:59:26", "remaining_time": "0:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 1918, "loss": 0.1743, "learning_rate": 1.530702897882766e-07, "epoch": 0.8934645207532417, "percentage": 89.36, "elapsed_time": "4:59:36", "remaining_time": "0:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 1918, "loss": 0.1797, "learning_rate": 1.5158859512427044e-07, "epoch": 0.8939857952694338, "percentage": 89.42, "elapsed_time": "4:59:46", "remaining_time": "0:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 1918, "loss": 0.1722, "learning_rate": 1.501138824157139e-07, "epoch": 0.8945070697856259, "percentage": 89.47, "elapsed_time": "4:59:56", "remaining_time": "0:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 1918, "loss": 0.1839, "learning_rate": 1.4864615604700872e-07, "epoch": 0.895028344301818, "percentage": 89.52, "elapsed_time": "5:00:08", "remaining_time": "0:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 1918, "loss": 0.2006, "learning_rate": 1.471854203817852e-07, "epoch": 0.89554961881801, "percentage": 89.57, "elapsed_time": "5:00:18", "remaining_time": "0:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 1918, "loss": 0.1812, "learning_rate": 1.4573167976288994e-07, "epoch": 0.8960708933342021, "percentage": 89.62, "elapsed_time": "5:00:29", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 1918, "loss": 0.1803, "learning_rate": 1.4428493851237403e-07, "epoch": 0.8965921678503942, "percentage": 89.68, "elapsed_time": "5:00:41", "remaining_time": "0:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 1918, "loss": 0.1837, "learning_rate": 1.4284520093147818e-07, "epoch": 0.8971134423665863, "percentage": 89.73, "elapsed_time": "5:00:52", "remaining_time": "0:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 1918, "loss": 0.1856, "learning_rate": 1.4141247130062069e-07, "epoch": 0.8976347168827784, "percentage": 89.78, "elapsed_time": "5:01:04", "remaining_time": "0:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 1918, "loss": 0.1864, "learning_rate": 1.3998675387938476e-07, "epoch": 0.8981559913989705, "percentage": 89.83, "elapsed_time": "5:01:14", "remaining_time": "0:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 1918, "loss": 0.1592, "learning_rate": 1.3856805290650644e-07, "epoch": 0.8986772659151626, "percentage": 89.89, "elapsed_time": "5:01:26", "remaining_time": "0:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 1918, "loss": 0.1749, "learning_rate": 1.3715637259986147e-07, "epoch": 0.8991985404313546, "percentage": 89.94, "elapsed_time": "5:01:36", "remaining_time": "0:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 1918, "loss": 0.1798, "learning_rate": 1.3575171715645235e-07, "epoch": 0.8997198149475467, "percentage": 89.99, "elapsed_time": "5:01:46", "remaining_time": "0:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 1918, "loss": 0.1691, "learning_rate": 1.343540907523963e-07, "epoch": 0.9002410894637388, "percentage": 90.04, "elapsed_time": "5:01:57", "remaining_time": "0:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 1918, "loss": 0.1848, "learning_rate": 1.3296349754291366e-07, "epoch": 0.9007623639799309, "percentage": 90.09, "elapsed_time": "5:02:06", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 1918, "loss": 0.1821, "learning_rate": 1.3157994166231342e-07, "epoch": 0.901283638496123, "percentage": 90.15, "elapsed_time": "5:02:17", "remaining_time": "0:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 1918, "loss": 0.179, "learning_rate": 1.3020342722398273e-07, "epoch": 0.9018049130123151, "percentage": 90.2, "elapsed_time": "5:02:28", "remaining_time": "0:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 1918, "loss": 0.1847, "learning_rate": 1.2883395832037516e-07, "epoch": 0.9023261875285072, "percentage": 90.25, "elapsed_time": "5:02:37", "remaining_time": "0:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 1918, "loss": 0.1866, "learning_rate": 1.2747153902299524e-07, "epoch": 0.9028474620446993, "percentage": 90.3, "elapsed_time": "5:02:46", "remaining_time": "0:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 1918, "loss": 0.1985, "learning_rate": 1.2611617338239097e-07, "epoch": 0.9033687365608913, "percentage": 90.35, "elapsed_time": "5:02:57", "remaining_time": "0:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 1918, "loss": 0.1728, "learning_rate": 1.247678654281384e-07, "epoch": 0.9038900110770834, "percentage": 90.41, "elapsed_time": "5:03:07", "remaining_time": "0:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 1918, "loss": 0.1624, "learning_rate": 1.234266191688302e-07, "epoch": 0.9044112855932755, "percentage": 90.46, "elapsed_time": "5:03:18", "remaining_time": "0:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 1918, "loss": 0.1828, "learning_rate": 1.2209243859206577e-07, "epoch": 0.9049325601094677, "percentage": 90.51, "elapsed_time": "5:03:28", "remaining_time": "0:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 1918, "loss": 0.1718, "learning_rate": 1.2076532766443578e-07, "epoch": 0.9054538346256598, "percentage": 90.56, "elapsed_time": "5:03:38", "remaining_time": "0:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 1918, "loss": 0.1793, "learning_rate": 1.1944529033151436e-07, "epoch": 0.9059751091418519, "percentage": 90.62, "elapsed_time": "5:03:48", "remaining_time": "0:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 1918, "loss": 0.1548, "learning_rate": 1.1813233051784417e-07, "epoch": 0.906496383658044, "percentage": 90.67, "elapsed_time": "5:03:57", "remaining_time": "0:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 1918, "loss": 0.1735, "learning_rate": 1.1682645212692634e-07, "epoch": 0.907017658174236, "percentage": 90.72, "elapsed_time": "5:04:08", "remaining_time": "0:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 1918, "loss": 0.1723, "learning_rate": 1.1552765904120966e-07, "epoch": 0.9075389326904281, "percentage": 90.77, "elapsed_time": "5:04:18", "remaining_time": "0:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 1918, "loss": 0.1707, "learning_rate": 1.1423595512207591e-07, "epoch": 0.9080602072066202, "percentage": 90.82, "elapsed_time": "5:04:27", "remaining_time": "0:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 1918, "loss": 0.1727, "learning_rate": 1.1295134420983179e-07, "epoch": 0.9085814817228123, "percentage": 90.88, "elapsed_time": "5:04:38", "remaining_time": "0:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 1918, "loss": 0.1719, "learning_rate": 1.1167383012369609e-07, "epoch": 0.9091027562390044, "percentage": 90.93, "elapsed_time": "5:04:47", "remaining_time": "0:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 1918, "loss": 0.1732, "learning_rate": 1.1040341666178733e-07, "epoch": 0.9096240307551965, "percentage": 90.98, "elapsed_time": "5:04:57", "remaining_time": "0:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 1918, "loss": 0.1814, "learning_rate": 1.0914010760111476e-07, "epoch": 0.9101453052713886, "percentage": 91.03, "elapsed_time": "5:05:07", "remaining_time": "0:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 1918, "loss": 0.1755, "learning_rate": 1.078839066975651e-07, "epoch": 0.9106665797875806, "percentage": 91.08, "elapsed_time": "5:05:16", "remaining_time": "0:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 1918, "loss": 0.1845, "learning_rate": 1.0663481768589196e-07, "epoch": 0.9111878543037727, "percentage": 91.14, "elapsed_time": "5:05:28", "remaining_time": "0:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 1918, "loss": 0.1709, "learning_rate": 1.0539284427970559e-07, "epoch": 0.9117091288199648, "percentage": 91.19, "elapsed_time": "5:05:38", "remaining_time": "0:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 1918, "loss": 0.1746, "learning_rate": 1.0415799017146094e-07, "epoch": 0.9122304033361569, "percentage": 91.24, "elapsed_time": "5:05:48", "remaining_time": "0:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 1918, "loss": 0.173, "learning_rate": 1.029302590324463e-07, "epoch": 0.912751677852349, "percentage": 91.29, "elapsed_time": "5:06:00", "remaining_time": "0:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 1918, "loss": 0.1766, "learning_rate": 1.0170965451277382e-07, "epoch": 0.9132729523685411, "percentage": 91.35, "elapsed_time": "5:06:10", "remaining_time": "0:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 1918, "loss": 0.1831, "learning_rate": 1.0049618024136703e-07, "epoch": 0.9137942268847332, "percentage": 91.4, "elapsed_time": "5:06:21", "remaining_time": "0:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 1918, "loss": 0.1649, "learning_rate": 9.928983982595175e-08, "epoch": 0.9143155014009252, "percentage": 91.45, "elapsed_time": "5:06:31", "remaining_time": "0:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 1918, "loss": 0.192, "learning_rate": 9.809063685304376e-08, "epoch": 0.9148367759171173, "percentage": 91.5, "elapsed_time": "5:06:42", "remaining_time": "0:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 1918, "loss": 0.1837, "learning_rate": 9.689857488793891e-08, "epoch": 0.9153580504333094, "percentage": 91.55, "elapsed_time": "5:06:53", "remaining_time": "0:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 1918, "loss": 0.1837, "learning_rate": 9.571365747470251e-08, "epoch": 0.9158793249495015, "percentage": 91.61, "elapsed_time": "5:07:03", "remaining_time": "0:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 1918, "loss": 0.1731, "learning_rate": 9.45358881361591e-08, "epoch": 0.9164005994656936, "percentage": 91.66, "elapsed_time": "5:07:15", "remaining_time": "0:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 1918, "loss": 0.1756, "learning_rate": 9.336527037388132e-08, "epoch": 0.9169218739818857, "percentage": 91.71, "elapsed_time": "5:07:26", "remaining_time": "0:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 1918, "loss": 0.1826, "learning_rate": 9.22018076681791e-08, "epoch": 0.9174431484980778, "percentage": 91.76, "elapsed_time": "5:07:37", "remaining_time": "0:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 1918, "loss": 0.1721, "learning_rate": 9.10455034780916e-08, "epoch": 0.9179644230142698, "percentage": 91.81, "elapsed_time": "5:07:48", "remaining_time": "0:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 1918, "loss": 0.1827, "learning_rate": 8.989636124137363e-08, "epoch": 0.9184856975304619, "percentage": 91.87, "elapsed_time": "5:07:58", "remaining_time": "0:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 1918, "loss": 0.1785, "learning_rate": 8.875438437448813e-08, "epoch": 0.919006972046654, "percentage": 91.92, "elapsed_time": "5:08:08", "remaining_time": "0:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 1918, "loss": 0.1718, "learning_rate": 8.761957627259509e-08, "epoch": 0.9195282465628462, "percentage": 91.97, "elapsed_time": "5:08:20", "remaining_time": "0:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 1918, "loss": 0.1744, "learning_rate": 8.649194030953989e-08, "epoch": 0.9200495210790383, "percentage": 92.02, "elapsed_time": "5:08:30", "remaining_time": "0:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 1918, "loss": 0.1751, "learning_rate": 8.537147983784716e-08, "epoch": 0.9205707955952304, "percentage": 92.08, "elapsed_time": "5:08:41", "remaining_time": "0:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 1918, "loss": 0.1757, "learning_rate": 8.425819818870667e-08, "epoch": 0.9210920701114225, "percentage": 92.13, "elapsed_time": "5:08:51", "remaining_time": "0:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 1918, "loss": 0.1854, "learning_rate": 8.3152098671965e-08, "epoch": 0.9216133446276146, "percentage": 92.18, "elapsed_time": "5:09:02", "remaining_time": "0:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 1918, "loss": 0.1859, "learning_rate": 8.205318457611772e-08, "epoch": 0.9221346191438066, "percentage": 92.23, "elapsed_time": "5:09:13", "remaining_time": "0:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 1918, "loss": 0.1756, "learning_rate": 8.096145916829529e-08, "epoch": 0.9226558936599987, "percentage": 92.28, "elapsed_time": "5:09:24", "remaining_time": "0:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 1918, "loss": 0.1679, "learning_rate": 7.98769256942572e-08, "epoch": 0.9231771681761908, "percentage": 92.34, "elapsed_time": "5:09:35", "remaining_time": "0:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 1918, "loss": 0.1877, "learning_rate": 7.879958737838201e-08, "epoch": 0.9236984426923829, "percentage": 92.39, "elapsed_time": "5:09:44", "remaining_time": "0:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 1918, "loss": 0.1773, "learning_rate": 7.77294474236534e-08, "epoch": 0.924219717208575, "percentage": 92.44, "elapsed_time": "5:09:54", "remaining_time": "0:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 1918, "loss": 0.1889, "learning_rate": 7.66665090116575e-08, "epoch": 0.9247409917247671, "percentage": 92.49, "elapsed_time": "5:10:04", "remaining_time": "0:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 1918, "loss": 0.1837, "learning_rate": 7.561077530256755e-08, "epoch": 0.9252622662409592, "percentage": 92.54, "elapsed_time": "5:10:14", "remaining_time": "0:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 1918, "loss": 0.1952, "learning_rate": 7.456224943513779e-08, "epoch": 0.9257835407571512, "percentage": 92.6, "elapsed_time": "5:10:23", "remaining_time": "0:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 1918, "loss": 0.1787, "learning_rate": 7.352093452669324e-08, "epoch": 0.9263048152733433, "percentage": 92.65, "elapsed_time": "5:10:33", "remaining_time": "0:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 1918, "loss": 0.1841, "learning_rate": 7.248683367311937e-08, "epoch": 0.9268260897895354, "percentage": 92.7, "elapsed_time": "5:10:45", "remaining_time": "0:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 1918, "loss": 0.1821, "learning_rate": 7.145994994885497e-08, "epoch": 0.9273473643057275, "percentage": 92.75, "elapsed_time": "5:10:55", "remaining_time": "0:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 1918, "loss": 0.1768, "learning_rate": 7.044028640688122e-08, "epoch": 0.9278686388219196, "percentage": 92.81, "elapsed_time": "5:11:05", "remaining_time": "0:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 1918, "loss": 0.1759, "learning_rate": 6.942784607871373e-08, "epoch": 0.9283899133381117, "percentage": 92.86, "elapsed_time": "5:11:15", "remaining_time": "0:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 1918, "loss": 0.1776, "learning_rate": 6.842263197439303e-08, "epoch": 0.9289111878543038, "percentage": 92.91, "elapsed_time": "5:11:26", "remaining_time": "0:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 1918, "loss": 0.1889, "learning_rate": 6.742464708247548e-08, "epoch": 0.9294324623704958, "percentage": 92.96, "elapsed_time": "5:11:38", "remaining_time": "0:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 1918, "loss": 0.1671, "learning_rate": 6.643389437002462e-08, "epoch": 0.9299537368866879, "percentage": 93.01, "elapsed_time": "5:11:49", "remaining_time": "0:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 1918, "loss": 0.1823, "learning_rate": 6.545037678260257e-08, "epoch": 0.93047501140288, "percentage": 93.07, "elapsed_time": "5:11:59", "remaining_time": "0:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 1918, "loss": 0.1688, "learning_rate": 6.447409724426063e-08, "epoch": 0.9309962859190721, "percentage": 93.12, "elapsed_time": "5:12:09", "remaining_time": "0:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 1918, "loss": 0.1722, "learning_rate": 6.350505865753142e-08, "epoch": 0.9315175604352642, "percentage": 93.17, "elapsed_time": "5:12:20", "remaining_time": "0:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 1918, "loss": 0.1577, "learning_rate": 6.254326390341958e-08, "epoch": 0.9320388349514563, "percentage": 93.22, "elapsed_time": "5:12:30", "remaining_time": "0:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 1918, "loss": 0.1828, "learning_rate": 6.158871584139303e-08, "epoch": 0.9325601094676484, "percentage": 93.27, "elapsed_time": "5:12:40", "remaining_time": "0:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 1918, "loss": 0.1841, "learning_rate": 6.06414173093764e-08, "epoch": 0.9330813839838404, "percentage": 93.33, "elapsed_time": "5:12:50", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 1918, "loss": 0.1789, "learning_rate": 5.970137112373903e-08, "epoch": 0.9336026585000325, "percentage": 93.38, "elapsed_time": "5:13:01", "remaining_time": "0:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 1918, "loss": 0.1953, "learning_rate": 5.876858007929004e-08, "epoch": 0.9341239330162247, "percentage": 93.43, "elapsed_time": "5:13:11", "remaining_time": "0:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 1918, "loss": 0.1655, "learning_rate": 5.784304694926773e-08, "epoch": 0.9346452075324168, "percentage": 93.48, "elapsed_time": "5:13:21", "remaining_time": "0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 1918, "loss": 0.1764, "learning_rate": 5.692477448533351e-08, "epoch": 0.9351664820486089, "percentage": 93.53, "elapsed_time": "5:13:32", "remaining_time": "0:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 1918, "loss": 0.1748, "learning_rate": 5.601376541756076e-08, "epoch": 0.935687756564801, "percentage": 93.59, "elapsed_time": "5:13:43", "remaining_time": "0:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 1918, "loss": 0.1738, "learning_rate": 5.511002245442987e-08, "epoch": 0.9362090310809931, "percentage": 93.64, "elapsed_time": "5:13:53", "remaining_time": "0:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 1918, "loss": 0.1787, "learning_rate": 5.4213548282817664e-08, "epoch": 0.9367303055971851, "percentage": 93.69, "elapsed_time": "5:14:03", "remaining_time": "0:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 1918, "loss": 0.1811, "learning_rate": 5.3324345567990485e-08, "epoch": 0.9372515801133772, "percentage": 93.74, "elapsed_time": "5:14:15", "remaining_time": "0:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 1918, "loss": 0.177, "learning_rate": 5.244241695359753e-08, "epoch": 0.9377728546295693, "percentage": 93.8, "elapsed_time": "5:14:25", "remaining_time": "0:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 1918, "loss": 0.1651, "learning_rate": 5.156776506166028e-08, "epoch": 0.9382941291457614, "percentage": 93.85, "elapsed_time": "5:14:35", "remaining_time": "0:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 1918, "loss": 0.2017, "learning_rate": 5.070039249256642e-08, "epoch": 0.9388154036619535, "percentage": 93.9, "elapsed_time": "5:14:46", "remaining_time": "0:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 1918, "loss": 0.1755, "learning_rate": 4.984030182506233e-08, "epoch": 0.9393366781781456, "percentage": 93.95, "elapsed_time": "5:14:56", "remaining_time": "0:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 1918, "loss": 0.183, "learning_rate": 4.89874956162445e-08, "epoch": 0.9398579526943377, "percentage": 94.0, "elapsed_time": "5:15:06", "remaining_time": "0:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 1918, "loss": 0.1795, "learning_rate": 4.814197640155199e-08, "epoch": 0.9403792272105298, "percentage": 94.06, "elapsed_time": "5:15:17", "remaining_time": "0:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 1918, "loss": 0.1775, "learning_rate": 4.73037466947604e-08, "epoch": 0.9409005017267218, "percentage": 94.11, "elapsed_time": "5:15:28", "remaining_time": "0:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 1918, "loss": 0.1862, "learning_rate": 4.64728089879718e-08, "epoch": 0.9414217762429139, "percentage": 94.16, "elapsed_time": "5:15:39", "remaining_time": "0:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 1918, "loss": 0.1729, "learning_rate": 4.564916575160977e-08, "epoch": 0.941943050759106, "percentage": 94.21, "elapsed_time": "5:15:48", "remaining_time": "0:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 1918, "loss": 0.1844, "learning_rate": 4.4832819434410535e-08, "epoch": 0.9424643252752981, "percentage": 94.26, "elapsed_time": "5:15:59", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 1918, "loss": 0.17, "learning_rate": 4.402377246341627e-08, "epoch": 0.9429855997914902, "percentage": 94.32, "elapsed_time": "5:16:10", "remaining_time": "0:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 1918, "loss": 0.1765, "learning_rate": 4.322202724396818e-08, "epoch": 0.9435068743076823, "percentage": 94.37, "elapsed_time": "5:16:19", "remaining_time": "0:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 1918, "loss": 0.1811, "learning_rate": 4.2427586159697886e-08, "epoch": 0.9440281488238744, "percentage": 94.42, "elapsed_time": "5:16:29", "remaining_time": "0:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 1918, "loss": 0.1796, "learning_rate": 4.164045157252272e-08, "epoch": 0.9445494233400664, "percentage": 94.47, "elapsed_time": "5:16:41", "remaining_time": "0:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 1918, "loss": 0.1669, "learning_rate": 4.086062582263656e-08, "epoch": 0.9450706978562585, "percentage": 94.53, "elapsed_time": "5:16:51", "remaining_time": "0:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 1918, "loss": 0.1843, "learning_rate": 4.008811122850426e-08, "epoch": 0.9455919723724506, "percentage": 94.58, "elapsed_time": "5:17:01", "remaining_time": "0:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 1918, "loss": 0.1894, "learning_rate": 3.9322910086853625e-08, "epoch": 0.9461132468886427, "percentage": 94.63, "elapsed_time": "5:17:11", "remaining_time": "0:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 1918, "loss": 0.1737, "learning_rate": 3.856502467266987e-08, "epoch": 0.9466345214048348, "percentage": 94.68, "elapsed_time": "5:17:21", "remaining_time": "0:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 1918, "loss": 0.1792, "learning_rate": 3.7814457239187255e-08, "epoch": 0.9471557959210269, "percentage": 94.73, "elapsed_time": "5:17:31", "remaining_time": "0:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 1918, "loss": 0.1973, "learning_rate": 3.707121001788438e-08, "epoch": 0.947677070437219, "percentage": 94.79, "elapsed_time": "5:17:42", "remaining_time": "0:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 1918, "loss": 0.1765, "learning_rate": 3.633528521847507e-08, "epoch": 0.948198344953411, "percentage": 94.84, "elapsed_time": "5:17:52", "remaining_time": "0:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 1918, "loss": 0.1896, "learning_rate": 3.5606685028904686e-08, "epoch": 0.9487196194696031, "percentage": 94.89, "elapsed_time": "5:18:03", "remaining_time": "0:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 1918, "loss": 0.1827, "learning_rate": 3.4885411615341034e-08, "epoch": 0.9492408939857953, "percentage": 94.94, "elapsed_time": "5:18:13", "remaining_time": "0:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 1918, "loss": 0.1791, "learning_rate": 3.4171467122169344e-08, "epoch": 0.9497621685019874, "percentage": 94.99, "elapsed_time": "5:18:21", "remaining_time": "0:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 1918, "loss": 0.1821, "learning_rate": 3.346485367198588e-08, "epoch": 0.9502834430181795, "percentage": 95.05, "elapsed_time": "5:18:32", "remaining_time": "0:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 1918, "loss": 0.1771, "learning_rate": 3.2765573365591e-08, "epoch": 0.9508047175343716, "percentage": 95.1, "elapsed_time": "5:18:40", "remaining_time": "0:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 1918, "loss": 0.1812, "learning_rate": 3.207362828198307e-08, "epoch": 0.9513259920505637, "percentage": 95.15, "elapsed_time": "5:18:51", "remaining_time": "0:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 1918, "loss": 0.1781, "learning_rate": 3.138902047835263e-08, "epoch": 0.9518472665667557, "percentage": 95.2, "elapsed_time": "5:19:01", "remaining_time": "0:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 1918, "loss": 0.1763, "learning_rate": 3.071175199007653e-08, "epoch": 0.9523685410829478, "percentage": 95.26, "elapsed_time": "5:19:13", "remaining_time": "0:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 1918, "loss": 0.1762, "learning_rate": 3.00418248307105e-08, "epoch": 0.9528898155991399, "percentage": 95.31, "elapsed_time": "5:19:23", "remaining_time": "0:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 1918, "loss": 0.1769, "learning_rate": 2.9379240991984635e-08, "epoch": 0.953411090115332, "percentage": 95.36, "elapsed_time": "5:19:32", "remaining_time": "0:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 1918, "loss": 0.1694, "learning_rate": 2.8724002443797083e-08, "epoch": 0.9539323646315241, "percentage": 95.41, "elapsed_time": "5:19:41", "remaining_time": "0:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 1918, "loss": 0.1901, "learning_rate": 2.807611113420816e-08, "epoch": 0.9544536391477162, "percentage": 95.46, "elapsed_time": "5:19:52", "remaining_time": "0:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 1918, "loss": 0.1732, "learning_rate": 2.743556898943345e-08, "epoch": 0.9549749136639083, "percentage": 95.52, "elapsed_time": "5:20:02", "remaining_time": "0:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 1918, "loss": 0.1687, "learning_rate": 2.680237791384044e-08, "epoch": 0.9554961881801003, "percentage": 95.57, "elapsed_time": "5:20:14", "remaining_time": "0:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 1918, "loss": 0.1787, "learning_rate": 2.6176539789939947e-08, "epoch": 0.9560174626962924, "percentage": 95.62, "elapsed_time": "5:20:24", "remaining_time": "0:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 1918, "loss": 0.1721, "learning_rate": 2.5558056478383887e-08, "epoch": 0.9565387372124845, "percentage": 95.67, "elapsed_time": "5:20:35", "remaining_time": "0:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 1918, "loss": 0.1726, "learning_rate": 2.4946929817956376e-08, "epoch": 0.9570600117286766, "percentage": 95.72, "elapsed_time": "5:20:45", "remaining_time": "0:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 1918, "loss": 0.1799, "learning_rate": 2.4343161625570433e-08, "epoch": 0.9575812862448687, "percentage": 95.78, "elapsed_time": "5:20:56", "remaining_time": "0:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 1918, "loss": 0.1767, "learning_rate": 2.3746753696262113e-08, "epoch": 0.9581025607610608, "percentage": 95.83, "elapsed_time": "5:21:06", "remaining_time": "0:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 1918, "loss": 0.1735, "learning_rate": 2.3157707803184438e-08, "epoch": 0.9586238352772529, "percentage": 95.88, "elapsed_time": "5:21:16", "remaining_time": "0:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 1918, "loss": 0.179, "learning_rate": 2.2576025697603198e-08, "epoch": 0.959145109793445, "percentage": 95.93, "elapsed_time": "5:21:25", "remaining_time": "0:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 1918, "loss": 0.1721, "learning_rate": 2.2001709108891155e-08, "epoch": 0.959666384309637, "percentage": 95.99, "elapsed_time": "5:21:36", "remaining_time": "0:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 1918, "loss": 0.1816, "learning_rate": 2.143475974452275e-08, "epoch": 0.9601876588258291, "percentage": 96.04, "elapsed_time": "5:21:46", "remaining_time": "0:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 1918, "loss": 0.1759, "learning_rate": 2.0875179290069934e-08, "epoch": 0.9607089333420212, "percentage": 96.09, "elapsed_time": "5:21:56", "remaining_time": "0:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 1918, "loss": 0.1792, "learning_rate": 2.032296940919526e-08, "epoch": 0.9612302078582133, "percentage": 96.14, "elapsed_time": "5:22:06", "remaining_time": "0:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 1918, "loss": 0.1823, "learning_rate": 1.9778131743649064e-08, "epoch": 0.9617514823744054, "percentage": 96.19, "elapsed_time": "5:22:18", "remaining_time": "0:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 1918, "loss": 0.1639, "learning_rate": 1.9240667913264233e-08, "epoch": 0.9622727568905975, "percentage": 96.25, "elapsed_time": "5:22:28", "remaining_time": "0:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 1918, "loss": 0.1877, "learning_rate": 1.8710579515948957e-08, "epoch": 0.9627940314067897, "percentage": 96.3, "elapsed_time": "5:22:39", "remaining_time": "0:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 1918, "loss": 0.1812, "learning_rate": 1.8187868127685914e-08, "epoch": 0.9633153059229816, "percentage": 96.35, "elapsed_time": "5:22:50", "remaining_time": "0:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 1918, "loss": 0.165, "learning_rate": 1.767253530252422e-08, "epoch": 0.9638365804391738, "percentage": 96.4, "elapsed_time": "5:22:59", "remaining_time": "0:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 1918, "loss": 0.1846, "learning_rate": 1.716458257257636e-08, "epoch": 0.9643578549553659, "percentage": 96.45, "elapsed_time": "5:23:09", "remaining_time": "0:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 1918, "loss": 0.1845, "learning_rate": 1.666401144801405e-08, "epoch": 0.964879129471558, "percentage": 96.51, "elapsed_time": "5:23:20", "remaining_time": "0:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 1918, "loss": 0.1809, "learning_rate": 1.6170823417062386e-08, "epoch": 0.9654004039877501, "percentage": 96.56, "elapsed_time": "5:23:30", "remaining_time": "0:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 1918, "loss": 0.1865, "learning_rate": 1.568501994599625e-08, "epoch": 0.9659216785039422, "percentage": 96.61, "elapsed_time": "5:23:40", "remaining_time": "0:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 1918, "loss": 0.1912, "learning_rate": 1.5206602479135857e-08, "epoch": 0.9664429530201343, "percentage": 96.66, "elapsed_time": "5:23:51", "remaining_time": "0:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 1918, "loss": 0.1788, "learning_rate": 1.4735572438842605e-08, "epoch": 0.9669642275363263, "percentage": 96.72, "elapsed_time": "5:24:01", "remaining_time": "0:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 1918, "loss": 0.1653, "learning_rate": 1.4271931225514624e-08, "epoch": 0.9674855020525184, "percentage": 96.77, "elapsed_time": "5:24:11", "remaining_time": "0:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 1918, "loss": 0.1838, "learning_rate": 1.381568021758234e-08, "epoch": 0.9680067765687105, "percentage": 96.82, "elapsed_time": "5:24:22", "remaining_time": "0:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 1918, "loss": 0.1801, "learning_rate": 1.336682077150514e-08, "epoch": 0.9685280510849026, "percentage": 96.87, "elapsed_time": "5:24:32", "remaining_time": "0:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 1918, "loss": 0.1944, "learning_rate": 1.2925354221766661e-08, "epoch": 0.9690493256010947, "percentage": 96.92, "elapsed_time": "5:24:42", "remaining_time": "0:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 1918, "loss": 0.1866, "learning_rate": 1.2491281880871175e-08, "epoch": 0.9695706001172868, "percentage": 96.98, "elapsed_time": "5:24:52", "remaining_time": "0:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 1918, "loss": 0.1726, "learning_rate": 1.206460503933915e-08, "epoch": 0.9700918746334789, "percentage": 97.03, "elapsed_time": "5:25:02", "remaining_time": "0:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 1918, "loss": 0.1764, "learning_rate": 1.1645324965704473e-08, "epoch": 0.9706131491496709, "percentage": 97.08, "elapsed_time": "5:25:12", "remaining_time": "0:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 1918, "loss": 0.1856, "learning_rate": 1.1233442906509462e-08, "epoch": 0.971134423665863, "percentage": 97.13, "elapsed_time": "5:25:23", "remaining_time": "0:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 1918, "loss": 0.1735, "learning_rate": 1.0828960086302075e-08, "epoch": 0.9716556981820551, "percentage": 97.18, "elapsed_time": "5:25:34", "remaining_time": "0:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 1918, "loss": 0.1865, "learning_rate": 1.0431877707632043e-08, "epoch": 0.9721769726982472, "percentage": 97.24, "elapsed_time": "5:25:43", "remaining_time": "0:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 1918, "loss": 0.1834, "learning_rate": 1.0042196951046968e-08, "epoch": 0.9726982472144393, "percentage": 97.29, "elapsed_time": "5:25:53", "remaining_time": "0:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 1918, "loss": 0.1955, "learning_rate": 9.659918975088444e-09, "epoch": 0.9732195217306314, "percentage": 97.34, "elapsed_time": "5:26:04", "remaining_time": "0:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 1918, "loss": 0.1891, "learning_rate": 9.285044916290675e-09, "epoch": 0.9737407962468235, "percentage": 97.39, "elapsed_time": "5:26:14", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 1918, "loss": 0.1802, "learning_rate": 8.91757588917408e-09, "epoch": 0.9742620707630155, "percentage": 97.45, "elapsed_time": "5:26:24", "remaining_time": "0:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 1918, "loss": 0.1824, "learning_rate": 8.557512986244464e-09, "epoch": 0.9747833452792076, "percentage": 97.5, "elapsed_time": "5:26:34", "remaining_time": "0:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 1918, "loss": 0.1766, "learning_rate": 8.20485727798831e-09, "epoch": 0.9753046197953997, "percentage": 97.55, "elapsed_time": "5:26:44", "remaining_time": "0:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 1918, "loss": 0.173, "learning_rate": 7.85960981287026e-09, "epoch": 0.9758258943115918, "percentage": 97.6, "elapsed_time": "5:26:55", "remaining_time": "0:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 1918, "loss": 0.1688, "learning_rate": 7.521771617330365e-09, "epoch": 0.9763471688277839, "percentage": 97.65, "elapsed_time": "5:27:05", "remaining_time": "0:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 1918, "loss": 0.1881, "learning_rate": 7.191343695779618e-09, "epoch": 0.976868443343976, "percentage": 97.71, "elapsed_time": "5:27:15", "remaining_time": "0:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 1918, "loss": 0.1907, "learning_rate": 6.86832703059831e-09, "epoch": 0.9773897178601682, "percentage": 97.76, "elapsed_time": "5:27:26", "remaining_time": "0:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 1918, "loss": 0.1774, "learning_rate": 6.552722582132687e-09, "epoch": 0.9779109923763603, "percentage": 97.81, "elapsed_time": "5:27:36", "remaining_time": "0:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 1918, "loss": 0.1806, "learning_rate": 6.24453128869218e-09, "epoch": 0.9784322668925522, "percentage": 97.86, "elapsed_time": "5:27:46", "remaining_time": "0:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 1918, "loss": 0.1768, "learning_rate": 5.94375406654607e-09, "epoch": 0.9789535414087444, "percentage": 97.91, "elapsed_time": "5:27:58", "remaining_time": "0:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 1918, "loss": 0.1861, "learning_rate": 5.650391809922107e-09, "epoch": 0.9794748159249365, "percentage": 97.97, "elapsed_time": "5:28:08", "remaining_time": "0:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 1918, "loss": 0.1728, "learning_rate": 5.364445391001228e-09, "epoch": 0.9799960904411286, "percentage": 98.02, "elapsed_time": "5:28:19", "remaining_time": "0:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 1918, "loss": 0.1743, "learning_rate": 5.085915659918672e-09, "epoch": 0.9805173649573207, "percentage": 98.07, "elapsed_time": "5:28:29", "remaining_time": "0:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 1918, "loss": 0.1763, "learning_rate": 4.814803444758431e-09, "epoch": 0.9810386394735128, "percentage": 98.12, "elapsed_time": "5:28:39", "remaining_time": "0:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 1918, "loss": 0.1911, "learning_rate": 4.551109551551581e-09, "epoch": 0.9815599139897049, "percentage": 98.18, "elapsed_time": "5:28:50", "remaining_time": "0:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 1918, "loss": 0.175, "learning_rate": 4.294834764274614e-09, "epoch": 0.9820811885058969, "percentage": 98.23, "elapsed_time": "5:29:00", "remaining_time": "0:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 1918, "loss": 0.1782, "learning_rate": 4.04597984484667e-09, "epoch": 0.982602463022089, "percentage": 98.28, "elapsed_time": "5:29:11", "remaining_time": "0:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 1918, "loss": 0.183, "learning_rate": 3.804545533126758e-09, "epoch": 0.9831237375382811, "percentage": 98.33, "elapsed_time": "5:29:21", "remaining_time": "0:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 1918, "loss": 0.1711, "learning_rate": 3.5705325469123644e-09, "epoch": 0.9836450120544732, "percentage": 98.38, "elapsed_time": "5:29:31", "remaining_time": "0:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 1918, "loss": 0.1839, "learning_rate": 3.3439415819369604e-09, "epoch": 0.9841662865706653, "percentage": 98.44, "elapsed_time": "5:29:43", "remaining_time": "0:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 1918, "loss": 0.1733, "learning_rate": 3.124773311867779e-09, "epoch": 0.9846875610868574, "percentage": 98.49, "elapsed_time": "5:29:53", "remaining_time": "0:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 1918, "loss": 0.1617, "learning_rate": 2.9130283883044285e-09, "epoch": 0.9852088356030495, "percentage": 98.54, "elapsed_time": "5:30:01", "remaining_time": "0:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 1918, "loss": 0.1814, "learning_rate": 2.70870744077556e-09, "epoch": 0.9857301101192415, "percentage": 98.59, "elapsed_time": "5:30:12", "remaining_time": "0:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 1918, "loss": 0.1815, "learning_rate": 2.5118110767388682e-09, "epoch": 0.9862513846354336, "percentage": 98.64, "elapsed_time": "5:30:22", "remaining_time": "0:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 1918, "loss": 0.1867, "learning_rate": 2.322339881577762e-09, "epoch": 0.9867726591516257, "percentage": 98.7, "elapsed_time": "5:30:33", "remaining_time": "0:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 1918, "loss": 0.1683, "learning_rate": 2.140294418600808e-09, "epoch": 0.9872939336678178, "percentage": 98.75, "elapsed_time": "5:30:43", "remaining_time": "0:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 1918, "loss": 0.1847, "learning_rate": 1.965675229038677e-09, "epoch": 0.9878152081840099, "percentage": 98.8, "elapsed_time": "5:30:53", "remaining_time": "0:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 1918, "loss": 0.1759, "learning_rate": 1.7984828320444236e-09, "epoch": 0.988336482700202, "percentage": 98.85, "elapsed_time": "5:31:04", "remaining_time": "0:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 1918, "loss": 0.1794, "learning_rate": 1.6387177246893205e-09, "epoch": 0.9888577572163941, "percentage": 98.91, "elapsed_time": "5:31:15", "remaining_time": "0:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 1918, "loss": 0.1804, "learning_rate": 1.486380381964525e-09, "epoch": 0.9893790317325861, "percentage": 98.96, "elapsed_time": "5:31:26", "remaining_time": "0:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 1918, "loss": 0.1828, "learning_rate": 1.3414712567769161e-09, "epoch": 0.9899003062487782, "percentage": 99.01, "elapsed_time": "5:31:38", "remaining_time": "0:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 1918, "loss": 0.1801, "learning_rate": 1.2039907799490935e-09, "epoch": 0.9904215807649703, "percentage": 99.06, "elapsed_time": "5:31:49", "remaining_time": "0:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 1918, "loss": 0.1755, "learning_rate": 1.0739393602185454e-09, "epoch": 0.9909428552811624, "percentage": 99.11, "elapsed_time": "5:32:00", "remaining_time": "0:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 1918, "loss": 0.1699, "learning_rate": 9.513173842348732e-10, "epoch": 0.9914641297973545, "percentage": 99.17, "elapsed_time": "5:32:10", "remaining_time": "0:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 1918, "loss": 0.2021, "learning_rate": 8.361252165597911e-10, "epoch": 0.9919854043135466, "percentage": 99.22, "elapsed_time": "5:32:21", "remaining_time": "0:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 1918, "loss": 0.1709, "learning_rate": 7.283631996662933e-10, "epoch": 0.9925066788297388, "percentage": 99.27, "elapsed_time": "5:32:32", "remaining_time": "0:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 1918, "loss": 0.1874, "learning_rate": 6.28031653936434e-10, "epoch": 0.9930279533459307, "percentage": 99.32, "elapsed_time": "5:32:43", "remaining_time": "0:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 1918, "loss": 0.1696, "learning_rate": 5.351308776613273e-10, "epoch": 0.9935492278621229, "percentage": 99.37, "elapsed_time": "5:32:53", "remaining_time": "0:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 1918, "loss": 0.1886, "learning_rate": 4.49661147040592e-10, "epoch": 0.994070502378315, "percentage": 99.43, "elapsed_time": "5:33:03", "remaining_time": "0:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 1918, "loss": 0.1804, "learning_rate": 3.7162271617985357e-10, "epoch": 0.9945917768945071, "percentage": 99.48, "elapsed_time": "5:33:14", "remaining_time": "0:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 1918, "loss": 0.1739, "learning_rate": 3.0101581709185424e-10, "epoch": 0.9951130514106992, "percentage": 99.53, "elapsed_time": "5:33:23", "remaining_time": "0:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 1918, "loss": 0.1751, "learning_rate": 2.3784065969451043e-10, "epoch": 0.9956343259268913, "percentage": 99.58, "elapsed_time": "5:33:34", "remaining_time": "0:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 1918, "loss": 0.1773, "learning_rate": 1.8209743181146766e-10, "epoch": 0.9961556004430834, "percentage": 99.64, "elapsed_time": "5:33:44", "remaining_time": "0:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 1918, "loss": 0.1898, "learning_rate": 1.3378629917015772e-10, "epoch": 0.9966768749592755, "percentage": 99.69, "elapsed_time": "5:33:54", "remaining_time": "0:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 1918, "loss": 0.2015, "learning_rate": 9.290740540207621e-11, "epoch": 0.9971981494754675, "percentage": 99.74, "elapsed_time": "5:34:05", "remaining_time": "0:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 1918, "loss": 0.1774, "learning_rate": 5.94608720427825e-11, "epoch": 0.9977194239916596, "percentage": 99.79, "elapsed_time": "5:34:15", "remaining_time": "0:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 1918, "loss": 0.1849, "learning_rate": 3.344679853023447e-11, "epoch": 0.9982406985078517, "percentage": 99.84, "elapsed_time": "5:34:27", "remaining_time": "0:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 1918, "loss": 0.1845, "learning_rate": 1.4865262205898678e-11, "epoch": 0.9987619730240438, "percentage": 99.9, "elapsed_time": "5:34:38", "remaining_time": "0:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 1918, "loss": 0.1807, "learning_rate": 3.716318313640166e-12, "epoch": 0.9992832475402359, "percentage": 99.95, "elapsed_time": "5:34:47", "remaining_time": "0:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 1918, "loss": 0.1743, "learning_rate": 0.0, "epoch": 0.999804522056428, "percentage": 100.0, "elapsed_time": "5:34:57", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 1918, "epoch": 0.999804522056428, "percentage": 100.0, "elapsed_time": "5:34:57", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}