| {"current_steps": 100, "total_steps": 24000, "loss": 3.9537, "learning_rate": 2.0833333333333333e-07, "epoch": 0.0416579879191835, "percentage": 0.42, "elapsed_time": "0:04:55", "remaining_time": "19:35:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 200, "total_steps": 24000, "loss": 0.4085, "learning_rate": 4.1666666666666667e-07, "epoch": 0.083315975838367, "percentage": 0.83, "elapsed_time": "0:09:40", "remaining_time": "19:10:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 300, "total_steps": 24000, "loss": 0.2146, "learning_rate": 6.25e-07, "epoch": 0.12497396375755052, "percentage": 1.25, "elapsed_time": "0:14:24", "remaining_time": "18:58:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 400, "total_steps": 24000, "loss": 0.2104, "learning_rate": 8.333333333333333e-07, "epoch": 0.166631951676734, "percentage": 1.67, "elapsed_time": "0:19:09", "remaining_time": "18:50:44", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 500, "total_steps": 24000, "loss": 0.2079, "learning_rate": 1.0416666666666667e-06, "epoch": 0.20828993959591752, "percentage": 2.08, "elapsed_time": "0:23:54", "remaining_time": "18:43:40", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 600, "total_steps": 24000, "loss": 0.2051, "learning_rate": 1.25e-06, "epoch": 0.24994792751510103, "percentage": 2.5, "elapsed_time": "0:28:38", "remaining_time": "18:37:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 700, "total_steps": 24000, "loss": 0.199, "learning_rate": 1.4583333333333335e-06, "epoch": 0.29160591543428455, "percentage": 2.92, "elapsed_time": "0:33:23", "remaining_time": "18:31:18", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 800, "total_steps": 24000, "loss": 0.1886, "learning_rate": 1.6666666666666667e-06, "epoch": 0.333263903353468, "percentage": 3.33, "elapsed_time": "0:38:07", "remaining_time": "18:25:38", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 900, "total_steps": 24000, "loss": 0.1839, "learning_rate": 1.8750000000000003e-06, "epoch": 0.3749218912726515, "percentage": 3.75, "elapsed_time": "0:42:51", "remaining_time": "18:20:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1000, "total_steps": 24000, "loss": 0.1823, "learning_rate": 2.0833333333333334e-06, "epoch": 0.41657987919183503, "percentage": 4.17, "elapsed_time": "0:47:36", "remaining_time": "18:14:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1100, "total_steps": 24000, "loss": 0.1814, "learning_rate": 2.2916666666666666e-06, "epoch": 0.45823786711101855, "percentage": 4.58, "elapsed_time": "0:52:20", "remaining_time": "18:09:37", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1200, "total_steps": 24000, "loss": 0.1809, "learning_rate": 2.5e-06, "epoch": 0.49989585503020206, "percentage": 5.0, "elapsed_time": "0:57:04", "remaining_time": "18:04:31", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1300, "total_steps": 24000, "loss": 0.1809, "learning_rate": 2.7083333333333334e-06, "epoch": 0.5415538429493856, "percentage": 5.42, "elapsed_time": "1:01:49", "remaining_time": "17:59:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1400, "total_steps": 24000, "loss": 0.1907, "learning_rate": 2.916666666666667e-06, "epoch": 0.5832118308685691, "percentage": 5.83, "elapsed_time": "1:06:33", "remaining_time": "17:54:19", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1500, "total_steps": 24000, "loss": 0.1809, "learning_rate": 3.125e-06, "epoch": 0.6248698187877526, "percentage": 6.25, "elapsed_time": "1:11:17", "remaining_time": "17:49:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1600, "total_steps": 24000, "loss": 0.1804, "learning_rate": 3.3333333333333333e-06, "epoch": 0.666527806706936, "percentage": 6.67, "elapsed_time": "1:16:01", "remaining_time": "17:44:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1700, "total_steps": 24000, "loss": 0.1803, "learning_rate": 3.5416666666666673e-06, "epoch": 0.7081857946261195, "percentage": 7.08, "elapsed_time": "1:20:46", "remaining_time": "17:39:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1800, "total_steps": 24000, "loss": 0.1807, "learning_rate": 3.7500000000000005e-06, "epoch": 0.749843782545303, "percentage": 7.5, "elapsed_time": "1:25:31", "remaining_time": "17:34:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 1900, "total_steps": 24000, "loss": 0.1806, "learning_rate": 3.958333333333333e-06, "epoch": 0.7915017704644866, "percentage": 7.92, "elapsed_time": "1:30:23", "remaining_time": "17:31:26", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2000, "total_steps": 24000, "loss": 0.1807, "learning_rate": 4.166666666666667e-06, "epoch": 0.8331597583836701, "percentage": 8.33, "elapsed_time": "1:35:08", "remaining_time": "17:26:28", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2100, "total_steps": 24000, "loss": 0.1805, "learning_rate": 4.3750000000000005e-06, "epoch": 0.8748177463028536, "percentage": 8.75, "elapsed_time": "1:39:52", "remaining_time": "17:21:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2200, "total_steps": 24000, "loss": 0.1806, "learning_rate": 4.583333333333333e-06, "epoch": 0.9164757342220371, "percentage": 9.17, "elapsed_time": "1:44:37", "remaining_time": "17:16:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2300, "total_steps": 24000, "loss": 0.1817, "learning_rate": 4.791666666666668e-06, "epoch": 0.9581337221412206, "percentage": 9.58, "elapsed_time": "1:49:22", "remaining_time": "17:11:51", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2400, "total_steps": 24000, "loss": 0.1855, "learning_rate": 5e-06, "epoch": 0.9997917100604041, "percentage": 10.0, "elapsed_time": "1:54:06", "remaining_time": "17:07:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2400, "total_steps": 24000, "eval_loss": 0.18077221512794495, "epoch": 0.9997917100604041, "percentage": 10.0, "elapsed_time": "1:57:24", "remaining_time": "17:36:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2500, "total_steps": 24000, "loss": 0.1804, "learning_rate": 4.999735579817769e-06, "epoch": 1.0414496979795875, "percentage": 10.42, "elapsed_time": "2:03:11", "remaining_time": "17:39:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2600, "total_steps": 24000, "loss": 0.18, "learning_rate": 4.998942375205502e-06, "epoch": 1.0831076858987712, "percentage": 10.83, "elapsed_time": "2:07:55", "remaining_time": "17:32:56", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2700, "total_steps": 24000, "loss": 0.1802, "learning_rate": 4.997620553954645e-06, "epoch": 1.1247656738179546, "percentage": 11.25, "elapsed_time": "2:12:40", "remaining_time": "17:26:39", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2800, "total_steps": 24000, "loss": 0.1803, "learning_rate": 4.995770395678171e-06, "epoch": 1.1664236617371382, "percentage": 11.67, "elapsed_time": "2:17:24", "remaining_time": "17:20:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 2900, "total_steps": 24000, "loss": 0.1801, "learning_rate": 4.993392291751431e-06, "epoch": 1.2080816496563216, "percentage": 12.08, "elapsed_time": "2:22:08", "remaining_time": "17:14:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3000, "total_steps": 24000, "loss": 0.18, "learning_rate": 4.990486745229364e-06, "epoch": 1.2497396375755052, "percentage": 12.5, "elapsed_time": "2:26:53", "remaining_time": "17:08:11", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3100, "total_steps": 24000, "loss": 0.1798, "learning_rate": 4.9870543707400835e-06, "epoch": 1.2913976254946886, "percentage": 12.92, "elapsed_time": "2:31:37", "remaining_time": "17:02:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3200, "total_steps": 24000, "loss": 0.1808, "learning_rate": 4.983095894354858e-06, "epoch": 1.333055613413872, "percentage": 13.33, "elapsed_time": "2:36:22", "remaining_time": "16:56:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3300, "total_steps": 24000, "loss": 0.1802, "learning_rate": 4.978612153434527e-06, "epoch": 1.3747136013330556, "percentage": 13.75, "elapsed_time": "2:41:06", "remaining_time": "16:50:35", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3400, "total_steps": 24000, "loss": 0.1799, "learning_rate": 4.973604096452361e-06, "epoch": 1.416371589252239, "percentage": 14.17, "elapsed_time": "2:45:50", "remaining_time": "16:44:49", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3500, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.968072782793436e-06, "epoch": 1.4580295771714227, "percentage": 14.58, "elapsed_time": "2:50:34", "remaining_time": "16:39:07", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3600, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.962019382530521e-06, "epoch": 1.499687565090606, "percentage": 15.0, "elapsed_time": "2:55:19", "remaining_time": "16:33:27", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3700, "total_steps": 24000, "loss": 0.1799, "learning_rate": 4.955445176176577e-06, "epoch": 1.5413455530097897, "percentage": 15.42, "elapsed_time": "3:00:02", "remaining_time": "16:27:49", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3800, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.948351554413879e-06, "epoch": 1.583003540928973, "percentage": 15.83, "elapsed_time": "3:04:46", "remaining_time": "16:22:13", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 3900, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.9407400177998335e-06, "epoch": 1.6246615288481565, "percentage": 16.25, "elapsed_time": "3:09:30", "remaining_time": "16:16:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4000, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.93261217644956e-06, "epoch": 1.6663195167673401, "percentage": 16.67, "elapsed_time": "3:14:14", "remaining_time": "16:11:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4100, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.9239697496952904e-06, "epoch": 1.7079775046865238, "percentage": 17.08, "elapsed_time": "3:18:58", "remaining_time": "16:05:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4200, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.914814565722671e-06, "epoch": 1.7496354926057072, "percentage": 17.5, "elapsed_time": "3:23:41", "remaining_time": "16:00:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4300, "total_steps": 24000, "loss": 0.1801, "learning_rate": 4.905148561184033e-06, "epoch": 1.7912934805248906, "percentage": 17.92, "elapsed_time": "3:28:25", "remaining_time": "15:54:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4400, "total_steps": 24000, "loss": 0.18, "learning_rate": 4.894973780788722e-06, "epoch": 1.8329514684440742, "percentage": 18.33, "elapsed_time": "3:33:09", "remaining_time": "15:49:29", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4500, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.884292376870567e-06, "epoch": 1.8746094563632578, "percentage": 18.75, "elapsed_time": "3:37:53", "remaining_time": "15:44:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4600, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.873106608932585e-06, "epoch": 1.916267444282441, "percentage": 19.17, "elapsed_time": "3:42:36", "remaining_time": "15:38:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4700, "total_steps": 24000, "loss": 0.1799, "learning_rate": 4.861418843169012e-06, "epoch": 1.9579254322016246, "percentage": 19.58, "elapsed_time": "3:47:20", "remaining_time": "15:33:33", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4800, "total_steps": 24000, "loss": 0.1879, "learning_rate": 4.849231551964771e-06, "epoch": 1.9995834201208083, "percentage": 20.0, "elapsed_time": "3:52:03", "remaining_time": "15:28:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4801, "total_steps": 24000, "eval_loss": 0.1797732561826706, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "3:55:23", "remaining_time": "15:41:18", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 4900, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.836547313372472e-06, "epoch": 2.041241408039992, "percentage": 20.42, "elapsed_time": "4:05:18", "remaining_time": "15:56:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5000, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.823368810567056e-06, "epoch": 2.082899395959175, "percentage": 20.83, "elapsed_time": "4:10:01", "remaining_time": "15:50:07", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5100, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.809698831278217e-06, "epoch": 2.1245573838783587, "percentage": 21.25, "elapsed_time": "4:14:45", "remaining_time": "15:44:06", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5200, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.7955402672006855e-06, "epoch": 2.1662153717975423, "percentage": 21.67, "elapsed_time": "4:19:29", "remaining_time": "15:38:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5300, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.780896113382536e-06, "epoch": 2.2078733597167255, "percentage": 22.08, "elapsed_time": "4:24:13", "remaining_time": "15:32:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5400, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.765769467591626e-06, "epoch": 2.249531347635909, "percentage": 22.5, "elapsed_time": "4:28:56", "remaining_time": "15:26:22", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5500, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.750163529660303e-06, "epoch": 2.2911893355550927, "percentage": 22.92, "elapsed_time": "4:33:40", "remaining_time": "15:20:31", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5600, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.734081600808531e-06, "epoch": 2.3328473234742764, "percentage": 23.33, "elapsed_time": "4:38:23", "remaining_time": "15:14:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5700, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.717527082945555e-06, "epoch": 2.3745053113934596, "percentage": 23.75, "elapsed_time": "4:43:07", "remaining_time": "15:08:58", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5800, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.700503477950278e-06, "epoch": 2.416163299312643, "percentage": 24.17, "elapsed_time": "4:47:51", "remaining_time": "15:03:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 5900, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.6830143869304904e-06, "epoch": 2.457821287231827, "percentage": 24.58, "elapsed_time": "4:52:35", "remaining_time": "14:57:37", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6000, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.665063509461098e-06, "epoch": 2.4994792751510104, "percentage": 25.0, "elapsed_time": "4:57:19", "remaining_time": "14:51:59", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6100, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.646654642801533e-06, "epoch": 2.5411372630701936, "percentage": 25.42, "elapsed_time": "5:02:03", "remaining_time": "14:46:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6200, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.627791681092499e-06, "epoch": 2.5827952509893772, "percentage": 25.83, "elapsed_time": "5:06:48", "remaining_time": "14:40:49", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6300, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.608478614532215e-06, "epoch": 2.624453238908561, "percentage": 26.25, "elapsed_time": "5:11:32", "remaining_time": "14:35:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6400, "total_steps": 24000, "loss": 0.1797, "learning_rate": 4.588719528532342e-06, "epoch": 2.666111226827744, "percentage": 26.67, "elapsed_time": "5:16:16", "remaining_time": "14:29:45", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6500, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.568518602853776e-06, "epoch": 2.7077692147469277, "percentage": 27.08, "elapsed_time": "5:21:00", "remaining_time": "14:24:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6600, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.54788011072248e-06, "epoch": 2.7494272026661113, "percentage": 27.5, "elapsed_time": "5:25:44", "remaining_time": "14:18:47", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6700, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.526808417925531e-06, "epoch": 2.791085190585295, "percentage": 27.92, "elapsed_time": "5:30:28", "remaining_time": "14:13:19", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6800, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.50530798188761e-06, "epoch": 2.832743178504478, "percentage": 28.33, "elapsed_time": "5:35:12", "remaining_time": "14:07:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 6900, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.4833833507280884e-06, "epoch": 2.8744011664236617, "percentage": 28.75, "elapsed_time": "5:39:55", "remaining_time": "14:02:25", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7000, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.46103916229894e-06, "epoch": 2.9160591543428453, "percentage": 29.17, "elapsed_time": "5:44:38", "remaining_time": "13:57:00", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7100, "total_steps": 24000, "loss": 0.1836, "learning_rate": 4.438280143203665e-06, "epoch": 2.9577171422620285, "percentage": 29.58, "elapsed_time": "5:49:22", "remaining_time": "13:51:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7200, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.415111107797445e-06, "epoch": 2.999375130181212, "percentage": 30.0, "elapsed_time": "5:54:06", "remaining_time": "13:46:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7201, "total_steps": 24000, "eval_loss": 0.17931845784187317, "epoch": 2.9997917100604043, "percentage": 30.0, "elapsed_time": "5:57:27", "remaining_time": "13:53:54", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7300, "total_steps": 24000, "loss": 0.1795, "learning_rate": 4.391536957168733e-06, "epoch": 3.041033118100396, "percentage": 30.42, "elapsed_time": "6:03:13", "remaining_time": "13:50:56", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7400, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.367562678102491e-06, "epoch": 3.0826911060195794, "percentage": 30.83, "elapsed_time": "6:07:57", "remaining_time": "13:45:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7500, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.34319334202531e-06, "epoch": 3.1243490939387626, "percentage": 31.25, "elapsed_time": "6:12:41", "remaining_time": "13:39:54", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7600, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.318434103932622e-06, "epoch": 3.166007081857946, "percentage": 31.67, "elapsed_time": "6:17:25", "remaining_time": "13:34:26", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7700, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.293290201298224e-06, "epoch": 3.20766506977713, "percentage": 32.08, "elapsed_time": "6:22:09", "remaining_time": "13:28:58", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7800, "total_steps": 24000, "loss": 0.1792, "learning_rate": 4.267766952966369e-06, "epoch": 3.2493230576963135, "percentage": 32.5, "elapsed_time": "6:26:53", "remaining_time": "13:23:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 7900, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.241869758026638e-06, "epoch": 3.2909810456154966, "percentage": 32.92, "elapsed_time": "6:31:37", "remaining_time": "13:18:06", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8000, "total_steps": 24000, "loss": 0.1791, "learning_rate": 4.215604094671835e-06, "epoch": 3.3326390335346803, "percentage": 33.33, "elapsed_time": "6:36:20", "remaining_time": "13:12:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8100, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.188975519039151e-06, "epoch": 3.374297021453864, "percentage": 33.75, "elapsed_time": "6:41:04", "remaining_time": "13:07:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8200, "total_steps": 24000, "loss": 0.1796, "learning_rate": 4.161989664034844e-06, "epoch": 3.4159550093730475, "percentage": 34.17, "elapsed_time": "6:45:47", "remaining_time": "13:01:53", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8300, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.134652238142674e-06, "epoch": 3.4576129972922307, "percentage": 34.58, "elapsed_time": "6:50:31", "remaining_time": "12:56:31", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8400, "total_steps": 24000, "loss": 0.1793, "learning_rate": 4.106969024216348e-06, "epoch": 3.4992709852114143, "percentage": 35.0, "elapsed_time": "6:55:15", "remaining_time": "12:51:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8500, "total_steps": 24000, "loss": 0.1792, "learning_rate": 4.078945878256244e-06, "epoch": 3.540928973130598, "percentage": 35.42, "elapsed_time": "6:59:59", "remaining_time": "12:45:51", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8600, "total_steps": 24000, "loss": 0.1794, "learning_rate": 4.0505887281706505e-06, "epoch": 3.582586961049781, "percentage": 35.83, "elapsed_time": "7:04:43", "remaining_time": "12:40:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8700, "total_steps": 24000, "loss": 0.1798, "learning_rate": 4.021903572521802e-06, "epoch": 3.6242449489689648, "percentage": 36.25, "elapsed_time": "7:09:27", "remaining_time": "12:35:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8800, "total_steps": 24000, "loss": 0.1794, "learning_rate": 3.992896479256966e-06, "epoch": 3.6659029368881484, "percentage": 36.67, "elapsed_time": "7:14:11", "remaining_time": "12:29:57", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 8900, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.963573584424852e-06, "epoch": 3.707560924807332, "percentage": 37.08, "elapsed_time": "7:18:55", "remaining_time": "12:24:40", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9000, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.933941090877615e-06, "epoch": 3.749218912726515, "percentage": 37.5, "elapsed_time": "7:23:38", "remaining_time": "12:19:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9100, "total_steps": 24000, "loss": 0.1794, "learning_rate": 3.9040052669587325e-06, "epoch": 3.790876900645699, "percentage": 37.92, "elapsed_time": "7:28:21", "remaining_time": "12:14:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9200, "total_steps": 24000, "loss": 0.1794, "learning_rate": 3.8737724451770155e-06, "epoch": 3.8325348885648824, "percentage": 38.33, "elapsed_time": "7:33:05", "remaining_time": "12:08:53", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9300, "total_steps": 24000, "loss": 0.1794, "learning_rate": 3.8432490208670605e-06, "epoch": 3.8741928764840656, "percentage": 38.75, "elapsed_time": "7:37:49", "remaining_time": "12:03:39", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9400, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.8124414508364005e-06, "epoch": 3.9158508644032493, "percentage": 39.17, "elapsed_time": "7:42:32", "remaining_time": "11:58:25", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9500, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.7813562519996633e-06, "epoch": 3.957508852322433, "percentage": 39.58, "elapsed_time": "7:47:16", "remaining_time": "11:53:12", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9600, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.7500000000000005e-06, "epoch": 3.9991668402416165, "percentage": 40.0, "elapsed_time": "7:52:00", "remaining_time": "11:48:00", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9602, "total_steps": 24000, "eval_loss": 0.1792728751897812, "epoch": 4.0, "percentage": 40.01, "elapsed_time": "7:55:21", "remaining_time": "11:52:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9700, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.7183793278181063e-06, "epoch": 4.0408248281608, "percentage": 40.42, "elapsed_time": "8:09:15", "remaining_time": "12:01:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9800, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.6865009243691015e-06, "epoch": 4.082482816079984, "percentage": 40.83, "elapsed_time": "8:13:59", "remaining_time": "11:55:46", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 9900, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.654371533087586e-06, "epoch": 4.1241408039991665, "percentage": 41.25, "elapsed_time": "8:18:43", "remaining_time": "11:50:18", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10000, "total_steps": 24000, "loss": 0.1791, "learning_rate": 3.621997950501156e-06, "epoch": 4.16579879191835, "percentage": 41.67, "elapsed_time": "8:23:27", "remaining_time": "11:44:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10100, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.5893870247926986e-06, "epoch": 4.207456779837534, "percentage": 42.08, "elapsed_time": "8:28:11", "remaining_time": "11:39:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10200, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.556545654351749e-06, "epoch": 4.249114767756717, "percentage": 42.5, "elapsed_time": "8:32:55", "remaining_time": "11:33:57", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10300, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.5234807863152316e-06, "epoch": 4.290772755675901, "percentage": 42.92, "elapsed_time": "8:37:39", "remaining_time": "11:28:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10400, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.4901994150978926e-06, "epoch": 4.332430743595085, "percentage": 43.33, "elapsed_time": "8:42:23", "remaining_time": "11:23:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10500, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.4567085809127247e-06, "epoch": 4.374088731514268, "percentage": 43.75, "elapsed_time": "8:47:07", "remaining_time": "11:17:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10600, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.4230153682817112e-06, "epoch": 4.415746719433451, "percentage": 44.17, "elapsed_time": "8:51:51", "remaining_time": "11:12:20", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10700, "total_steps": 24000, "loss": 0.1791, "learning_rate": 3.389126904537192e-06, "epoch": 4.457404707352635, "percentage": 44.58, "elapsed_time": "8:56:34", "remaining_time": "11:06:58", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10800, "total_steps": 24000, "loss": 0.1791, "learning_rate": 3.3550503583141726e-06, "epoch": 4.499062695271818, "percentage": 45.0, "elapsed_time": "9:01:18", "remaining_time": "11:01:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 10900, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.3207929380339034e-06, "epoch": 4.540720683191002, "percentage": 45.42, "elapsed_time": "9:06:02", "remaining_time": "10:56:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11000, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.2863618903790346e-06, "epoch": 4.5823786711101855, "percentage": 45.83, "elapsed_time": "9:10:46", "remaining_time": "10:50:54", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11100, "total_steps": 24000, "loss": 0.1795, "learning_rate": 3.2517644987606827e-06, "epoch": 4.624036659029369, "percentage": 46.25, "elapsed_time": "9:15:30", "remaining_time": "10:45:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11200, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.217008081777726e-06, "epoch": 4.665694646948553, "percentage": 46.67, "elapsed_time": "9:20:13", "remaining_time": "10:40:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11300, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.182099991668653e-06, "epoch": 4.7073526348677355, "percentage": 47.08, "elapsed_time": "9:24:57", "remaining_time": "10:34:57", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11400, "total_steps": 24000, "loss": 0.1793, "learning_rate": 3.147047612756302e-06, "epoch": 4.749010622786919, "percentage": 47.5, "elapsed_time": "9:29:41", "remaining_time": "10:29:39", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11500, "total_steps": 24000, "loss": 0.1791, "learning_rate": 3.1118583598858097e-06, "epoch": 4.790668610706103, "percentage": 47.92, "elapsed_time": "9:34:24", "remaining_time": "10:24:21", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11600, "total_steps": 24000, "loss": 0.179, "learning_rate": 3.0765396768561005e-06, "epoch": 4.832326598625286, "percentage": 48.33, "elapsed_time": "9:39:08", "remaining_time": "10:19:04", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11700, "total_steps": 24000, "loss": 0.1792, "learning_rate": 3.0410990348452572e-06, "epoch": 4.87398458654447, "percentage": 48.75, "elapsed_time": "9:43:51", "remaining_time": "10:13:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11800, "total_steps": 24000, "loss": 0.179, "learning_rate": 3.0055439308300954e-06, "epoch": 4.915642574463654, "percentage": 49.17, "elapsed_time": "9:48:35", "remaining_time": "10:08:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 11900, "total_steps": 24000, "loss": 0.1792, "learning_rate": 2.96988188600028e-06, "epoch": 4.957300562382837, "percentage": 49.58, "elapsed_time": "9:53:18", "remaining_time": "10:03:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12000, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.9341204441673267e-06, "epoch": 4.998958550302021, "percentage": 50.0, "elapsed_time": "9:58:02", "remaining_time": "9:58:02", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12002, "total_steps": 24000, "eval_loss": 0.179093137383461, "epoch": 4.999791710060404, "percentage": 50.01, "elapsed_time": "10:01:26", "remaining_time": "10:01:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12100, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.898267170168807e-06, "epoch": 5.040616538221204, "percentage": 50.42, "elapsed_time": "10:14:01", "remaining_time": "10:03:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12200, "total_steps": 24000, "loss": 0.1789, "learning_rate": 2.862329648268117e-06, "epoch": 5.082274526140387, "percentage": 50.83, "elapsed_time": "10:18:45", "remaining_time": "9:58:27", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12300, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.82631548055013e-06, "epoch": 5.123932514059571, "percentage": 51.25, "elapsed_time": "10:23:28", "remaining_time": "9:53:04", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12400, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.7902322853130758e-06, "epoch": 5.1655905019787545, "percentage": 51.67, "elapsed_time": "10:28:12", "remaining_time": "9:47:40", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12500, "total_steps": 24000, "loss": 0.1792, "learning_rate": 2.754087695457005e-06, "epoch": 5.207248489897938, "percentage": 52.08, "elapsed_time": "10:32:56", "remaining_time": "9:42:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12600, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.717889356869146e-06, "epoch": 5.248906477817122, "percentage": 52.5, "elapsed_time": "10:37:39", "remaining_time": "9:36:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12700, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.681644926806527e-06, "epoch": 5.290564465736305, "percentage": 52.92, "elapsed_time": "10:42:22", "remaining_time": "9:31:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12800, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.6453620722761897e-06, "epoch": 5.332222453655488, "percentage": 53.33, "elapsed_time": "10:47:06", "remaining_time": "9:26:13", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 12900, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.6090484684133406e-06, "epoch": 5.373880441574672, "percentage": 53.75, "elapsed_time": "10:51:50", "remaining_time": "9:20:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13000, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.572711796857779e-06, "epoch": 5.415538429493855, "percentage": 54.17, "elapsed_time": "10:56:33", "remaining_time": "9:15:33", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13100, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.5363597441289574e-06, "epoch": 5.457196417413039, "percentage": 54.58, "elapsed_time": "11:01:17", "remaining_time": "9:10:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13200, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.5e-06, "epoch": 5.498854405332223, "percentage": 55.0, "elapsed_time": "11:06:01", "remaining_time": "9:04:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13300, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.4636402558710434e-06, "epoch": 5.540512393251406, "percentage": 55.42, "elapsed_time": "11:10:45", "remaining_time": "8:59:37", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13400, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.4272882031422216e-06, "epoch": 5.58217038117059, "percentage": 55.83, "elapsed_time": "11:15:28", "remaining_time": "8:54:19", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13500, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.3909515315866606e-06, "epoch": 5.6238283690897735, "percentage": 56.25, "elapsed_time": "11:20:12", "remaining_time": "8:49:02", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13600, "total_steps": 24000, "loss": 0.1789, "learning_rate": 2.3546379277238107e-06, "epoch": 5.665486357008956, "percentage": 56.67, "elapsed_time": "11:24:55", "remaining_time": "8:43:46", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13700, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.318355073193474e-06, "epoch": 5.70714434492814, "percentage": 57.08, "elapsed_time": "11:29:39", "remaining_time": "8:38:30", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13800, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.2821106431308546e-06, "epoch": 5.7488023328473234, "percentage": 57.5, "elapsed_time": "11:34:23", "remaining_time": "8:33:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 13900, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.2459123045429953e-06, "epoch": 5.790460320766507, "percentage": 57.92, "elapsed_time": "11:39:06", "remaining_time": "8:27:59", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14000, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.2097677146869242e-06, "epoch": 5.832118308685691, "percentage": 58.33, "elapsed_time": "11:43:50", "remaining_time": "8:22:44", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14100, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.173684519449872e-06, "epoch": 5.873776296604874, "percentage": 58.75, "elapsed_time": "11:48:34", "remaining_time": "8:17:30", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14200, "total_steps": 24000, "loss": 0.1789, "learning_rate": 2.1376703517318835e-06, "epoch": 5.915434284524057, "percentage": 59.17, "elapsed_time": "11:53:18", "remaining_time": "8:12:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14300, "total_steps": 24000, "loss": 0.179, "learning_rate": 2.101732829831194e-06, "epoch": 5.957092272443241, "percentage": 59.58, "elapsed_time": "11:58:02", "remaining_time": "8:07:03", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14400, "total_steps": 24000, "loss": 0.1789, "learning_rate": 2.0658795558326745e-06, "epoch": 5.998750260362424, "percentage": 60.0, "elapsed_time": "12:02:46", "remaining_time": "8:01:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14403, "total_steps": 24000, "eval_loss": 0.17907081544399261, "epoch": 6.0, "percentage": 60.01, "elapsed_time": "12:06:10", "remaining_time": "8:03:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14500, "total_steps": 24000, "loss": 0.1791, "learning_rate": 2.0301181139997206e-06, "epoch": 6.040408248281608, "percentage": 60.42, "elapsed_time": "12:11:45", "remaining_time": "7:59:25", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14600, "total_steps": 24000, "loss": 0.179, "learning_rate": 1.994456069169906e-06, "epoch": 6.082066236200792, "percentage": 60.83, "elapsed_time": "12:16:29", "remaining_time": "7:54:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14700, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.958900965154743e-06, "epoch": 6.123724224119975, "percentage": 61.25, "elapsed_time": "12:21:13", "remaining_time": "7:48:56", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14800, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.9234603231439e-06, "epoch": 6.165382212039159, "percentage": 61.67, "elapsed_time": "12:25:56", "remaining_time": "7:43:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 14900, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.8881416401141905e-06, "epoch": 6.207040199958342, "percentage": 62.08, "elapsed_time": "12:30:40", "remaining_time": "7:38:27", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15000, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.852952387243698e-06, "epoch": 6.248698187877525, "percentage": 62.5, "elapsed_time": "12:35:23", "remaining_time": "7:33:14", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15100, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.8179000083313483e-06, "epoch": 6.290356175796709, "percentage": 62.92, "elapsed_time": "12:40:07", "remaining_time": "7:28:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15200, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.7829919182222752e-06, "epoch": 6.332014163715892, "percentage": 63.33, "elapsed_time": "12:44:50", "remaining_time": "7:22:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15300, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.7482355012393177e-06, "epoch": 6.373672151635076, "percentage": 63.75, "elapsed_time": "12:49:34", "remaining_time": "7:17:35", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15400, "total_steps": 24000, "loss": 0.179, "learning_rate": 1.7136381096209665e-06, "epoch": 6.41533013955426, "percentage": 64.17, "elapsed_time": "12:54:17", "remaining_time": "7:12:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15500, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.6792070619660977e-06, "epoch": 6.456988127473443, "percentage": 64.58, "elapsed_time": "12:59:01", "remaining_time": "7:07:12", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15600, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.6449496416858285e-06, "epoch": 6.498646115392627, "percentage": 65.0, "elapsed_time": "13:03:45", "remaining_time": "7:02:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15700, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.6108730954628093e-06, "epoch": 6.54030410331181, "percentage": 65.42, "elapsed_time": "13:08:28", "remaining_time": "6:56:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15800, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.5769846317182894e-06, "epoch": 6.581962091230993, "percentage": 65.83, "elapsed_time": "13:13:12", "remaining_time": "6:51:40", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 15900, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.5432914190872757e-06, "epoch": 6.623620079150177, "percentage": 66.25, "elapsed_time": "13:17:56", "remaining_time": "6:46:30", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16000, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.509800584902108e-06, "epoch": 6.6652780670693605, "percentage": 66.67, "elapsed_time": "13:22:40", "remaining_time": "6:41:20", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16100, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.4765192136847686e-06, "epoch": 6.706936054988544, "percentage": 67.08, "elapsed_time": "13:27:24", "remaining_time": "6:36:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16200, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.443454345648252e-06, "epoch": 6.748594042907728, "percentage": 67.5, "elapsed_time": "13:32:08", "remaining_time": "6:31:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16300, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.4106129752073023e-06, "epoch": 6.790252030826911, "percentage": 67.92, "elapsed_time": "13:36:52", "remaining_time": "6:25:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16400, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.3780020494988447e-06, "epoch": 6.831910018746095, "percentage": 68.33, "elapsed_time": "13:41:35", "remaining_time": "6:20:44", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16500, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.3456284669124159e-06, "epoch": 6.873568006665278, "percentage": 68.75, "elapsed_time": "13:46:19", "remaining_time": "6:15:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16600, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.313499075630899e-06, "epoch": 6.915225994584461, "percentage": 69.17, "elapsed_time": "13:51:03", "remaining_time": "6:10:28", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16700, "total_steps": 24000, "loss": 0.1788, "learning_rate": 1.2816206721818944e-06, "epoch": 6.956883982503645, "percentage": 69.58, "elapsed_time": "13:55:47", "remaining_time": "6:05:20", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16800, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.2500000000000007e-06, "epoch": 6.998541970422829, "percentage": 70.0, "elapsed_time": "14:00:31", "remaining_time": "6:00:13", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16803, "total_steps": 24000, "eval_loss": 0.17890912294387817, "epoch": 6.999791710060404, "percentage": 70.01, "elapsed_time": "14:03:57", "remaining_time": "6:01:29", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 16900, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.218643748000337e-06, "epoch": 7.040199958342012, "percentage": 70.42, "elapsed_time": "14:17:21", "remaining_time": "6:00:11", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17000, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.1875585491636e-06, "epoch": 7.081857946261196, "percentage": 70.83, "elapsed_time": "14:22:05", "remaining_time": "5:54:58", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17100, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.1567509791329402e-06, "epoch": 7.123515934180379, "percentage": 71.25, "elapsed_time": "14:26:49", "remaining_time": "5:49:46", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17200, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.1262275548229852e-06, "epoch": 7.165173922099562, "percentage": 71.67, "elapsed_time": "14:31:33", "remaining_time": "5:44:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17300, "total_steps": 24000, "loss": 0.1789, "learning_rate": 1.0959947330412681e-06, "epoch": 7.206831910018746, "percentage": 72.08, "elapsed_time": "14:36:17", "remaining_time": "5:39:22", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17400, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.0660589091223854e-06, "epoch": 7.2484898979379295, "percentage": 72.5, "elapsed_time": "14:41:00", "remaining_time": "5:34:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17500, "total_steps": 24000, "loss": 0.1787, "learning_rate": 1.0364264155751489e-06, "epoch": 7.290147885857113, "percentage": 72.92, "elapsed_time": "14:45:44", "remaining_time": "5:28:59", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17600, "total_steps": 24000, "loss": 0.1786, "learning_rate": 1.0071035207430352e-06, "epoch": 7.331805873776297, "percentage": 73.33, "elapsed_time": "14:50:28", "remaining_time": "5:23:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17700, "total_steps": 24000, "loss": 0.1786, "learning_rate": 9.780964274781984e-07, "epoch": 7.37346386169548, "percentage": 73.75, "elapsed_time": "14:55:12", "remaining_time": "5:18:37", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17800, "total_steps": 24000, "loss": 0.1787, "learning_rate": 9.494112718293503e-07, "epoch": 7.415121849614664, "percentage": 74.17, "elapsed_time": "14:59:56", "remaining_time": "5:13:27", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 17900, "total_steps": 24000, "loss": 0.1787, "learning_rate": 9.210541217437566e-07, "epoch": 7.456779837533847, "percentage": 74.58, "elapsed_time": "15:04:40", "remaining_time": "5:08:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18000, "total_steps": 24000, "loss": 0.1785, "learning_rate": 8.930309757836517e-07, "epoch": 7.49843782545303, "percentage": 75.0, "elapsed_time": "15:09:23", "remaining_time": "5:03:07", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18100, "total_steps": 24000, "loss": 0.1786, "learning_rate": 8.653477618573261e-07, "epoch": 7.540095813372214, "percentage": 75.42, "elapsed_time": "15:14:07", "remaining_time": "4:57:58", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18200, "total_steps": 24000, "loss": 0.1786, "learning_rate": 8.380103359651554e-07, "epoch": 7.581753801291398, "percentage": 75.83, "elapsed_time": "15:18:51", "remaining_time": "4:52:49", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18300, "total_steps": 24000, "loss": 0.1786, "learning_rate": 8.110244809608494e-07, "epoch": 7.623411789210581, "percentage": 76.25, "elapsed_time": "15:23:34", "remaining_time": "4:47:40", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18400, "total_steps": 24000, "loss": 0.1786, "learning_rate": 7.843959053281663e-07, "epoch": 7.665069777129765, "percentage": 76.67, "elapsed_time": "15:28:18", "remaining_time": "4:42:31", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18500, "total_steps": 24000, "loss": 0.1785, "learning_rate": 7.581302419733633e-07, "epoch": 7.7067277650489485, "percentage": 77.08, "elapsed_time": "15:33:02", "remaining_time": "4:37:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18600, "total_steps": 24000, "loss": 0.1786, "learning_rate": 7.322330470336314e-07, "epoch": 7.748385752968131, "percentage": 77.5, "elapsed_time": "15:37:46", "remaining_time": "4:32:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18700, "total_steps": 24000, "loss": 0.1786, "learning_rate": 7.067097987017762e-07, "epoch": 7.790043740887315, "percentage": 77.92, "elapsed_time": "15:42:30", "remaining_time": "4:27:07", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18800, "total_steps": 24000, "loss": 0.1786, "learning_rate": 6.815658960673782e-07, "epoch": 7.8317017288064985, "percentage": 78.33, "elapsed_time": "15:47:14", "remaining_time": "4:22:00", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 18900, "total_steps": 24000, "loss": 0.1785, "learning_rate": 6.568066579746901e-07, "epoch": 7.873359716725682, "percentage": 78.75, "elapsed_time": "15:51:57", "remaining_time": "4:16:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19000, "total_steps": 24000, "loss": 0.1786, "learning_rate": 6.324373218975105e-07, "epoch": 7.915017704644866, "percentage": 79.17, "elapsed_time": "15:56:41", "remaining_time": "4:11:45", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19100, "total_steps": 24000, "loss": 0.1785, "learning_rate": 6.084630428312679e-07, "epoch": 7.956675692564049, "percentage": 79.58, "elapsed_time": "16:01:25", "remaining_time": "4:06:38", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19200, "total_steps": 24000, "loss": 0.1787, "learning_rate": 5.848888922025553e-07, "epoch": 7.998333680483233, "percentage": 80.0, "elapsed_time": "16:06:09", "remaining_time": "4:01:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19204, "total_steps": 24000, "eval_loss": 0.17885753512382507, "epoch": 8.0, "percentage": 80.02, "elapsed_time": "16:09:37", "remaining_time": "4:02:09", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19300, "total_steps": 24000, "loss": 0.1782, "learning_rate": 5.617198567963353e-07, "epoch": 8.039991668402417, "percentage": 80.42, "elapsed_time": "16:17:37", "remaining_time": "3:58:04", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19400, "total_steps": 24000, "loss": 0.1782, "learning_rate": 5.389608377010608e-07, "epoch": 8.0816496563216, "percentage": 80.83, "elapsed_time": "16:22:21", "remaining_time": "3:52:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19500, "total_steps": 24000, "loss": 0.1782, "learning_rate": 5.166166492719124e-07, "epoch": 8.123307644240784, "percentage": 81.25, "elapsed_time": "16:27:05", "remaining_time": "3:47:47", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19600, "total_steps": 24000, "loss": 0.1781, "learning_rate": 4.946920181123904e-07, "epoch": 8.164965632159968, "percentage": 81.67, "elapsed_time": "16:31:49", "remaining_time": "3:42:39", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19700, "total_steps": 24000, "loss": 0.1781, "learning_rate": 4.7319158207446953e-07, "epoch": 8.20662362007915, "percentage": 82.08, "elapsed_time": "16:36:33", "remaining_time": "3:37:31", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19800, "total_steps": 24000, "loss": 0.1781, "learning_rate": 4.5211988927752026e-07, "epoch": 8.248281607998333, "percentage": 82.5, "elapsed_time": "16:41:17", "remaining_time": "3:32:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 19900, "total_steps": 24000, "loss": 0.1781, "learning_rate": 4.3148139714622365e-07, "epoch": 8.289939595917517, "percentage": 82.92, "elapsed_time": "16:46:01", "remaining_time": "3:27:16", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20000, "total_steps": 24000, "loss": 0.178, "learning_rate": 4.1128047146765936e-07, "epoch": 8.3315975838367, "percentage": 83.33, "elapsed_time": "16:50:45", "remaining_time": "3:22:09", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20100, "total_steps": 24000, "loss": 0.178, "learning_rate": 3.915213854677863e-07, "epoch": 8.373255571755884, "percentage": 83.75, "elapsed_time": "16:55:28", "remaining_time": "3:17:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20200, "total_steps": 24000, "loss": 0.178, "learning_rate": 3.722083189075007e-07, "epoch": 8.414913559675067, "percentage": 84.17, "elapsed_time": "17:00:12", "remaining_time": "3:11:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20300, "total_steps": 24000, "loss": 0.178, "learning_rate": 3.5334535719846767e-07, "epoch": 8.456571547594251, "percentage": 84.58, "elapsed_time": "17:04:55", "remaining_time": "3:06:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20400, "total_steps": 24000, "loss": 0.178, "learning_rate": 3.3493649053890325e-07, "epoch": 8.498229535513435, "percentage": 85.0, "elapsed_time": "17:09:39", "remaining_time": "3:01:42", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20500, "total_steps": 24000, "loss": 0.1782, "learning_rate": 3.1698561306951065e-07, "epoch": 8.539887523432618, "percentage": 85.42, "elapsed_time": "17:14:22", "remaining_time": "2:56:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20600, "total_steps": 24000, "loss": 0.1779, "learning_rate": 2.9949652204972257e-07, "epoch": 8.581545511351802, "percentage": 85.83, "elapsed_time": "17:19:06", "remaining_time": "2:51:30", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20700, "total_steps": 24000, "loss": 0.1777, "learning_rate": 2.8247291705444575e-07, "epoch": 8.623203499270986, "percentage": 86.25, "elapsed_time": "17:23:50", "remaining_time": "2:46:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20800, "total_steps": 24000, "loss": 0.1779, "learning_rate": 2.6591839919146963e-07, "epoch": 8.66486148719017, "percentage": 86.67, "elapsed_time": "17:28:34", "remaining_time": "2:41:19", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20900, "total_steps": 24000, "loss": 0.1781, "learning_rate": 2.4983647033969714e-07, "epoch": 8.706519475109353, "percentage": 87.08, "elapsed_time": "17:33:17", "remaining_time": "2:36:13", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21000, "total_steps": 24000, "loss": 0.178, "learning_rate": 2.3423053240837518e-07, "epoch": 8.748177463028536, "percentage": 87.5, "elapsed_time": "17:38:02", "remaining_time": "2:31:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21100, "total_steps": 24000, "loss": 0.178, "learning_rate": 2.1910388661746495e-07, "epoch": 8.78983545094772, "percentage": 87.92, "elapsed_time": "17:42:45", "remaining_time": "2:26:04", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21200, "total_steps": 24000, "loss": 0.178, "learning_rate": 2.044597327993153e-07, "epoch": 8.831493438866902, "percentage": 88.33, "elapsed_time": "17:47:29", "remaining_time": "2:20:59", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21300, "total_steps": 24000, "loss": 0.1779, "learning_rate": 1.9030116872178317e-07, "epoch": 8.873151426786086, "percentage": 88.75, "elapsed_time": "17:52:13", "remaining_time": "2:15:54", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21400, "total_steps": 24000, "loss": 0.178, "learning_rate": 1.7663118943294367e-07, "epoch": 8.91480941470527, "percentage": 89.17, "elapsed_time": "17:56:57", "remaining_time": "2:10:50", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21500, "total_steps": 24000, "loss": 0.178, "learning_rate": 1.6345268662752904e-07, "epoch": 8.956467402624453, "percentage": 89.58, "elapsed_time": "18:01:41", "remaining_time": "2:05:46", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21600, "total_steps": 24000, "loss": 0.1779, "learning_rate": 1.507684480352292e-07, "epoch": 8.998125390543636, "percentage": 90.0, "elapsed_time": "18:06:25", "remaining_time": "2:00:42", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21604, "total_steps": 24000, "eval_loss": 0.17924286425113678, "epoch": 8.999791710060403, "percentage": 90.02, "elapsed_time": "18:09:54", "remaining_time": "2:00:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21700, "total_steps": 24000, "loss": 0.1766, "learning_rate": 1.3858115683098832e-07, "epoch": 9.03978337846282, "percentage": 90.42, "elapsed_time": "18:15:13", "remaining_time": "1:56:05", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21800, "total_steps": 24000, "loss": 0.1763, "learning_rate": 1.2689339106741529e-07, "epoch": 9.081441366382004, "percentage": 90.83, "elapsed_time": "18:19:57", "remaining_time": "1:51:00", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 21900, "total_steps": 24000, "loss": 0.1764, "learning_rate": 1.1570762312943295e-07, "epoch": 9.123099354301187, "percentage": 91.25, "elapsed_time": "18:24:41", "remaining_time": "1:45:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22000, "total_steps": 24000, "loss": 0.1763, "learning_rate": 1.0502621921127776e-07, "epoch": 9.164757342220371, "percentage": 91.67, "elapsed_time": "18:29:24", "remaining_time": "1:40:51", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22100, "total_steps": 24000, "loss": 0.1764, "learning_rate": 9.485143881596715e-08, "epoch": 9.206415330139555, "percentage": 92.08, "elapsed_time": "18:34:08", "remaining_time": "1:35:47", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22200, "total_steps": 24000, "loss": 0.1763, "learning_rate": 8.518543427732951e-08, "epoch": 9.248073318058738, "percentage": 92.5, "elapsed_time": "18:38:52", "remaining_time": "1:30:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22300, "total_steps": 24000, "loss": 0.1762, "learning_rate": 7.603025030471001e-08, "epoch": 9.289731305977922, "percentage": 92.92, "elapsed_time": "18:43:36", "remaining_time": "1:25:39", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22400, "total_steps": 24000, "loss": 0.1766, "learning_rate": 6.738782355044048e-08, "epoch": 9.331389293897105, "percentage": 93.33, "elapsed_time": "18:48:21", "remaining_time": "1:20:35", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22500, "total_steps": 24000, "loss": 0.1763, "learning_rate": 5.92599822001666e-08, "epoch": 9.373047281816289, "percentage": 93.75, "elapsed_time": "18:53:04", "remaining_time": "1:15:32", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22600, "total_steps": 24000, "loss": 0.1762, "learning_rate": 5.164844558612131e-08, "epoch": 9.414705269735471, "percentage": 94.17, "elapsed_time": "18:57:48", "remaining_time": "1:10:29", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22700, "total_steps": 24000, "loss": 0.1764, "learning_rate": 4.455482382342336e-08, "epoch": 9.456363257654655, "percentage": 94.58, "elapsed_time": "19:02:32", "remaining_time": "1:05:25", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22800, "total_steps": 24000, "loss": 0.1764, "learning_rate": 3.798061746947995e-08, "epoch": 9.498021245573838, "percentage": 95.0, "elapsed_time": "19:07:16", "remaining_time": "1:00:22", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 22900, "total_steps": 24000, "loss": 0.1763, "learning_rate": 3.1927217206564884e-08, "epoch": 9.539679233493022, "percentage": 95.42, "elapsed_time": "19:12:00", "remaining_time": "0:55:20", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23000, "total_steps": 24000, "loss": 0.1761, "learning_rate": 2.6395903547638825e-08, "epoch": 9.581337221412205, "percentage": 95.83, "elapsed_time": "19:16:43", "remaining_time": "0:50:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23100, "total_steps": 24000, "loss": 0.1761, "learning_rate": 2.1387846565474047e-08, "epoch": 9.622995209331389, "percentage": 96.25, "elapsed_time": "19:21:27", "remaining_time": "0:45:15", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23200, "total_steps": 24000, "loss": 0.1761, "learning_rate": 1.6904105645142443e-08, "epoch": 9.664653197250573, "percentage": 96.67, "elapsed_time": "19:26:11", "remaining_time": "0:40:12", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23300, "total_steps": 24000, "loss": 0.1763, "learning_rate": 1.2945629259917547e-08, "epoch": 9.706311185169756, "percentage": 97.08, "elapsed_time": "19:30:55", "remaining_time": "0:35:10", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23400, "total_steps": 24000, "loss": 0.1763, "learning_rate": 9.513254770636138e-09, "epoch": 9.74796917308894, "percentage": 97.5, "elapsed_time": "19:35:39", "remaining_time": "0:30:08", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23500, "total_steps": 24000, "loss": 0.1762, "learning_rate": 6.607708248569378e-09, "epoch": 9.789627161008124, "percentage": 97.92, "elapsed_time": "19:40:23", "remaining_time": "0:25:06", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23600, "total_steps": 24000, "loss": 0.1762, "learning_rate": 4.229604321829561e-09, "epoch": 9.831285148927307, "percentage": 98.33, "elapsed_time": "19:45:06", "remaining_time": "0:20:05", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23700, "total_steps": 24000, "loss": 0.1763, "learning_rate": 2.3794460453555046e-09, "epoch": 9.87294313684649, "percentage": 98.75, "elapsed_time": "19:49:50", "remaining_time": "0:15:03", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23800, "total_steps": 24000, "loss": 0.1763, "learning_rate": 1.0576247944985018e-09, "epoch": 9.914601124765674, "percentage": 99.17, "elapsed_time": "19:54:33", "remaining_time": "0:10:02", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 23900, "total_steps": 24000, "loss": 0.1762, "learning_rate": 2.6442018223132857e-10, "epoch": 9.956259112684858, "percentage": 99.58, "elapsed_time": "19:59:17", "remaining_time": "0:05:01", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 24000, "total_steps": 24000, "loss": 0.1763, "learning_rate": 0.0, "epoch": 9.997917100604042, "percentage": 100.0, "elapsed_time": "20:04:01", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} |
|
|