| {"current_steps": 10, "total_steps": 3320, "loss": 1.3483, "lr": 3.0120481927710846e-06, "epoch": 0.015053156458744943, "percentage": 0.3, "elapsed_time": "0:01:16", "remaining_time": "7:03:14"} |
| {"current_steps": 20, "total_steps": 3320, "loss": 1.2949, "lr": 6.024096385542169e-06, "epoch": 0.030106312917489886, "percentage": 0.6, "elapsed_time": "0:02:32", "remaining_time": "6:59:21"} |
| {"current_steps": 30, "total_steps": 3320, "loss": 1.1399, "lr": 9.036144578313253e-06, "epoch": 0.04515946937623483, "percentage": 0.9, "elapsed_time": "0:03:47", "remaining_time": "6:56:29"} |
| {"current_steps": 40, "total_steps": 3320, "loss": 0.9064, "lr": 1.2048192771084338e-05, "epoch": 0.06021262583497977, "percentage": 1.2, "elapsed_time": "0:05:04", "remaining_time": "6:55:32"} |
| {"current_steps": 50, "total_steps": 3320, "loss": 0.4566, "lr": 1.5060240963855424e-05, "epoch": 0.07526578229372471, "percentage": 1.51, "elapsed_time": "0:06:19", "remaining_time": "6:53:37"} |
| {"current_steps": 50, "total_steps": 3320, "eval_loss": 0.31506142020225525, "epoch": 0.07526578229372471, "percentage": 1.51, "elapsed_time": "0:08:56", "remaining_time": "9:44:29"} |
| {"current_steps": 60, "total_steps": 3320, "loss": 0.2427, "lr": 1.8072289156626505e-05, "epoch": 0.09031893875246966, "percentage": 1.81, "elapsed_time": "0:10:16", "remaining_time": "9:17:51"} |
| {"current_steps": 70, "total_steps": 3320, "loss": 0.2342, "lr": 2.1084337349397593e-05, "epoch": 0.1053720952112146, "percentage": 2.11, "elapsed_time": "0:11:31", "remaining_time": "8:55:16"} |
| {"current_steps": 80, "total_steps": 3320, "loss": 0.1697, "lr": 2.4096385542168677e-05, "epoch": 0.12042525166995954, "percentage": 2.41, "elapsed_time": "0:12:47", "remaining_time": "8:37:51"} |
| {"current_steps": 90, "total_steps": 3320, "loss": 0.1242, "lr": 2.7108433734939758e-05, "epoch": 0.1354784081287045, "percentage": 2.71, "elapsed_time": "0:14:02", "remaining_time": "8:24:06"} |
| {"current_steps": 100, "total_steps": 3320, "loss": 0.1039, "lr": 3.012048192771085e-05, "epoch": 0.15053156458744943, "percentage": 3.01, "elapsed_time": "0:15:18", "remaining_time": "8:12:48"} |
| {"current_steps": 100, "total_steps": 3320, "eval_loss": 0.09335148334503174, "epoch": 0.15053156458744943, "percentage": 3.01, "elapsed_time": "0:17:55", "remaining_time": "9:37:01"} |
| {"current_steps": 110, "total_steps": 3320, "loss": 0.0837, "lr": 3.313253012048193e-05, "epoch": 0.16558472104619437, "percentage": 3.31, "elapsed_time": "0:19:15", "remaining_time": "9:21:50"} |
| {"current_steps": 120, "total_steps": 3320, "loss": 0.1008, "lr": 3.614457831325301e-05, "epoch": 0.18063787750493931, "percentage": 3.61, "elapsed_time": "0:20:30", "remaining_time": "9:07:01"} |
| {"current_steps": 130, "total_steps": 3320, "loss": 0.0816, "lr": 3.91566265060241e-05, "epoch": 0.19569103396368426, "percentage": 3.92, "elapsed_time": "0:21:46", "remaining_time": "8:54:17"} |
| {"current_steps": 140, "total_steps": 3320, "loss": 0.0828, "lr": 4.2168674698795186e-05, "epoch": 0.2107441904224292, "percentage": 4.22, "elapsed_time": "0:23:01", "remaining_time": "8:43:09"} |
| {"current_steps": 150, "total_steps": 3320, "loss": 0.0879, "lr": 4.5180722891566266e-05, "epoch": 0.22579734688117414, "percentage": 4.52, "elapsed_time": "0:24:17", "remaining_time": "8:33:21"} |
| {"current_steps": 150, "total_steps": 3320, "eval_loss": 0.07289445400238037, "epoch": 0.22579734688117414, "percentage": 4.52, "elapsed_time": "0:26:54", "remaining_time": "9:28:38"} |
| {"current_steps": 160, "total_steps": 3320, "loss": 0.0821, "lr": 4.8192771084337354e-05, "epoch": 0.2408505033399191, "percentage": 4.82, "elapsed_time": "0:28:14", "remaining_time": "9:17:51"} |
| {"current_steps": 170, "total_steps": 3320, "loss": 0.0799, "lr": 5.120481927710844e-05, "epoch": 0.25590365979866403, "percentage": 5.12, "elapsed_time": "0:29:30", "remaining_time": "9:06:47"} |
| {"current_steps": 180, "total_steps": 3320, "loss": 0.0729, "lr": 5.4216867469879516e-05, "epoch": 0.270956816257409, "percentage": 5.42, "elapsed_time": "0:30:46", "remaining_time": "8:56:50"} |
| {"current_steps": 190, "total_steps": 3320, "loss": 0.0699, "lr": 5.72289156626506e-05, "epoch": 0.2860099727161539, "percentage": 5.72, "elapsed_time": "0:32:02", "remaining_time": "8:47:44"} |
| {"current_steps": 200, "total_steps": 3320, "loss": 0.0684, "lr": 6.02409638554217e-05, "epoch": 0.30106312917489886, "percentage": 6.02, "elapsed_time": "0:33:18", "remaining_time": "8:39:32"} |
| {"current_steps": 200, "total_steps": 3320, "eval_loss": 0.06437338143587112, "epoch": 0.30106312917489886, "percentage": 6.02, "elapsed_time": "0:35:55", "remaining_time": "9:20:21"} |
| {"current_steps": 210, "total_steps": 3320, "loss": 0.0706, "lr": 6.325301204819278e-05, "epoch": 0.3161162856336438, "percentage": 6.33, "elapsed_time": "0:37:15", "remaining_time": "9:11:44"} |
| {"current_steps": 220, "total_steps": 3320, "loss": 0.066, "lr": 6.626506024096386e-05, "epoch": 0.33116944209238874, "percentage": 6.63, "elapsed_time": "0:38:30", "remaining_time": "9:02:41"} |
| {"current_steps": 230, "total_steps": 3320, "loss": 0.0741, "lr": 6.927710843373494e-05, "epoch": 0.3462225985511337, "percentage": 6.93, "elapsed_time": "0:39:46", "remaining_time": "8:54:23"} |
| {"current_steps": 240, "total_steps": 3320, "loss": 0.0612, "lr": 7.228915662650602e-05, "epoch": 0.36127575500987863, "percentage": 7.23, "elapsed_time": "0:41:02", "remaining_time": "8:46:37"} |
| {"current_steps": 250, "total_steps": 3320, "loss": 0.0696, "lr": 7.530120481927712e-05, "epoch": 0.3763289114686236, "percentage": 7.53, "elapsed_time": "0:42:18", "remaining_time": "8:39:26"} |
| {"current_steps": 250, "total_steps": 3320, "eval_loss": 0.060398537665605545, "epoch": 0.3763289114686236, "percentage": 7.53, "elapsed_time": "0:44:54", "remaining_time": "9:11:28"} |
| {"current_steps": 260, "total_steps": 3320, "loss": 0.0436, "lr": 7.83132530120482e-05, "epoch": 0.3913820679273685, "percentage": 7.83, "elapsed_time": "0:46:14", "remaining_time": "9:04:16"} |
| {"current_steps": 270, "total_steps": 3320, "loss": 0.0543, "lr": 8.132530120481928e-05, "epoch": 0.40643522438611346, "percentage": 8.13, "elapsed_time": "0:47:30", "remaining_time": "8:56:34"} |
| {"current_steps": 280, "total_steps": 3320, "loss": 0.0613, "lr": 8.433734939759037e-05, "epoch": 0.4214883808448584, "percentage": 8.43, "elapsed_time": "0:48:45", "remaining_time": "8:49:26"} |
| {"current_steps": 290, "total_steps": 3320, "loss": 0.0506, "lr": 8.734939759036145e-05, "epoch": 0.43654153730360334, "percentage": 8.73, "elapsed_time": "0:50:01", "remaining_time": "8:42:41"} |
| {"current_steps": 300, "total_steps": 3320, "loss": 0.064, "lr": 9.036144578313253e-05, "epoch": 0.4515946937623483, "percentage": 9.04, "elapsed_time": "0:51:17", "remaining_time": "8:36:16"} |
| {"current_steps": 300, "total_steps": 3320, "eval_loss": 0.053826671093702316, "epoch": 0.4515946937623483, "percentage": 9.04, "elapsed_time": "0:53:53", "remaining_time": "9:02:31"} |
| {"current_steps": 310, "total_steps": 3320, "loss": 0.0469, "lr": 9.337349397590361e-05, "epoch": 0.46664785022109323, "percentage": 9.34, "elapsed_time": "0:55:13", "remaining_time": "8:56:12"} |
| {"current_steps": 320, "total_steps": 3320, "loss": 0.0784, "lr": 9.638554216867471e-05, "epoch": 0.4817010066798382, "percentage": 9.64, "elapsed_time": "0:56:28", "remaining_time": "8:49:26"} |
| {"current_steps": 330, "total_steps": 3320, "loss": 0.056, "lr": 9.939759036144579e-05, "epoch": 0.4967541631385831, "percentage": 9.94, "elapsed_time": "0:57:44", "remaining_time": "8:43:07"} |
| {"current_steps": 340, "total_steps": 3320, "loss": 0.0396, "lr": 9.999823129264712e-05, "epoch": 0.5118073195973281, "percentage": 10.24, "elapsed_time": "0:58:59", "remaining_time": "8:37:02"} |
| {"current_steps": 350, "total_steps": 3320, "loss": 0.048, "lr": 9.999104613348688e-05, "epoch": 0.526860476056073, "percentage": 10.54, "elapsed_time": "1:00:15", "remaining_time": "8:31:16"} |
| {"current_steps": 350, "total_steps": 3320, "eval_loss": 0.055311419069767, "epoch": 0.526860476056073, "percentage": 10.54, "elapsed_time": "1:02:51", "remaining_time": "8:53:23"} |
| {"current_steps": 360, "total_steps": 3320, "loss": 0.0501, "lr": 9.997833477197385e-05, "epoch": 0.541913632514818, "percentage": 10.84, "elapsed_time": "1:04:11", "remaining_time": "8:47:46"} |
| {"current_steps": 370, "total_steps": 3320, "loss": 0.0474, "lr": 9.996009861327077e-05, "epoch": 0.5569667889735629, "percentage": 11.14, "elapsed_time": "1:05:26", "remaining_time": "8:41:44"} |
| {"current_steps": 380, "total_steps": 3320, "loss": 0.0538, "lr": 9.993633967327269e-05, "epoch": 0.5720199454323078, "percentage": 11.45, "elapsed_time": "1:06:42", "remaining_time": "8:36:02"} |
| {"current_steps": 390, "total_steps": 3320, "loss": 0.0417, "lr": 9.990706057838416e-05, "epoch": 0.5870731018910528, "percentage": 11.75, "elapsed_time": "1:07:57", "remaining_time": "8:30:33"} |
| {"current_steps": 400, "total_steps": 3320, "loss": 0.0568, "lr": 9.987226456522884e-05, "epoch": 0.6021262583497977, "percentage": 12.05, "elapsed_time": "1:09:12", "remaining_time": "8:25:15"} |
| {"current_steps": 400, "total_steps": 3320, "eval_loss": 0.05042395368218422, "epoch": 0.6021262583497977, "percentage": 12.05, "elapsed_time": "1:11:49", "remaining_time": "8:44:18"} |
| {"current_steps": 410, "total_steps": 3320, "loss": 0.0403, "lr": 9.983195548029173e-05, "epoch": 0.6171794148085427, "percentage": 12.35, "elapsed_time": "1:13:12", "remaining_time": "8:39:34"} |
| {"current_steps": 420, "total_steps": 3320, "loss": 0.0613, "lr": 9.9786137779494e-05, "epoch": 0.6322325712672876, "percentage": 12.65, "elapsed_time": "1:14:27", "remaining_time": "8:34:08"} |
| {"current_steps": 430, "total_steps": 3320, "loss": 0.0427, "lr": 9.973481652770038e-05, "epoch": 0.6472857277260325, "percentage": 12.95, "elapsed_time": "1:15:43", "remaining_time": "8:28:53"} |
| {"current_steps": 440, "total_steps": 3320, "loss": 0.0413, "lr": 9.967799739815925e-05, "epoch": 0.6623388841847775, "percentage": 13.25, "elapsed_time": "1:16:58", "remaining_time": "8:23:49"} |
| {"current_steps": 450, "total_steps": 3320, "loss": 0.0548, "lr": 9.961568667187556e-05, "epoch": 0.6773920406435224, "percentage": 13.55, "elapsed_time": "1:18:13", "remaining_time": "8:18:54"} |
| {"current_steps": 450, "total_steps": 3320, "eval_loss": 0.046242497861385345, "epoch": 0.6773920406435224, "percentage": 13.55, "elapsed_time": "1:20:50", "remaining_time": "8:35:34"} |
| {"current_steps": 460, "total_steps": 3320, "loss": 0.0444, "lr": 9.954789123691642e-05, "epoch": 0.6924451971022674, "percentage": 13.86, "elapsed_time": "1:22:10", "remaining_time": "8:30:56"} |
| {"current_steps": 470, "total_steps": 3320, "loss": 0.0486, "lr": 9.947461858764978e-05, "epoch": 0.7074983535610123, "percentage": 14.16, "elapsed_time": "1:23:26", "remaining_time": "8:25:55"} |
| {"current_steps": 480, "total_steps": 3320, "loss": 0.0423, "lr": 9.939587682391586e-05, "epoch": 0.7225515100197573, "percentage": 14.46, "elapsed_time": "1:24:41", "remaining_time": "8:21:07"} |
| {"current_steps": 490, "total_steps": 3320, "loss": 0.0604, "lr": 9.931167465013182e-05, "epoch": 0.7376046664785022, "percentage": 14.76, "elapsed_time": "1:25:57", "remaining_time": "8:16:27"} |
| {"current_steps": 500, "total_steps": 3320, "loss": 0.0387, "lr": 9.922202137432955e-05, "epoch": 0.7526578229372471, "percentage": 15.06, "elapsed_time": "1:27:13", "remaining_time": "8:11:54"} |
| {"current_steps": 500, "total_steps": 3320, "eval_loss": 0.04570082202553749, "epoch": 0.7526578229372471, "percentage": 15.06, "elapsed_time": "1:29:50", "remaining_time": "8:26:40"} |
| {"current_steps": 510, "total_steps": 3320, "loss": 0.0443, "lr": 9.912692690712665e-05, "epoch": 0.7677109793959921, "percentage": 15.36, "elapsed_time": "1:31:12", "remaining_time": "8:22:32"} |
| {"current_steps": 520, "total_steps": 3320, "loss": 0.0482, "lr": 9.902640176063103e-05, "epoch": 0.782764135854737, "percentage": 15.66, "elapsed_time": "1:32:28", "remaining_time": "8:17:55"} |
| {"current_steps": 530, "total_steps": 3320, "loss": 0.0529, "lr": 9.892045704727864e-05, "epoch": 0.797817292313482, "percentage": 15.96, "elapsed_time": "1:33:43", "remaining_time": "8:13:24"} |
| {"current_steps": 540, "total_steps": 3320, "loss": 0.0636, "lr": 9.880910447860527e-05, "epoch": 0.8128704487722269, "percentage": 16.27, "elapsed_time": "1:34:59", "remaining_time": "8:09:01"} |
| {"current_steps": 550, "total_steps": 3320, "loss": 0.0454, "lr": 9.869235636395177e-05, "epoch": 0.8279236052309719, "percentage": 16.57, "elapsed_time": "1:36:15", "remaining_time": "8:04:45"} |
| {"current_steps": 550, "total_steps": 3320, "eval_loss": 0.043903350830078125, "epoch": 0.8279236052309719, "percentage": 16.57, "elapsed_time": "1:38:52", "remaining_time": "8:17:57"} |
| {"current_steps": 560, "total_steps": 3320, "loss": 0.0639, "lr": 9.857022560910338e-05, "epoch": 0.8429767616897168, "percentage": 16.87, "elapsed_time": "1:40:12", "remaining_time": "8:13:51"} |
| {"current_steps": 570, "total_steps": 3320, "loss": 0.0414, "lr": 9.844272571486311e-05, "epoch": 0.8580299181484617, "percentage": 17.17, "elapsed_time": "1:41:27", "remaining_time": "8:09:31"} |
| {"current_steps": 580, "total_steps": 3320, "loss": 0.0569, "lr": 9.830987077555924e-05, "epoch": 0.8730830746072067, "percentage": 17.47, "elapsed_time": "1:42:43", "remaining_time": "8:05:17"} |
| {"current_steps": 590, "total_steps": 3320, "loss": 0.0629, "lr": 9.817167547748729e-05, "epoch": 0.8881362310659516, "percentage": 17.77, "elapsed_time": "1:43:59", "remaining_time": "8:01:10"} |
| {"current_steps": 600, "total_steps": 3320, "loss": 0.0343, "lr": 9.802815509728662e-05, "epoch": 0.9031893875246966, "percentage": 18.07, "elapsed_time": "1:45:15", "remaining_time": "7:57:09"} |
| {"current_steps": 600, "total_steps": 3320, "eval_loss": 0.042122405022382736, "epoch": 0.9031893875246966, "percentage": 18.07, "elapsed_time": "1:47:52", "remaining_time": "8:09:03"} |
| {"current_steps": 610, "total_steps": 3320, "loss": 0.0373, "lr": 9.787932550025158e-05, "epoch": 0.9182425439834415, "percentage": 18.37, "elapsed_time": "1:49:13", "remaining_time": "8:05:13"} |
| {"current_steps": 620, "total_steps": 3320, "loss": 0.0413, "lr": 9.772520313857775e-05, "epoch": 0.9332957004421865, "percentage": 18.67, "elapsed_time": "1:50:28", "remaining_time": "8:01:07"} |
| {"current_steps": 630, "total_steps": 3320, "loss": 0.0462, "lr": 9.756580504954334e-05, "epoch": 0.9483488569009314, "percentage": 18.98, "elapsed_time": "1:51:44", "remaining_time": "7:57:07"} |
| {"current_steps": 640, "total_steps": 3320, "loss": 0.047, "lr": 9.740114885362562e-05, "epoch": 0.9634020133596763, "percentage": 19.28, "elapsed_time": "1:53:00", "remaining_time": "7:53:14"} |
| {"current_steps": 650, "total_steps": 3320, "loss": 0.0363, "lr": 9.723125275255325e-05, "epoch": 0.9784551698184213, "percentage": 19.58, "elapsed_time": "1:54:16", "remaining_time": "7:49:24"} |
| {"current_steps": 650, "total_steps": 3320, "eval_loss": 0.0401780903339386, "epoch": 0.9784551698184213, "percentage": 19.58, "elapsed_time": "1:56:54", "remaining_time": "8:00:12"} |
| {"current_steps": 660, "total_steps": 3320, "loss": 0.0306, "lr": 9.705613552729415e-05, "epoch": 0.9935083262771662, "percentage": 19.88, "elapsed_time": "1:58:14", "remaining_time": "7:56:33"} |
| {"current_steps": 670, "total_steps": 3320, "loss": 0.0412, "lr": 9.68758165359794e-05, "epoch": 1.0085614827359113, "percentage": 20.18, "elapsed_time": "1:59:30", "remaining_time": "7:52:41"} |
| {"current_steps": 680, "total_steps": 3320, "loss": 0.0404, "lr": 9.669031571176322e-05, "epoch": 1.0236146391946561, "percentage": 20.48, "elapsed_time": "2:00:46", "remaining_time": "7:48:52"} |
| {"current_steps": 690, "total_steps": 3320, "loss": 0.0377, "lr": 9.64996535606196e-05, "epoch": 1.0386677956534012, "percentage": 20.78, "elapsed_time": "2:02:02", "remaining_time": "7:45:08"} |
| {"current_steps": 700, "total_steps": 3320, "loss": 0.0272, "lr": 9.630385115907545e-05, "epoch": 1.053720952112146, "percentage": 21.08, "elapsed_time": "2:03:18", "remaining_time": "7:41:30"} |
| {"current_steps": 700, "total_steps": 3320, "eval_loss": 0.04149024188518524, "epoch": 1.053720952112146, "percentage": 21.08, "elapsed_time": "2:05:56", "remaining_time": "7:51:21"} |
| {"current_steps": 710, "total_steps": 3320, "loss": 0.0345, "lr": 9.610293015188067e-05, "epoch": 1.068774108570891, "percentage": 21.39, "elapsed_time": "2:07:16", "remaining_time": "7:47:52"} |
| {"current_steps": 720, "total_steps": 3320, "loss": 0.0271, "lr": 9.589691274961556e-05, "epoch": 1.083827265029636, "percentage": 21.69, "elapsed_time": "2:08:32", "remaining_time": "7:44:09"} |
| {"current_steps": 730, "total_steps": 3320, "loss": 0.0437, "lr": 9.568582172623544e-05, "epoch": 1.098880421488381, "percentage": 21.99, "elapsed_time": "2:09:48", "remaining_time": "7:40:31"} |
| {"current_steps": 740, "total_steps": 3320, "loss": 0.0355, "lr": 9.546968041655326e-05, "epoch": 1.1139335779471258, "percentage": 22.29, "elapsed_time": "2:11:03", "remaining_time": "7:36:57"} |
| {"current_steps": 750, "total_steps": 3320, "loss": 0.0324, "lr": 9.524851271366001e-05, "epoch": 1.1289867344058706, "percentage": 22.59, "elapsed_time": "2:12:19", "remaining_time": "7:33:27"} |
| {"current_steps": 750, "total_steps": 3320, "eval_loss": 0.03844917565584183, "epoch": 1.1289867344058706, "percentage": 22.59, "elapsed_time": "2:14:58", "remaining_time": "7:42:29"} |
| {"current_steps": 760, "total_steps": 3320, "loss": 0.0288, "lr": 9.502234306628355e-05, "epoch": 1.1440398908646157, "percentage": 22.89, "elapsed_time": "2:16:18", "remaining_time": "7:39:09"} |
| {"current_steps": 770, "total_steps": 3320, "loss": 0.0327, "lr": 9.47911964760858e-05, "epoch": 1.1590930473233607, "percentage": 23.19, "elapsed_time": "2:17:34", "remaining_time": "7:35:37"} |
| {"current_steps": 780, "total_steps": 3320, "loss": 0.0284, "lr": 9.455509849489915e-05, "epoch": 1.1741462037821055, "percentage": 23.49, "elapsed_time": "2:18:50", "remaining_time": "7:32:08"} |
| {"current_steps": 790, "total_steps": 3320, "loss": 0.0361, "lr": 9.431407522190175e-05, "epoch": 1.1891993602408506, "percentage": 23.8, "elapsed_time": "2:20:06", "remaining_time": "7:28:43"} |
| {"current_steps": 800, "total_steps": 3320, "loss": 0.0394, "lr": 9.406815330073244e-05, "epoch": 1.2042525166995954, "percentage": 24.1, "elapsed_time": "2:21:23", "remaining_time": "7:25:21"} |
| {"current_steps": 800, "total_steps": 3320, "eval_loss": 0.042881306260824203, "epoch": 1.2042525166995954, "percentage": 24.1, "elapsed_time": "2:24:01", "remaining_time": "7:33:40"} |
| {"current_steps": 810, "total_steps": 3320, "loss": 0.0394, "lr": 9.381735991654546e-05, "epoch": 1.2193056731583405, "percentage": 24.4, "elapsed_time": "2:25:21", "remaining_time": "7:30:27"} |
| {"current_steps": 820, "total_steps": 3320, "loss": 0.038, "lr": 9.356172279300528e-05, "epoch": 1.2343588296170853, "percentage": 24.7, "elapsed_time": "2:26:38", "remaining_time": "7:27:03"} |
| {"current_steps": 830, "total_steps": 3320, "loss": 0.0351, "lr": 9.330127018922194e-05, "epoch": 1.2494119860758304, "percentage": 25.0, "elapsed_time": "2:27:54", "remaining_time": "7:23:42"} |
| {"current_steps": 840, "total_steps": 3320, "loss": 0.0379, "lr": 9.303603089662716e-05, "epoch": 1.2644651425345752, "percentage": 25.3, "elapsed_time": "2:29:10", "remaining_time": "7:20:25"} |
| {"current_steps": 850, "total_steps": 3320, "loss": 0.0297, "lr": 9.276603423579164e-05, "epoch": 1.2795182989933203, "percentage": 25.6, "elapsed_time": "2:30:26", "remaining_time": "7:17:10"} |
| {"current_steps": 850, "total_steps": 3320, "eval_loss": 0.04107122868299484, "epoch": 1.2795182989933203, "percentage": 25.6, "elapsed_time": "2:33:05", "remaining_time": "7:24:51"} |
| {"current_steps": 860, "total_steps": 3320, "loss": 0.0429, "lr": 9.249131005318387e-05, "epoch": 1.294571455452065, "percentage": 25.9, "elapsed_time": "2:34:26", "remaining_time": "7:21:45"} |
| {"current_steps": 870, "total_steps": 3320, "loss": 0.0349, "lr": 9.221188871787075e-05, "epoch": 1.30962461191081, "percentage": 26.2, "elapsed_time": "2:35:42", "remaining_time": "7:18:29"} |
| {"current_steps": 880, "total_steps": 3320, "loss": 0.037, "lr": 9.192780111816047e-05, "epoch": 1.324677768369555, "percentage": 26.51, "elapsed_time": "2:36:59", "remaining_time": "7:15:16"} |
| {"current_steps": 890, "total_steps": 3320, "loss": 0.0327, "lr": 9.163907865818806e-05, "epoch": 1.3397309248283, "percentage": 26.81, "elapsed_time": "2:38:15", "remaining_time": "7:12:05"} |
| {"current_steps": 900, "total_steps": 3320, "loss": 0.0423, "lr": 9.134575325444376e-05, "epoch": 1.3547840812870449, "percentage": 27.11, "elapsed_time": "2:39:31", "remaining_time": "7:08:56"} |
| {"current_steps": 900, "total_steps": 3320, "eval_loss": 0.03963349014520645, "epoch": 1.3547840812870449, "percentage": 27.11, "elapsed_time": "2:42:10", "remaining_time": "7:16:03"} |
| {"current_steps": 910, "total_steps": 3320, "loss": 0.0292, "lr": 9.104785733224496e-05, "epoch": 1.3698372377457897, "percentage": 27.41, "elapsed_time": "2:43:30", "remaining_time": "7:13:02"} |
| {"current_steps": 920, "total_steps": 3320, "loss": 0.0358, "lr": 9.07454238221517e-05, "epoch": 1.3848903942045347, "percentage": 27.71, "elapsed_time": "2:44:47", "remaining_time": "7:09:52"} |
| {"current_steps": 930, "total_steps": 3320, "loss": 0.0294, "lr": 9.043848615632642e-05, "epoch": 1.3999435506632798, "percentage": 28.01, "elapsed_time": "2:46:03", "remaining_time": "7:06:44"} |
| {"current_steps": 940, "total_steps": 3320, "loss": 0.0375, "lr": 9.012707826483823e-05, "epoch": 1.4149967071220246, "percentage": 28.31, "elapsed_time": "2:47:19", "remaining_time": "7:03:40"} |
| {"current_steps": 950, "total_steps": 3320, "loss": 0.0324, "lr": 8.98112345719122e-05, "epoch": 1.4300498635807695, "percentage": 28.61, "elapsed_time": "2:48:36", "remaining_time": "7:00:38"} |
| {"current_steps": 950, "total_steps": 3320, "eval_loss": 0.03718731552362442, "epoch": 1.4300498635807695, "percentage": 28.61, "elapsed_time": "2:51:15", "remaining_time": "7:07:14"} |
| {"current_steps": 960, "total_steps": 3320, "loss": 0.0385, "lr": 8.949098999212391e-05, "epoch": 1.4451030200395145, "percentage": 28.92, "elapsed_time": "2:52:35", "remaining_time": "7:04:18"} |
| {"current_steps": 970, "total_steps": 3320, "loss": 0.0321, "lr": 8.916637992653991e-05, "epoch": 1.4601561764982596, "percentage": 29.22, "elapsed_time": "2:53:52", "remaining_time": "7:01:13"} |
| {"current_steps": 980, "total_steps": 3320, "loss": 0.0299, "lr": 8.883744025880428e-05, "epoch": 1.4752093329570044, "percentage": 29.52, "elapsed_time": "2:55:08", "remaining_time": "6:58:11"} |
| {"current_steps": 990, "total_steps": 3320, "loss": 0.0304, "lr": 8.850420735117202e-05, "epoch": 1.4902624894157492, "percentage": 29.82, "elapsed_time": "2:56:24", "remaining_time": "6:55:11"} |
| {"current_steps": 1000, "total_steps": 3320, "loss": 0.0311, "lr": 8.816671804048933e-05, "epoch": 1.5053156458744943, "percentage": 30.12, "elapsed_time": "2:57:41", "remaining_time": "6:52:13"} |
| {"current_steps": 1000, "total_steps": 3320, "eval_loss": 0.03950938582420349, "epoch": 1.5053156458744943, "percentage": 30.12, "elapsed_time": "3:00:19", "remaining_time": "6:58:22"} |
| {"current_steps": 1010, "total_steps": 3320, "loss": 0.0358, "lr": 8.782500963412156e-05, "epoch": 1.5203688023332393, "percentage": 30.42, "elapsed_time": "3:01:40", "remaining_time": "6:55:30"} |
| {"current_steps": 1020, "total_steps": 3320, "loss": 0.029, "lr": 8.747911990582912e-05, "epoch": 1.5354219587919842, "percentage": 30.72, "elapsed_time": "3:02:56", "remaining_time": "6:52:32"} |
| {"current_steps": 1030, "total_steps": 3320, "loss": 0.0288, "lr": 8.712908709159183e-05, "epoch": 1.550475115250729, "percentage": 31.02, "elapsed_time": "3:04:13", "remaining_time": "6:49:35"} |
| {"current_steps": 1040, "total_steps": 3320, "loss": 0.0422, "lr": 8.677494988538211e-05, "epoch": 1.565528271709474, "percentage": 31.33, "elapsed_time": "3:05:29", "remaining_time": "6:46:40"} |
| {"current_steps": 1050, "total_steps": 3320, "loss": 0.0309, "lr": 8.641674743488769e-05, "epoch": 1.5805814281682191, "percentage": 31.63, "elapsed_time": "3:06:46", "remaining_time": "6:43:47"} |
| {"current_steps": 1050, "total_steps": 3320, "eval_loss": 0.04065566882491112, "epoch": 1.5805814281682191, "percentage": 31.63, "elapsed_time": "3:09:25", "remaining_time": "6:49:31"} |
| {"current_steps": 1060, "total_steps": 3320, "loss": 0.0377, "lr": 8.605451933718397e-05, "epoch": 1.595634584626964, "percentage": 31.93, "elapsed_time": "3:10:47", "remaining_time": "6:46:46"} |
| {"current_steps": 1070, "total_steps": 3320, "loss": 0.0387, "lr": 8.568830563435694e-05, "epoch": 1.6106877410857088, "percentage": 32.23, "elapsed_time": "3:12:03", "remaining_time": "6:43:51"} |
| {"current_steps": 1080, "total_steps": 3320, "loss": 0.0254, "lr": 8.531814680907664e-05, "epoch": 1.6257408975444538, "percentage": 32.53, "elapsed_time": "3:13:20", "remaining_time": "6:40:59"} |
| {"current_steps": 1090, "total_steps": 3320, "loss": 0.0284, "lr": 8.494408378012209e-05, "epoch": 1.6407940540031989, "percentage": 32.83, "elapsed_time": "3:14:36", "remaining_time": "6:38:08"} |
| {"current_steps": 1100, "total_steps": 3320, "loss": 0.0233, "lr": 8.456615789785804e-05, "epoch": 1.6558472104619437, "percentage": 33.13, "elapsed_time": "3:15:52", "remaining_time": "6:35:19"} |
| {"current_steps": 1100, "total_steps": 3320, "eval_loss": 0.03772934526205063, "epoch": 1.6558472104619437, "percentage": 33.13, "elapsed_time": "3:18:32", "remaining_time": "6:40:40"} |
| {"current_steps": 1110, "total_steps": 3320, "loss": 0.0445, "lr": 8.418441093966385e-05, "epoch": 1.6709003669206886, "percentage": 33.43, "elapsed_time": "3:19:52", "remaining_time": "6:37:56"} |
| {"current_steps": 1120, "total_steps": 3320, "loss": 0.029, "lr": 8.379888510531535e-05, "epoch": 1.6859535233794336, "percentage": 33.73, "elapsed_time": "3:21:08", "remaining_time": "6:35:06"} |
| {"current_steps": 1130, "total_steps": 3320, "loss": 0.0224, "lr": 8.340962301231981e-05, "epoch": 1.7010066798381787, "percentage": 34.04, "elapsed_time": "3:22:24", "remaining_time": "6:32:17"} |
| {"current_steps": 1140, "total_steps": 3320, "loss": 0.0311, "lr": 8.301666769120488e-05, "epoch": 1.7160598362969235, "percentage": 34.34, "elapsed_time": "3:23:41", "remaining_time": "6:29:31"} |
| {"current_steps": 1150, "total_steps": 3320, "loss": 0.0455, "lr": 8.262006258076187e-05, "epoch": 1.7311129927556683, "percentage": 34.64, "elapsed_time": "3:24:58", "remaining_time": "6:26:46"} |
| {"current_steps": 1150, "total_steps": 3320, "eval_loss": 0.035410501062870026, "epoch": 1.7311129927556683, "percentage": 34.64, "elapsed_time": "3:27:37", "remaining_time": "6:31:47"} |
| {"current_steps": 1160, "total_steps": 3320, "loss": 0.0307, "lr": 8.221985152324385e-05, "epoch": 1.7461661492144134, "percentage": 34.94, "elapsed_time": "3:28:58", "remaining_time": "6:29:07"} |
| {"current_steps": 1170, "total_steps": 3320, "loss": 0.0413, "lr": 8.18160787595191e-05, "epoch": 1.7612193056731584, "percentage": 35.24, "elapsed_time": "3:30:15", "remaining_time": "6:26:21"} |
| {"current_steps": 1180, "total_steps": 3320, "loss": 0.0364, "lr": 8.14087889241806e-05, "epoch": 1.7762724621319033, "percentage": 35.54, "elapsed_time": "3:31:32", "remaining_time": "6:23:37"} |
| {"current_steps": 1190, "total_steps": 3320, "loss": 0.0384, "lr": 8.099802704061195e-05, "epoch": 1.791325618590648, "percentage": 35.84, "elapsed_time": "3:32:48", "remaining_time": "6:20:55"} |
| {"current_steps": 1200, "total_steps": 3320, "loss": 0.0329, "lr": 8.058383851601027e-05, "epoch": 1.8063787750493931, "percentage": 36.14, "elapsed_time": "3:34:05", "remaining_time": "6:18:13"} |
| {"current_steps": 1200, "total_steps": 3320, "eval_loss": 0.03639229014515877, "epoch": 1.8063787750493931, "percentage": 36.14, "elapsed_time": "3:36:44", "remaining_time": "6:22:55"} |
| {"current_steps": 1210, "total_steps": 3320, "loss": 0.0289, "lr": 8.01662691363668e-05, "epoch": 1.8214319315081382, "percentage": 36.45, "elapsed_time": "3:38:05", "remaining_time": "6:20:18"} |
| {"current_steps": 1220, "total_steps": 3320, "loss": 0.0367, "lr": 7.974536506140547e-05, "epoch": 1.836485087966883, "percentage": 36.75, "elapsed_time": "3:39:21", "remaining_time": "6:17:35"} |
| {"current_steps": 1230, "total_steps": 3320, "loss": 0.0328, "lr": 7.932117281948021e-05, "epoch": 1.8515382444256279, "percentage": 37.05, "elapsed_time": "3:40:38", "remaining_time": "6:14:54"} |
| {"current_steps": 1240, "total_steps": 3320, "loss": 0.0343, "lr": 7.889373930243164e-05, "epoch": 1.866591400884373, "percentage": 37.35, "elapsed_time": "3:41:54", "remaining_time": "6:12:14"} |
| {"current_steps": 1250, "total_steps": 3320, "loss": 0.0352, "lr": 7.846311176040331e-05, "epoch": 1.881644557343118, "percentage": 37.65, "elapsed_time": "3:43:11", "remaining_time": "6:09:35"} |
| {"current_steps": 1250, "total_steps": 3320, "eval_loss": 0.035072676837444305, "epoch": 1.881644557343118, "percentage": 37.65, "elapsed_time": "3:45:50", "remaining_time": "6:14:00"} |
| {"current_steps": 1260, "total_steps": 3320, "loss": 0.0374, "lr": 7.802933779661859e-05, "epoch": 1.8966977138018628, "percentage": 37.95, "elapsed_time": "3:47:12", "remaining_time": "6:11:27"} |
| {"current_steps": 1270, "total_steps": 3320, "loss": 0.0307, "lr": 7.759246536211844e-05, "epoch": 1.9117508702606076, "percentage": 38.25, "elapsed_time": "3:48:28", "remaining_time": "6:08:47"} |
| {"current_steps": 1280, "total_steps": 3320, "loss": 0.0326, "lr": 7.715254275046062e-05, "epoch": 1.9268040267193527, "percentage": 38.55, "elapsed_time": "3:49:45", "remaining_time": "6:06:09"} |
| {"current_steps": 1290, "total_steps": 3320, "loss": 0.0297, "lr": 7.670961859238124e-05, "epoch": 1.9418571831780977, "percentage": 38.86, "elapsed_time": "3:51:01", "remaining_time": "6:03:33"} |
| {"current_steps": 1300, "total_steps": 3320, "loss": 0.029, "lr": 7.626374185041886e-05, "epoch": 1.9569103396368426, "percentage": 39.16, "elapsed_time": "3:52:18", "remaining_time": "6:00:58"} |
| {"current_steps": 1300, "total_steps": 3320, "eval_loss": 0.0350230410695076, "epoch": 1.9569103396368426, "percentage": 39.16, "elapsed_time": "3:54:58", "remaining_time": "6:05:07"} |
| {"current_steps": 1310, "total_steps": 3320, "loss": 0.0263, "lr": 7.581496181350203e-05, "epoch": 1.9719634960955874, "percentage": 39.46, "elapsed_time": "3:56:20", "remaining_time": "6:02:38"} |
| {"current_steps": 1320, "total_steps": 3320, "loss": 0.0281, "lr": 7.536332809150067e-05, "epoch": 1.9870166525543325, "percentage": 39.76, "elapsed_time": "3:57:37", "remaining_time": "6:00:02"} |
| {"current_steps": 1330, "total_steps": 3320, "loss": 0.0346, "lr": 7.490889060974201e-05, "epoch": 2.0020698090130775, "percentage": 40.06, "elapsed_time": "3:58:53", "remaining_time": "5:57:27"} |
| {"current_steps": 1340, "total_steps": 3320, "loss": 0.017, "lr": 7.445169960349167e-05, "epoch": 2.0171229654718226, "percentage": 40.36, "elapsed_time": "4:00:10", "remaining_time": "5:54:53"} |
| {"current_steps": 1350, "total_steps": 3320, "loss": 0.0187, "lr": 7.399180561240044e-05, "epoch": 2.032176121930567, "percentage": 40.66, "elapsed_time": "4:01:27", "remaining_time": "5:52:21"} |
| {"current_steps": 1350, "total_steps": 3320, "eval_loss": 0.03626255691051483, "epoch": 2.032176121930567, "percentage": 40.66, "elapsed_time": "4:04:07", "remaining_time": "5:56:14"} |
| {"current_steps": 1360, "total_steps": 3320, "loss": 0.0119, "lr": 7.352925947491746e-05, "epoch": 2.0472292783893122, "percentage": 40.96, "elapsed_time": "4:05:28", "remaining_time": "5:53:46"} |
| {"current_steps": 1370, "total_steps": 3320, "loss": 0.0175, "lr": 7.306411232267029e-05, "epoch": 2.0622824348480573, "percentage": 41.27, "elapsed_time": "4:06:45", "remaining_time": "5:51:13"} |
| {"current_steps": 1380, "total_steps": 3320, "loss": 0.0172, "lr": 7.259641557481269e-05, "epoch": 2.0773355913068023, "percentage": 41.57, "elapsed_time": "4:08:02", "remaining_time": "5:48:41"} |
| {"current_steps": 1390, "total_steps": 3320, "loss": 0.0146, "lr": 7.212622093234049e-05, "epoch": 2.092388747765547, "percentage": 41.87, "elapsed_time": "4:09:19", "remaining_time": "5:46:11"} |
| {"current_steps": 1400, "total_steps": 3320, "loss": 0.025, "lr": 7.165358037237643e-05, "epoch": 2.107441904224292, "percentage": 42.17, "elapsed_time": "4:10:36", "remaining_time": "5:43:41"} |
| {"current_steps": 1400, "total_steps": 3320, "eval_loss": 0.038006313145160675, "epoch": 2.107441904224292, "percentage": 42.17, "elapsed_time": "4:13:16", "remaining_time": "5:47:20"} |
| {"current_steps": 1410, "total_steps": 3320, "loss": 0.0249, "lr": 7.117854614242434e-05, "epoch": 2.122495060683037, "percentage": 42.47, "elapsed_time": "4:14:37", "remaining_time": "5:44:55"} |
| {"current_steps": 1420, "total_steps": 3320, "loss": 0.022, "lr": 7.070117075459352e-05, "epoch": 2.137548217141782, "percentage": 42.77, "elapsed_time": "4:15:54", "remaining_time": "5:42:25"} |
| {"current_steps": 1430, "total_steps": 3320, "loss": 0.0244, "lr": 7.022150697979384e-05, "epoch": 2.1526013736005267, "percentage": 43.07, "elapsed_time": "4:17:11", "remaining_time": "5:39:56"} |
| {"current_steps": 1440, "total_steps": 3320, "loss": 0.0283, "lr": 6.973960784190237e-05, "epoch": 2.167654530059272, "percentage": 43.37, "elapsed_time": "4:18:28", "remaining_time": "5:37:27"} |
| {"current_steps": 1450, "total_steps": 3320, "loss": 0.0209, "lr": 6.925552661190166e-05, "epoch": 2.182707686518017, "percentage": 43.67, "elapsed_time": "4:19:45", "remaining_time": "5:35:00"} |
| {"current_steps": 1450, "total_steps": 3320, "eval_loss": 0.03765711560845375, "epoch": 2.182707686518017, "percentage": 43.67, "elapsed_time": "4:22:25", "remaining_time": "5:38:26"} |
| {"current_steps": 1460, "total_steps": 3320, "loss": 0.0255, "lr": 6.876931680199121e-05, "epoch": 2.197760842976762, "percentage": 43.98, "elapsed_time": "4:23:46", "remaining_time": "5:36:03"} |
| {"current_steps": 1470, "total_steps": 3320, "loss": 0.0202, "lr": 6.828103215967186e-05, "epoch": 2.2128139994355065, "percentage": 44.28, "elapsed_time": "4:25:03", "remaining_time": "5:33:34"} |
| {"current_steps": 1480, "total_steps": 3320, "loss": 0.0266, "lr": 6.779072666180446e-05, "epoch": 2.2278671558942515, "percentage": 44.58, "elapsed_time": "4:26:20", "remaining_time": "5:31:07"} |
| {"current_steps": 1490, "total_steps": 3320, "loss": 0.0166, "lr": 6.729845450864294e-05, "epoch": 2.2429203123529966, "percentage": 44.88, "elapsed_time": "4:27:37", "remaining_time": "5:28:41"} |
| {"current_steps": 1500, "total_steps": 3320, "loss": 0.0224, "lr": 6.680427011784292e-05, "epoch": 2.257973468811741, "percentage": 45.18, "elapsed_time": "4:28:54", "remaining_time": "5:26:16"} |
| {"current_steps": 1500, "total_steps": 3320, "eval_loss": 0.0406508594751358, "epoch": 2.257973468811741, "percentage": 45.18, "elapsed_time": "4:31:34", "remaining_time": "5:29:31"} |
| {"current_steps": 1510, "total_steps": 3320, "loss": 0.0187, "lr": 6.630822811844604e-05, "epoch": 2.2730266252704863, "percentage": 45.48, "elapsed_time": "4:32:56", "remaining_time": "5:27:09"} |
| {"current_steps": 1520, "total_steps": 3320, "loss": 0.0234, "lr": 6.58103833448412e-05, "epoch": 2.2880797817292313, "percentage": 45.78, "elapsed_time": "4:34:13", "remaining_time": "5:24:43"} |
| {"current_steps": 1530, "total_steps": 3320, "loss": 0.0241, "lr": 6.531079083070288e-05, "epoch": 2.3031329381879764, "percentage": 46.08, "elapsed_time": "4:35:29", "remaining_time": "5:22:18"} |
| {"current_steps": 1540, "total_steps": 3320, "loss": 0.0174, "lr": 6.480950580290752e-05, "epoch": 2.3181860946467214, "percentage": 46.39, "elapsed_time": "4:36:46", "remaining_time": "5:19:54"} |
| {"current_steps": 1550, "total_steps": 3320, "loss": 0.0261, "lr": 6.430658367542843e-05, "epoch": 2.333239251105466, "percentage": 46.69, "elapsed_time": "4:38:03", "remaining_time": "5:17:31"} |
| {"current_steps": 1550, "total_steps": 3320, "eval_loss": 0.039291996508836746, "epoch": 2.333239251105466, "percentage": 46.69, "elapsed_time": "4:40:43", "remaining_time": "5:20:33"} |
| {"current_steps": 1560, "total_steps": 3320, "loss": 0.0239, "lr": 6.380208004321036e-05, "epoch": 2.348292407564211, "percentage": 46.99, "elapsed_time": "4:42:04", "remaining_time": "5:18:14"} |
| {"current_steps": 1570, "total_steps": 3320, "loss": 0.0182, "lr": 6.32960506760236e-05, "epoch": 2.363345564022956, "percentage": 47.29, "elapsed_time": "4:43:20", "remaining_time": "5:15:50"} |
| {"current_steps": 1580, "total_steps": 3320, "loss": 0.0169, "lr": 6.278855151229901e-05, "epoch": 2.378398720481701, "percentage": 47.59, "elapsed_time": "4:44:37", "remaining_time": "5:13:26"} |
| {"current_steps": 1590, "total_steps": 3320, "loss": 0.0126, "lr": 6.227963865294444e-05, "epoch": 2.393451876940446, "percentage": 47.89, "elapsed_time": "4:45:54", "remaining_time": "5:11:04"} |
| {"current_steps": 1600, "total_steps": 3320, "loss": 0.0156, "lr": 6.176936835514312e-05, "epoch": 2.408505033399191, "percentage": 48.19, "elapsed_time": "4:47:10", "remaining_time": "5:08:43"} |
| {"current_steps": 1600, "total_steps": 3320, "eval_loss": 0.038704484701156616, "epoch": 2.408505033399191, "percentage": 48.19, "elapsed_time": "4:49:51", "remaining_time": "5:11:35"} |
| {"current_steps": 1610, "total_steps": 3320, "loss": 0.0188, "lr": 6.125779702613471e-05, "epoch": 2.423558189857936, "percentage": 48.49, "elapsed_time": "4:51:12", "remaining_time": "5:09:17"} |
| {"current_steps": 1620, "total_steps": 3320, "loss": 0.0217, "lr": 6.074498121697983e-05, "epoch": 2.438611346316681, "percentage": 48.8, "elapsed_time": "4:52:29", "remaining_time": "5:06:56"} |
| {"current_steps": 1630, "total_steps": 3320, "loss": 0.0261, "lr": 6.023097761630879e-05, "epoch": 2.4536645027754256, "percentage": 49.1, "elapsed_time": "4:53:46", "remaining_time": "5:04:35"} |
| {"current_steps": 1640, "total_steps": 3320, "loss": 0.016, "lr": 5.971584304405489e-05, "epoch": 2.4687176592341706, "percentage": 49.4, "elapsed_time": "4:55:03", "remaining_time": "5:02:14"} |
| {"current_steps": 1650, "total_steps": 3320, "loss": 0.0173, "lr": 5.919963444517338e-05, "epoch": 2.4837708156929157, "percentage": 49.7, "elapsed_time": "4:56:20", "remaining_time": "4:59:55"} |
| {"current_steps": 1650, "total_steps": 3320, "eval_loss": 0.038775425404310226, "epoch": 2.4837708156929157, "percentage": 49.7, "elapsed_time": "4:59:00", "remaining_time": "5:02:37"} |
| {"current_steps": 1660, "total_steps": 3320, "loss": 0.0204, "lr": 5.868240888334653e-05, "epoch": 2.4988239721516607, "percentage": 50.0, "elapsed_time": "5:00:21", "remaining_time": "5:00:21"} |
| {"current_steps": 1670, "total_steps": 3320, "loss": 0.0163, "lr": 5.816422353467562e-05, "epoch": 2.5138771286104054, "percentage": 50.3, "elapsed_time": "5:01:38", "remaining_time": "4:58:01"} |
| {"current_steps": 1680, "total_steps": 3320, "loss": 0.0207, "lr": 5.7645135681360496e-05, "epoch": 2.5289302850691504, "percentage": 50.6, "elapsed_time": "5:02:54", "remaining_time": "4:55:42"} |
| {"current_steps": 1690, "total_steps": 3320, "loss": 0.0216, "lr": 5.7125202705367234e-05, "epoch": 2.5439834415278955, "percentage": 50.9, "elapsed_time": "5:04:11", "remaining_time": "4:53:23"} |
| {"current_steps": 1700, "total_steps": 3320, "loss": 0.0228, "lr": 5.660448208208513e-05, "epoch": 2.5590365979866405, "percentage": 51.2, "elapsed_time": "5:05:28", "remaining_time": "4:51:05"} |
| {"current_steps": 1700, "total_steps": 3320, "eval_loss": 0.03666573390364647, "epoch": 2.5590365979866405, "percentage": 51.2, "elapsed_time": "5:08:08", "remaining_time": "4:53:38"} |
| {"current_steps": 1710, "total_steps": 3320, "loss": 0.0169, "lr": 5.608303137397294e-05, "epoch": 2.574089754445385, "percentage": 51.51, "elapsed_time": "5:09:30", "remaining_time": "4:51:24"} |
| {"current_steps": 1720, "total_steps": 3320, "loss": 0.0218, "lr": 5.5560908224195886e-05, "epoch": 2.58914291090413, "percentage": 51.81, "elapsed_time": "5:10:47", "remaining_time": "4:49:06"} |
| {"current_steps": 1730, "total_steps": 3320, "loss": 0.0224, "lr": 5.503817035025342e-05, "epoch": 2.6041960673628752, "percentage": 52.11, "elapsed_time": "5:12:04", "remaining_time": "4:46:48"} |
| {"current_steps": 1740, "total_steps": 3320, "loss": 0.019, "lr": 5.4514875537598985e-05, "epoch": 2.61924922382162, "percentage": 52.41, "elapsed_time": "5:13:21", "remaining_time": "4:44:32"} |
| {"current_steps": 1750, "total_steps": 3320, "loss": 0.0328, "lr": 5.399108163325217e-05, "epoch": 2.634302380280365, "percentage": 52.71, "elapsed_time": "5:14:38", "remaining_time": "4:42:16"} |
| {"current_steps": 1750, "total_steps": 3320, "eval_loss": 0.037083230912685394, "epoch": 2.634302380280365, "percentage": 52.71, "elapsed_time": "5:17:18", "remaining_time": "4:44:40"} |
| {"current_steps": 1760, "total_steps": 3320, "loss": 0.0188, "lr": 5.346684653940408e-05, "epoch": 2.64935553673911, "percentage": 53.01, "elapsed_time": "5:18:40", "remaining_time": "4:42:27"} |
| {"current_steps": 1770, "total_steps": 3320, "loss": 0.0203, "lr": 5.294222820701661e-05, "epoch": 2.664408693197855, "percentage": 53.31, "elapsed_time": "5:19:57", "remaining_time": "4:40:11"} |
| {"current_steps": 1780, "total_steps": 3320, "loss": 0.0162, "lr": 5.24172846294163e-05, "epoch": 2.6794618496566, "percentage": 53.61, "elapsed_time": "5:21:13", "remaining_time": "4:37:55"} |
| {"current_steps": 1790, "total_steps": 3320, "loss": 0.018, "lr": 5.1892073835883524e-05, "epoch": 2.6945150061153447, "percentage": 53.92, "elapsed_time": "5:22:30", "remaining_time": "4:35:39"} |
| {"current_steps": 1800, "total_steps": 3320, "loss": 0.0264, "lr": 5.136665388523778e-05, "epoch": 2.7095681625740897, "percentage": 54.22, "elapsed_time": "5:23:47", "remaining_time": "4:33:25"} |
| {"current_steps": 1800, "total_steps": 3320, "eval_loss": 0.03928447514772415, "epoch": 2.7095681625740897, "percentage": 54.22, "elapsed_time": "5:26:27", "remaining_time": "4:35:40"} |
| {"current_steps": 1810, "total_steps": 3320, "loss": 0.0268, "lr": 5.0841082859419585e-05, "epoch": 2.7246213190328348, "percentage": 54.52, "elapsed_time": "5:27:49", "remaining_time": "4:33:29"} |
| {"current_steps": 1820, "total_steps": 3320, "loss": 0.0255, "lr": 5.031541885706987e-05, "epoch": 2.7396744754915794, "percentage": 54.82, "elapsed_time": "5:29:06", "remaining_time": "4:31:14"} |
| {"current_steps": 1830, "total_steps": 3320, "loss": 0.0214, "lr": 4.9789719987107545e-05, "epoch": 2.7547276319503244, "percentage": 55.12, "elapsed_time": "5:30:22", "remaining_time": "4:28:59"} |
| {"current_steps": 1840, "total_steps": 3320, "loss": 0.0207, "lr": 4.926404436230596e-05, "epoch": 2.7697807884090695, "percentage": 55.42, "elapsed_time": "5:31:39", "remaining_time": "4:26:46"} |
| {"current_steps": 1850, "total_steps": 3320, "loss": 0.0235, "lr": 4.8738450092868785e-05, "epoch": 2.7848339448678145, "percentage": 55.72, "elapsed_time": "5:32:56", "remaining_time": "4:24:33"} |
| {"current_steps": 1850, "total_steps": 3320, "eval_loss": 0.036392927169799805, "epoch": 2.7848339448678145, "percentage": 55.72, "elapsed_time": "5:35:36", "remaining_time": "4:26:40"} |
| {"current_steps": 1860, "total_steps": 3320, "loss": 0.0189, "lr": 4.8212995280006426e-05, "epoch": 2.7998871013265596, "percentage": 56.02, "elapsed_time": "5:36:58", "remaining_time": "4:24:30"} |
| {"current_steps": 1870, "total_steps": 3320, "loss": 0.0201, "lr": 4.76877380095132e-05, "epoch": 2.814940257785304, "percentage": 56.33, "elapsed_time": "5:38:14", "remaining_time": "4:22:16"} |
| {"current_steps": 1880, "total_steps": 3320, "loss": 0.0154, "lr": 4.7162736345346303e-05, "epoch": 2.8299934142440493, "percentage": 56.63, "elapsed_time": "5:39:31", "remaining_time": "4:20:03"} |
| {"current_steps": 1890, "total_steps": 3320, "loss": 0.0191, "lr": 4.663804832320726e-05, "epoch": 2.8450465707027943, "percentage": 56.93, "elapsed_time": "5:40:48", "remaining_time": "4:17:51"} |
| {"current_steps": 1900, "total_steps": 3320, "loss": 0.0204, "lr": 4.6113731944126406e-05, "epoch": 2.860099727161539, "percentage": 57.23, "elapsed_time": "5:42:06", "remaining_time": "4:15:40"} |
| {"current_steps": 1900, "total_steps": 3320, "eval_loss": 0.038577429950237274, "epoch": 2.860099727161539, "percentage": 57.23, "elapsed_time": "5:44:46", "remaining_time": "4:17:40"} |
|
|