sedrickkeh's picture
Training in progress, epoch 3
d66923a verified
{"current_steps": 10, "total_steps": 1364, "loss": 0.8133, "learning_rate": 5e-06, "epoch": 0.029261155815654718, "percentage": 0.73, "elapsed_time": "0:04:28", "remaining_time": "10:06:41"}
{"current_steps": 20, "total_steps": 1364, "loss": 0.74, "learning_rate": 5e-06, "epoch": 0.058522311631309436, "percentage": 1.47, "elapsed_time": "0:08:53", "remaining_time": "9:57:46"}
{"current_steps": 30, "total_steps": 1364, "loss": 0.7079, "learning_rate": 5e-06, "epoch": 0.08778346744696415, "percentage": 2.2, "elapsed_time": "0:13:18", "remaining_time": "9:51:53"}
{"current_steps": 40, "total_steps": 1364, "loss": 0.6973, "learning_rate": 5e-06, "epoch": 0.11704462326261887, "percentage": 2.93, "elapsed_time": "0:17:43", "remaining_time": "9:46:44"}
{"current_steps": 50, "total_steps": 1364, "loss": 0.6874, "learning_rate": 5e-06, "epoch": 0.14630577907827358, "percentage": 3.67, "elapsed_time": "0:22:08", "remaining_time": "9:41:53"}
{"current_steps": 60, "total_steps": 1364, "loss": 0.677, "learning_rate": 5e-06, "epoch": 0.1755669348939283, "percentage": 4.4, "elapsed_time": "0:26:33", "remaining_time": "9:37:14"}
{"current_steps": 70, "total_steps": 1364, "loss": 0.6705, "learning_rate": 5e-06, "epoch": 0.20482809070958302, "percentage": 5.13, "elapsed_time": "0:30:58", "remaining_time": "9:32:36"}
{"current_steps": 80, "total_steps": 1364, "loss": 0.6653, "learning_rate": 5e-06, "epoch": 0.23408924652523774, "percentage": 5.87, "elapsed_time": "0:35:23", "remaining_time": "9:28:01"}
{"current_steps": 90, "total_steps": 1364, "loss": 0.6623, "learning_rate": 5e-06, "epoch": 0.26335040234089246, "percentage": 6.6, "elapsed_time": "0:39:48", "remaining_time": "9:23:28"}
{"current_steps": 100, "total_steps": 1364, "loss": 0.6548, "learning_rate": 5e-06, "epoch": 0.29261155815654716, "percentage": 7.33, "elapsed_time": "0:44:13", "remaining_time": "9:18:57"}
{"current_steps": 110, "total_steps": 1364, "loss": 0.6632, "learning_rate": 5e-06, "epoch": 0.3218727139722019, "percentage": 8.06, "elapsed_time": "0:48:38", "remaining_time": "9:14:26"}
{"current_steps": 120, "total_steps": 1364, "loss": 0.6684, "learning_rate": 5e-06, "epoch": 0.3511338697878566, "percentage": 8.8, "elapsed_time": "0:53:03", "remaining_time": "9:09:57"}
{"current_steps": 130, "total_steps": 1364, "loss": 0.6524, "learning_rate": 5e-06, "epoch": 0.38039502560351135, "percentage": 9.53, "elapsed_time": "0:57:28", "remaining_time": "9:05:29"}
{"current_steps": 140, "total_steps": 1364, "loss": 0.6527, "learning_rate": 5e-06, "epoch": 0.40965618141916604, "percentage": 10.26, "elapsed_time": "1:01:53", "remaining_time": "9:01:03"}
{"current_steps": 150, "total_steps": 1364, "loss": 0.6484, "learning_rate": 5e-06, "epoch": 0.4389173372348208, "percentage": 11.0, "elapsed_time": "1:06:18", "remaining_time": "8:56:36"}
{"current_steps": 160, "total_steps": 1364, "loss": 0.6497, "learning_rate": 5e-06, "epoch": 0.4681784930504755, "percentage": 11.73, "elapsed_time": "1:10:43", "remaining_time": "8:52:13"}
{"current_steps": 170, "total_steps": 1364, "loss": 0.655, "learning_rate": 5e-06, "epoch": 0.49743964886613024, "percentage": 12.46, "elapsed_time": "1:15:08", "remaining_time": "8:47:48"}
{"current_steps": 180, "total_steps": 1364, "loss": 0.6547, "learning_rate": 5e-06, "epoch": 0.5267008046817849, "percentage": 13.2, "elapsed_time": "1:19:34", "remaining_time": "8:43:23"}
{"current_steps": 190, "total_steps": 1364, "loss": 0.643, "learning_rate": 5e-06, "epoch": 0.5559619604974396, "percentage": 13.93, "elapsed_time": "1:23:59", "remaining_time": "8:38:55"}
{"current_steps": 200, "total_steps": 1364, "loss": 0.6447, "learning_rate": 5e-06, "epoch": 0.5852231163130943, "percentage": 14.66, "elapsed_time": "1:28:23", "remaining_time": "8:34:29"}
{"current_steps": 210, "total_steps": 1364, "loss": 0.6515, "learning_rate": 5e-06, "epoch": 0.6144842721287491, "percentage": 15.4, "elapsed_time": "1:32:48", "remaining_time": "8:30:01"}
{"current_steps": 220, "total_steps": 1364, "loss": 0.6392, "learning_rate": 5e-06, "epoch": 0.6437454279444038, "percentage": 16.13, "elapsed_time": "1:37:13", "remaining_time": "8:25:35"}
{"current_steps": 230, "total_steps": 1364, "loss": 0.6394, "learning_rate": 5e-06, "epoch": 0.6730065837600585, "percentage": 16.86, "elapsed_time": "1:41:38", "remaining_time": "8:21:08"}
{"current_steps": 240, "total_steps": 1364, "loss": 0.646, "learning_rate": 5e-06, "epoch": 0.7022677395757132, "percentage": 17.6, "elapsed_time": "1:46:03", "remaining_time": "8:16:43"}
{"current_steps": 250, "total_steps": 1364, "loss": 0.6445, "learning_rate": 5e-06, "epoch": 0.731528895391368, "percentage": 18.33, "elapsed_time": "1:50:28", "remaining_time": "8:12:17"}
{"current_steps": 260, "total_steps": 1364, "loss": 0.6471, "learning_rate": 5e-06, "epoch": 0.7607900512070227, "percentage": 19.06, "elapsed_time": "1:54:53", "remaining_time": "8:07:51"}
{"current_steps": 270, "total_steps": 1364, "loss": 0.6494, "learning_rate": 5e-06, "epoch": 0.7900512070226774, "percentage": 19.79, "elapsed_time": "1:59:18", "remaining_time": "8:03:26"}
{"current_steps": 280, "total_steps": 1364, "loss": 0.6474, "learning_rate": 5e-06, "epoch": 0.8193123628383321, "percentage": 20.53, "elapsed_time": "2:03:43", "remaining_time": "7:59:00"}
{"current_steps": 290, "total_steps": 1364, "loss": 0.6403, "learning_rate": 5e-06, "epoch": 0.8485735186539868, "percentage": 21.26, "elapsed_time": "2:08:08", "remaining_time": "7:54:34"}
{"current_steps": 300, "total_steps": 1364, "loss": 0.6319, "learning_rate": 5e-06, "epoch": 0.8778346744696416, "percentage": 21.99, "elapsed_time": "2:12:33", "remaining_time": "7:50:08"}
{"current_steps": 310, "total_steps": 1364, "loss": 0.6454, "learning_rate": 5e-06, "epoch": 0.9070958302852963, "percentage": 22.73, "elapsed_time": "2:16:58", "remaining_time": "7:45:42"}
{"current_steps": 320, "total_steps": 1364, "loss": 0.6373, "learning_rate": 5e-06, "epoch": 0.936356986100951, "percentage": 23.46, "elapsed_time": "2:21:23", "remaining_time": "7:41:17"}
{"current_steps": 330, "total_steps": 1364, "loss": 0.6406, "learning_rate": 5e-06, "epoch": 0.9656181419166057, "percentage": 24.19, "elapsed_time": "2:25:48", "remaining_time": "7:36:51"}
{"current_steps": 340, "total_steps": 1364, "loss": 0.6366, "learning_rate": 5e-06, "epoch": 0.9948792977322605, "percentage": 24.93, "elapsed_time": "2:30:13", "remaining_time": "7:32:25"}
{"current_steps": 341, "total_steps": 1364, "eval_loss": 0.6407667398452759, "epoch": 0.9978054133138259, "percentage": 25.0, "elapsed_time": "2:33:51", "remaining_time": "7:41:34"}
{"current_steps": 350, "total_steps": 1364, "loss": 0.6258, "learning_rate": 5e-06, "epoch": 1.024140453547915, "percentage": 25.66, "elapsed_time": "2:38:25", "remaining_time": "7:38:59"}
{"current_steps": 360, "total_steps": 1364, "loss": 0.6076, "learning_rate": 5e-06, "epoch": 1.0534016093635699, "percentage": 26.39, "elapsed_time": "2:42:50", "remaining_time": "7:34:10"}
{"current_steps": 370, "total_steps": 1364, "loss": 0.609, "learning_rate": 5e-06, "epoch": 1.0826627651792247, "percentage": 27.13, "elapsed_time": "2:47:16", "remaining_time": "7:29:22"}
{"current_steps": 380, "total_steps": 1364, "loss": 0.607, "learning_rate": 5e-06, "epoch": 1.1119239209948792, "percentage": 27.86, "elapsed_time": "2:51:41", "remaining_time": "7:24:35"}
{"current_steps": 390, "total_steps": 1364, "loss": 0.611, "learning_rate": 5e-06, "epoch": 1.141185076810534, "percentage": 28.59, "elapsed_time": "2:56:07", "remaining_time": "7:19:50"}
{"current_steps": 400, "total_steps": 1364, "loss": 0.6136, "learning_rate": 5e-06, "epoch": 1.1704462326261886, "percentage": 29.33, "elapsed_time": "3:00:32", "remaining_time": "7:15:06"}
{"current_steps": 410, "total_steps": 1364, "loss": 0.612, "learning_rate": 5e-06, "epoch": 1.1997073884418434, "percentage": 30.06, "elapsed_time": "3:04:58", "remaining_time": "7:10:23"}
{"current_steps": 420, "total_steps": 1364, "loss": 0.6017, "learning_rate": 5e-06, "epoch": 1.2289685442574982, "percentage": 30.79, "elapsed_time": "3:09:23", "remaining_time": "7:05:40"}
{"current_steps": 430, "total_steps": 1364, "loss": 0.6115, "learning_rate": 5e-06, "epoch": 1.2582297000731528, "percentage": 31.52, "elapsed_time": "3:13:48", "remaining_time": "7:00:59"}
{"current_steps": 440, "total_steps": 1364, "loss": 0.6046, "learning_rate": 5e-06, "epoch": 1.2874908558888076, "percentage": 32.26, "elapsed_time": "3:18:14", "remaining_time": "6:56:18"}
{"current_steps": 450, "total_steps": 1364, "loss": 0.6064, "learning_rate": 5e-06, "epoch": 1.3167520117044624, "percentage": 32.99, "elapsed_time": "3:22:39", "remaining_time": "6:51:37"}
{"current_steps": 460, "total_steps": 1364, "loss": 0.6059, "learning_rate": 5e-06, "epoch": 1.346013167520117, "percentage": 33.72, "elapsed_time": "3:27:05", "remaining_time": "6:46:58"}
{"current_steps": 470, "total_steps": 1364, "loss": 0.6016, "learning_rate": 5e-06, "epoch": 1.3752743233357718, "percentage": 34.46, "elapsed_time": "3:31:30", "remaining_time": "6:42:18"}
{"current_steps": 480, "total_steps": 1364, "loss": 0.606, "learning_rate": 5e-06, "epoch": 1.4045354791514264, "percentage": 35.19, "elapsed_time": "3:35:55", "remaining_time": "6:37:40"}
{"current_steps": 490, "total_steps": 1364, "loss": 0.6069, "learning_rate": 5e-06, "epoch": 1.4337966349670812, "percentage": 35.92, "elapsed_time": "3:40:21", "remaining_time": "6:33:02"}
{"current_steps": 500, "total_steps": 1364, "loss": 0.6006, "learning_rate": 5e-06, "epoch": 1.4630577907827358, "percentage": 36.66, "elapsed_time": "3:44:46", "remaining_time": "6:28:24"}
{"current_steps": 510, "total_steps": 1364, "loss": 0.6053, "learning_rate": 5e-06, "epoch": 1.4923189465983906, "percentage": 37.39, "elapsed_time": "3:49:11", "remaining_time": "6:23:47"}
{"current_steps": 520, "total_steps": 1364, "loss": 0.6085, "learning_rate": 5e-06, "epoch": 1.5215801024140454, "percentage": 38.12, "elapsed_time": "3:53:37", "remaining_time": "6:19:10"}
{"current_steps": 530, "total_steps": 1364, "loss": 0.608, "learning_rate": 5e-06, "epoch": 1.5508412582297, "percentage": 38.86, "elapsed_time": "3:58:02", "remaining_time": "6:14:34"}
{"current_steps": 540, "total_steps": 1364, "loss": 0.6142, "learning_rate": 5e-06, "epoch": 1.5801024140453548, "percentage": 39.59, "elapsed_time": "4:02:28", "remaining_time": "6:09:59"}
{"current_steps": 550, "total_steps": 1364, "loss": 0.6045, "learning_rate": 5e-06, "epoch": 1.6093635698610096, "percentage": 40.32, "elapsed_time": "4:06:53", "remaining_time": "6:05:24"}
{"current_steps": 560, "total_steps": 1364, "loss": 0.6067, "learning_rate": 5e-06, "epoch": 1.6386247256766642, "percentage": 41.06, "elapsed_time": "4:11:19", "remaining_time": "6:00:49"}
{"current_steps": 570, "total_steps": 1364, "loss": 0.5992, "learning_rate": 5e-06, "epoch": 1.667885881492319, "percentage": 41.79, "elapsed_time": "4:15:44", "remaining_time": "5:56:14"}
{"current_steps": 580, "total_steps": 1364, "loss": 0.6033, "learning_rate": 5e-06, "epoch": 1.6971470373079738, "percentage": 42.52, "elapsed_time": "4:20:09", "remaining_time": "5:51:40"}
{"current_steps": 590, "total_steps": 1364, "loss": 0.6081, "learning_rate": 5e-06, "epoch": 1.7264081931236284, "percentage": 43.26, "elapsed_time": "4:24:35", "remaining_time": "5:47:06"}
{"current_steps": 600, "total_steps": 1364, "loss": 0.6033, "learning_rate": 5e-06, "epoch": 1.755669348939283, "percentage": 43.99, "elapsed_time": "4:29:00", "remaining_time": "5:42:32"}
{"current_steps": 610, "total_steps": 1364, "loss": 0.6074, "learning_rate": 5e-06, "epoch": 1.784930504754938, "percentage": 44.72, "elapsed_time": "4:33:25", "remaining_time": "5:37:58"}
{"current_steps": 620, "total_steps": 1364, "loss": 0.6074, "learning_rate": 5e-06, "epoch": 1.8141916605705926, "percentage": 45.45, "elapsed_time": "4:37:51", "remaining_time": "5:33:25"}
{"current_steps": 630, "total_steps": 1364, "loss": 0.6061, "learning_rate": 5e-06, "epoch": 1.8434528163862471, "percentage": 46.19, "elapsed_time": "4:42:16", "remaining_time": "5:28:52"}
{"current_steps": 640, "total_steps": 1364, "loss": 0.6001, "learning_rate": 5e-06, "epoch": 1.872713972201902, "percentage": 46.92, "elapsed_time": "4:46:41", "remaining_time": "5:24:19"}
{"current_steps": 650, "total_steps": 1364, "loss": 0.6069, "learning_rate": 5e-06, "epoch": 1.9019751280175567, "percentage": 47.65, "elapsed_time": "4:51:06", "remaining_time": "5:19:46"}
{"current_steps": 660, "total_steps": 1364, "loss": 0.6065, "learning_rate": 5e-06, "epoch": 1.9312362838332113, "percentage": 48.39, "elapsed_time": "4:55:31", "remaining_time": "5:15:13"}
{"current_steps": 670, "total_steps": 1364, "loss": 0.5951, "learning_rate": 5e-06, "epoch": 1.9604974396488661, "percentage": 49.12, "elapsed_time": "4:59:56", "remaining_time": "5:10:41"}
{"current_steps": 680, "total_steps": 1364, "loss": 0.6091, "learning_rate": 5e-06, "epoch": 1.989758595464521, "percentage": 49.85, "elapsed_time": "5:04:21", "remaining_time": "5:06:08"}
{"current_steps": 683, "total_steps": 1364, "eval_loss": 0.6332206130027771, "epoch": 1.9985369422092174, "percentage": 50.07, "elapsed_time": "5:08:43", "remaining_time": "5:07:49"}
{"current_steps": 690, "total_steps": 1364, "loss": 0.5986, "learning_rate": 5e-06, "epoch": 2.0190197512801755, "percentage": 50.59, "elapsed_time": "5:12:34", "remaining_time": "5:05:19"}
{"current_steps": 700, "total_steps": 1364, "loss": 0.5678, "learning_rate": 5e-06, "epoch": 2.04828090709583, "percentage": 51.32, "elapsed_time": "5:16:59", "remaining_time": "5:00:41"}
{"current_steps": 710, "total_steps": 1364, "loss": 0.5703, "learning_rate": 5e-06, "epoch": 2.077542062911485, "percentage": 52.05, "elapsed_time": "5:21:24", "remaining_time": "4:56:03"}
{"current_steps": 720, "total_steps": 1364, "loss": 0.5703, "learning_rate": 5e-06, "epoch": 2.1068032187271397, "percentage": 52.79, "elapsed_time": "5:25:49", "remaining_time": "4:51:26"}
{"current_steps": 730, "total_steps": 1364, "loss": 0.5712, "learning_rate": 5e-06, "epoch": 2.1360643745427943, "percentage": 53.52, "elapsed_time": "5:30:14", "remaining_time": "4:46:49"}
{"current_steps": 740, "total_steps": 1364, "loss": 0.5777, "learning_rate": 5e-06, "epoch": 2.1653255303584493, "percentage": 54.25, "elapsed_time": "5:34:40", "remaining_time": "4:42:12"}
{"current_steps": 750, "total_steps": 1364, "loss": 0.5774, "learning_rate": 5e-06, "epoch": 2.194586686174104, "percentage": 54.99, "elapsed_time": "5:39:05", "remaining_time": "4:37:35"}
{"current_steps": 760, "total_steps": 1364, "loss": 0.5734, "learning_rate": 5e-06, "epoch": 2.2238478419897585, "percentage": 55.72, "elapsed_time": "5:43:29", "remaining_time": "4:32:59"}
{"current_steps": 770, "total_steps": 1364, "loss": 0.5731, "learning_rate": 5e-06, "epoch": 2.2531089978054135, "percentage": 56.45, "elapsed_time": "5:47:54", "remaining_time": "4:28:23"}
{"current_steps": 780, "total_steps": 1364, "loss": 0.5719, "learning_rate": 5e-06, "epoch": 2.282370153621068, "percentage": 57.18, "elapsed_time": "5:52:19", "remaining_time": "4:23:47"}
{"current_steps": 790, "total_steps": 1364, "loss": 0.572, "learning_rate": 5e-06, "epoch": 2.3116313094367227, "percentage": 57.92, "elapsed_time": "5:56:44", "remaining_time": "4:19:11"}
{"current_steps": 800, "total_steps": 1364, "loss": 0.5772, "learning_rate": 5e-06, "epoch": 2.3408924652523773, "percentage": 58.65, "elapsed_time": "6:01:08", "remaining_time": "4:14:36"}
{"current_steps": 810, "total_steps": 1364, "loss": 0.5708, "learning_rate": 5e-06, "epoch": 2.3701536210680323, "percentage": 59.38, "elapsed_time": "6:05:33", "remaining_time": "4:10:01"}
{"current_steps": 820, "total_steps": 1364, "loss": 0.5803, "learning_rate": 5e-06, "epoch": 2.399414776883687, "percentage": 60.12, "elapsed_time": "6:09:58", "remaining_time": "4:05:26"}
{"current_steps": 830, "total_steps": 1364, "loss": 0.5735, "learning_rate": 5e-06, "epoch": 2.4286759326993415, "percentage": 60.85, "elapsed_time": "6:14:23", "remaining_time": "4:00:52"}
{"current_steps": 840, "total_steps": 1364, "loss": 0.5709, "learning_rate": 5e-06, "epoch": 2.4579370885149965, "percentage": 61.58, "elapsed_time": "6:18:47", "remaining_time": "3:56:17"}
{"current_steps": 850, "total_steps": 1364, "loss": 0.5725, "learning_rate": 5e-06, "epoch": 2.487198244330651, "percentage": 62.32, "elapsed_time": "6:23:12", "remaining_time": "3:51:43"}
{"current_steps": 860, "total_steps": 1364, "loss": 0.569, "learning_rate": 5e-06, "epoch": 2.5164594001463056, "percentage": 63.05, "elapsed_time": "6:27:37", "remaining_time": "3:47:10"}
{"current_steps": 870, "total_steps": 1364, "loss": 0.5695, "learning_rate": 5e-06, "epoch": 2.5457205559619602, "percentage": 63.78, "elapsed_time": "6:32:02", "remaining_time": "3:42:36"}
{"current_steps": 880, "total_steps": 1364, "loss": 0.5757, "learning_rate": 5e-06, "epoch": 2.5749817117776153, "percentage": 64.52, "elapsed_time": "6:36:27", "remaining_time": "3:38:02"}
{"current_steps": 890, "total_steps": 1364, "loss": 0.5727, "learning_rate": 5e-06, "epoch": 2.60424286759327, "percentage": 65.25, "elapsed_time": "6:40:51", "remaining_time": "3:33:29"}
{"current_steps": 900, "total_steps": 1364, "loss": 0.5797, "learning_rate": 5e-06, "epoch": 2.633504023408925, "percentage": 65.98, "elapsed_time": "6:45:16", "remaining_time": "3:28:56"}
{"current_steps": 910, "total_steps": 1364, "loss": 0.5747, "learning_rate": 5e-06, "epoch": 2.6627651792245794, "percentage": 66.72, "elapsed_time": "6:49:41", "remaining_time": "3:24:23"}
{"current_steps": 920, "total_steps": 1364, "loss": 0.5756, "learning_rate": 5e-06, "epoch": 2.692026335040234, "percentage": 67.45, "elapsed_time": "6:54:06", "remaining_time": "3:19:51"}
{"current_steps": 930, "total_steps": 1364, "loss": 0.5753, "learning_rate": 5e-06, "epoch": 2.7212874908558886, "percentage": 68.18, "elapsed_time": "6:58:31", "remaining_time": "3:15:18"}
{"current_steps": 940, "total_steps": 1364, "loss": 0.5764, "learning_rate": 5e-06, "epoch": 2.7505486466715436, "percentage": 68.91, "elapsed_time": "7:02:55", "remaining_time": "3:10:46"}
{"current_steps": 950, "total_steps": 1364, "loss": 0.576, "learning_rate": 5e-06, "epoch": 2.7798098024871982, "percentage": 69.65, "elapsed_time": "7:07:20", "remaining_time": "3:06:13"}
{"current_steps": 960, "total_steps": 1364, "loss": 0.5754, "learning_rate": 5e-06, "epoch": 2.809070958302853, "percentage": 70.38, "elapsed_time": "7:11:45", "remaining_time": "3:01:41"}
{"current_steps": 970, "total_steps": 1364, "loss": 0.5743, "learning_rate": 5e-06, "epoch": 2.838332114118508, "percentage": 71.11, "elapsed_time": "7:16:10", "remaining_time": "2:57:09"}
{"current_steps": 980, "total_steps": 1364, "loss": 0.5728, "learning_rate": 5e-06, "epoch": 2.8675932699341624, "percentage": 71.85, "elapsed_time": "7:20:34", "remaining_time": "2:52:38"}
{"current_steps": 990, "total_steps": 1364, "loss": 0.568, "learning_rate": 5e-06, "epoch": 2.896854425749817, "percentage": 72.58, "elapsed_time": "7:24:59", "remaining_time": "2:48:06"}
{"current_steps": 1000, "total_steps": 1364, "loss": 0.5732, "learning_rate": 5e-06, "epoch": 2.9261155815654716, "percentage": 73.31, "elapsed_time": "7:29:24", "remaining_time": "2:43:35"}
{"current_steps": 1010, "total_steps": 1364, "loss": 0.5647, "learning_rate": 5e-06, "epoch": 2.9553767373811266, "percentage": 74.05, "elapsed_time": "7:33:49", "remaining_time": "2:39:03"}
{"current_steps": 1020, "total_steps": 1364, "loss": 0.5768, "learning_rate": 5e-06, "epoch": 2.984637893196781, "percentage": 74.78, "elapsed_time": "7:38:13", "remaining_time": "2:34:32"}
{"current_steps": 1025, "total_steps": 1364, "eval_loss": 0.632946252822876, "epoch": 2.9992684711046085, "percentage": 75.15, "elapsed_time": "7:43:22", "remaining_time": "2:33:15"}
{"current_steps": 1030, "total_steps": 1364, "loss": 0.5738, "learning_rate": 5e-06, "epoch": 3.0138990490124358, "percentage": 75.51, "elapsed_time": "7:46:23", "remaining_time": "2:31:14"}
{"current_steps": 1040, "total_steps": 1364, "loss": 0.5429, "learning_rate": 5e-06, "epoch": 3.043160204828091, "percentage": 76.25, "elapsed_time": "7:50:47", "remaining_time": "2:26:40"}
{"current_steps": 1050, "total_steps": 1364, "loss": 0.5418, "learning_rate": 5e-06, "epoch": 3.0724213606437454, "percentage": 76.98, "elapsed_time": "7:55:12", "remaining_time": "2:22:06"}
{"current_steps": 1060, "total_steps": 1364, "loss": 0.547, "learning_rate": 5e-06, "epoch": 3.1016825164594, "percentage": 77.71, "elapsed_time": "7:59:37", "remaining_time": "2:17:33"}
{"current_steps": 1070, "total_steps": 1364, "loss": 0.5428, "learning_rate": 5e-06, "epoch": 3.130943672275055, "percentage": 78.45, "elapsed_time": "8:04:02", "remaining_time": "2:12:59"}
{"current_steps": 1080, "total_steps": 1364, "loss": 0.5409, "learning_rate": 5e-06, "epoch": 3.1602048280907096, "percentage": 79.18, "elapsed_time": "8:08:27", "remaining_time": "2:08:26"}
{"current_steps": 1090, "total_steps": 1364, "loss": 0.5358, "learning_rate": 5e-06, "epoch": 3.189465983906364, "percentage": 79.91, "elapsed_time": "8:12:51", "remaining_time": "2:03:53"}
{"current_steps": 1100, "total_steps": 1364, "loss": 0.5438, "learning_rate": 5e-06, "epoch": 3.218727139722019, "percentage": 80.65, "elapsed_time": "8:17:16", "remaining_time": "1:59:20"}
{"current_steps": 1110, "total_steps": 1364, "loss": 0.545, "learning_rate": 5e-06, "epoch": 3.2479882955376738, "percentage": 81.38, "elapsed_time": "8:21:41", "remaining_time": "1:54:48"}
{"current_steps": 1120, "total_steps": 1364, "loss": 0.5406, "learning_rate": 5e-06, "epoch": 3.2772494513533283, "percentage": 82.11, "elapsed_time": "8:26:06", "remaining_time": "1:50:15"}
{"current_steps": 1130, "total_steps": 1364, "loss": 0.5385, "learning_rate": 5e-06, "epoch": 3.306510607168983, "percentage": 82.84, "elapsed_time": "8:30:31", "remaining_time": "1:45:43"}
{"current_steps": 1140, "total_steps": 1364, "loss": 0.5373, "learning_rate": 5e-06, "epoch": 3.335771762984638, "percentage": 83.58, "elapsed_time": "8:34:56", "remaining_time": "1:41:10"}
{"current_steps": 1150, "total_steps": 1364, "loss": 0.5423, "learning_rate": 5e-06, "epoch": 3.3650329188002925, "percentage": 84.31, "elapsed_time": "8:39:21", "remaining_time": "1:36:38"}
{"current_steps": 1160, "total_steps": 1364, "loss": 0.5455, "learning_rate": 5e-06, "epoch": 3.3942940746159476, "percentage": 85.04, "elapsed_time": "8:43:45", "remaining_time": "1:32:06"}
{"current_steps": 1170, "total_steps": 1364, "loss": 0.5418, "learning_rate": 5e-06, "epoch": 3.423555230431602, "percentage": 85.78, "elapsed_time": "8:48:10", "remaining_time": "1:27:34"}
{"current_steps": 1180, "total_steps": 1364, "loss": 0.5422, "learning_rate": 5e-06, "epoch": 3.4528163862472567, "percentage": 86.51, "elapsed_time": "8:52:35", "remaining_time": "1:23:02"}
{"current_steps": 1190, "total_steps": 1364, "loss": 0.5469, "learning_rate": 5e-06, "epoch": 3.4820775420629113, "percentage": 87.24, "elapsed_time": "8:57:00", "remaining_time": "1:18:31"}
{"current_steps": 1200, "total_steps": 1364, "loss": 0.5436, "learning_rate": 5e-06, "epoch": 3.5113386978785663, "percentage": 87.98, "elapsed_time": "9:01:25", "remaining_time": "1:13:59"}
{"current_steps": 1210, "total_steps": 1364, "loss": 0.5393, "learning_rate": 5e-06, "epoch": 3.540599853694221, "percentage": 88.71, "elapsed_time": "9:05:50", "remaining_time": "1:09:28"}
{"current_steps": 1220, "total_steps": 1364, "loss": 0.5423, "learning_rate": 5e-06, "epoch": 3.5698610095098755, "percentage": 89.44, "elapsed_time": "9:10:15", "remaining_time": "1:04:56"}
{"current_steps": 1230, "total_steps": 1364, "loss": 0.5419, "learning_rate": 5e-06, "epoch": 3.5991221653255305, "percentage": 90.18, "elapsed_time": "9:14:40", "remaining_time": "1:00:25"}
{"current_steps": 1240, "total_steps": 1364, "loss": 0.547, "learning_rate": 5e-06, "epoch": 3.628383321141185, "percentage": 90.91, "elapsed_time": "9:19:05", "remaining_time": "0:55:54"}
{"current_steps": 1250, "total_steps": 1364, "loss": 0.5422, "learning_rate": 5e-06, "epoch": 3.6576444769568397, "percentage": 91.64, "elapsed_time": "9:23:30", "remaining_time": "0:51:23"}
{"current_steps": 1260, "total_steps": 1364, "loss": 0.5406, "learning_rate": 5e-06, "epoch": 3.6869056327724943, "percentage": 92.38, "elapsed_time": "9:27:54", "remaining_time": "0:46:52"}
{"current_steps": 1270, "total_steps": 1364, "loss": 0.5399, "learning_rate": 5e-06, "epoch": 3.7161667885881493, "percentage": 93.11, "elapsed_time": "9:32:19", "remaining_time": "0:42:21"}
{"current_steps": 1280, "total_steps": 1364, "loss": 0.5464, "learning_rate": 5e-06, "epoch": 3.745427944403804, "percentage": 93.84, "elapsed_time": "9:36:44", "remaining_time": "0:37:50"}
{"current_steps": 1290, "total_steps": 1364, "loss": 0.541, "learning_rate": 5e-06, "epoch": 3.774689100219459, "percentage": 94.57, "elapsed_time": "9:41:09", "remaining_time": "0:33:20"}
{"current_steps": 1300, "total_steps": 1364, "loss": 0.5466, "learning_rate": 5e-06, "epoch": 3.8039502560351135, "percentage": 95.31, "elapsed_time": "9:45:34", "remaining_time": "0:28:49"}
{"current_steps": 1310, "total_steps": 1364, "loss": 0.5496, "learning_rate": 5e-06, "epoch": 3.833211411850768, "percentage": 96.04, "elapsed_time": "9:49:59", "remaining_time": "0:24:19"}
{"current_steps": 1320, "total_steps": 1364, "loss": 0.5502, "learning_rate": 5e-06, "epoch": 3.8624725676664227, "percentage": 96.77, "elapsed_time": "9:54:24", "remaining_time": "0:19:48"}
{"current_steps": 1330, "total_steps": 1364, "loss": 0.5412, "learning_rate": 5e-06, "epoch": 3.8917337234820777, "percentage": 97.51, "elapsed_time": "9:58:49", "remaining_time": "0:15:18"}
{"current_steps": 1340, "total_steps": 1364, "loss": 0.5422, "learning_rate": 5e-06, "epoch": 3.9209948792977323, "percentage": 98.24, "elapsed_time": "10:03:14", "remaining_time": "0:10:48"}
{"current_steps": 1350, "total_steps": 1364, "loss": 0.5479, "learning_rate": 5e-06, "epoch": 3.950256035113387, "percentage": 98.97, "elapsed_time": "10:07:39", "remaining_time": "0:06:18"}
{"current_steps": 1360, "total_steps": 1364, "loss": 0.5456, "learning_rate": 5e-06, "epoch": 3.979517190929042, "percentage": 99.71, "elapsed_time": "10:12:04", "remaining_time": "0:01:48"}
{"current_steps": 1364, "total_steps": 1364, "eval_loss": 0.6392698287963867, "epoch": 3.9912216532553035, "percentage": 100.0, "elapsed_time": "10:17:38", "remaining_time": "0:00:00"}
{"current_steps": 1364, "total_steps": 1364, "epoch": 3.9912216532553035, "percentage": 100.0, "elapsed_time": "10:18:43", "remaining_time": "0:00:00"}