gsmyrnis's picture
Training in progress, epoch 3
ce0f96f verified
{"current_steps": 10, "total_steps": 927, "loss": 1.0447, "learning_rate": 5e-06, "epoch": 0.032362459546925564, "percentage": 1.08, "elapsed_time": "0:01:01", "remaining_time": "1:33:20"}
{"current_steps": 20, "total_steps": 927, "loss": 0.9033, "learning_rate": 5e-06, "epoch": 0.06472491909385113, "percentage": 2.16, "elapsed_time": "0:01:59", "remaining_time": "1:29:59"}
{"current_steps": 30, "total_steps": 927, "loss": 0.8703, "learning_rate": 5e-06, "epoch": 0.0970873786407767, "percentage": 3.24, "elapsed_time": "0:02:57", "remaining_time": "1:28:15"}
{"current_steps": 40, "total_steps": 927, "loss": 0.8471, "learning_rate": 5e-06, "epoch": 0.12944983818770225, "percentage": 4.31, "elapsed_time": "0:03:55", "remaining_time": "1:26:54"}
{"current_steps": 50, "total_steps": 927, "loss": 0.8193, "learning_rate": 5e-06, "epoch": 0.16181229773462782, "percentage": 5.39, "elapsed_time": "0:04:53", "remaining_time": "1:25:51"}
{"current_steps": 60, "total_steps": 927, "loss": 0.8027, "learning_rate": 5e-06, "epoch": 0.1941747572815534, "percentage": 6.47, "elapsed_time": "0:05:51", "remaining_time": "1:24:46"}
{"current_steps": 70, "total_steps": 927, "loss": 0.7845, "learning_rate": 5e-06, "epoch": 0.22653721682847897, "percentage": 7.55, "elapsed_time": "0:06:49", "remaining_time": "1:23:39"}
{"current_steps": 80, "total_steps": 927, "loss": 0.7727, "learning_rate": 5e-06, "epoch": 0.2588996763754045, "percentage": 8.63, "elapsed_time": "0:07:48", "remaining_time": "1:22:35"}
{"current_steps": 90, "total_steps": 927, "loss": 0.7653, "learning_rate": 5e-06, "epoch": 0.2912621359223301, "percentage": 9.71, "elapsed_time": "0:08:46", "remaining_time": "1:21:33"}
{"current_steps": 100, "total_steps": 927, "loss": 0.7573, "learning_rate": 5e-06, "epoch": 0.32362459546925565, "percentage": 10.79, "elapsed_time": "0:09:44", "remaining_time": "1:20:31"}
{"current_steps": 110, "total_steps": 927, "loss": 0.7512, "learning_rate": 5e-06, "epoch": 0.3559870550161812, "percentage": 11.87, "elapsed_time": "0:10:43", "remaining_time": "1:19:36"}
{"current_steps": 120, "total_steps": 927, "loss": 0.7493, "learning_rate": 5e-06, "epoch": 0.3883495145631068, "percentage": 12.94, "elapsed_time": "0:11:41", "remaining_time": "1:18:36"}
{"current_steps": 130, "total_steps": 927, "loss": 0.749, "learning_rate": 5e-06, "epoch": 0.42071197411003236, "percentage": 14.02, "elapsed_time": "0:12:39", "remaining_time": "1:17:36"}
{"current_steps": 140, "total_steps": 927, "loss": 0.7397, "learning_rate": 5e-06, "epoch": 0.45307443365695793, "percentage": 15.1, "elapsed_time": "0:13:37", "remaining_time": "1:16:36"}
{"current_steps": 150, "total_steps": 927, "loss": 0.7409, "learning_rate": 5e-06, "epoch": 0.4854368932038835, "percentage": 16.18, "elapsed_time": "0:14:35", "remaining_time": "1:15:37"}
{"current_steps": 160, "total_steps": 927, "loss": 0.7375, "learning_rate": 5e-06, "epoch": 0.517799352750809, "percentage": 17.26, "elapsed_time": "0:15:34", "remaining_time": "1:14:38"}
{"current_steps": 170, "total_steps": 927, "loss": 0.732, "learning_rate": 5e-06, "epoch": 0.5501618122977346, "percentage": 18.34, "elapsed_time": "0:16:33", "remaining_time": "1:13:44"}
{"current_steps": 180, "total_steps": 927, "loss": 0.7353, "learning_rate": 5e-06, "epoch": 0.5825242718446602, "percentage": 19.42, "elapsed_time": "0:17:32", "remaining_time": "1:12:45"}
{"current_steps": 190, "total_steps": 927, "loss": 0.7298, "learning_rate": 5e-06, "epoch": 0.6148867313915858, "percentage": 20.5, "elapsed_time": "0:18:30", "remaining_time": "1:11:46"}
{"current_steps": 200, "total_steps": 927, "loss": 0.7261, "learning_rate": 5e-06, "epoch": 0.6472491909385113, "percentage": 21.57, "elapsed_time": "0:19:28", "remaining_time": "1:10:46"}
{"current_steps": 210, "total_steps": 927, "loss": 0.7269, "learning_rate": 5e-06, "epoch": 0.6796116504854369, "percentage": 22.65, "elapsed_time": "0:20:26", "remaining_time": "1:09:47"}
{"current_steps": 220, "total_steps": 927, "loss": 0.7308, "learning_rate": 5e-06, "epoch": 0.7119741100323624, "percentage": 23.73, "elapsed_time": "0:21:24", "remaining_time": "1:08:48"}
{"current_steps": 230, "total_steps": 927, "loss": 0.7216, "learning_rate": 5e-06, "epoch": 0.7443365695792881, "percentage": 24.81, "elapsed_time": "0:22:22", "remaining_time": "1:07:49"}
{"current_steps": 240, "total_steps": 927, "loss": 0.7244, "learning_rate": 5e-06, "epoch": 0.7766990291262136, "percentage": 25.89, "elapsed_time": "0:23:21", "remaining_time": "1:06:50"}
{"current_steps": 250, "total_steps": 927, "loss": 0.719, "learning_rate": 5e-06, "epoch": 0.8090614886731392, "percentage": 26.97, "elapsed_time": "0:24:18", "remaining_time": "1:05:50"}
{"current_steps": 260, "total_steps": 927, "loss": 0.7158, "learning_rate": 5e-06, "epoch": 0.8414239482200647, "percentage": 28.05, "elapsed_time": "0:25:17", "remaining_time": "1:04:51"}
{"current_steps": 270, "total_steps": 927, "loss": 0.7222, "learning_rate": 5e-06, "epoch": 0.8737864077669902, "percentage": 29.13, "elapsed_time": "0:26:15", "remaining_time": "1:03:52"}
{"current_steps": 280, "total_steps": 927, "loss": 0.7206, "learning_rate": 5e-06, "epoch": 0.9061488673139159, "percentage": 30.2, "elapsed_time": "0:27:13", "remaining_time": "1:02:54"}
{"current_steps": 290, "total_steps": 927, "loss": 0.7071, "learning_rate": 5e-06, "epoch": 0.9385113268608414, "percentage": 31.28, "elapsed_time": "0:28:11", "remaining_time": "1:01:56"}
{"current_steps": 300, "total_steps": 927, "loss": 0.7215, "learning_rate": 5e-06, "epoch": 0.970873786407767, "percentage": 32.36, "elapsed_time": "0:29:09", "remaining_time": "1:00:57"}
{"current_steps": 309, "total_steps": 927, "eval_loss": 0.7100771069526672, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:30:31", "remaining_time": "1:01:03"}
{"current_steps": 310, "total_steps": 927, "loss": 0.712, "learning_rate": 5e-06, "epoch": 1.0032362459546926, "percentage": 33.44, "elapsed_time": "0:32:14", "remaining_time": "1:04:09"}
{"current_steps": 320, "total_steps": 927, "loss": 0.6624, "learning_rate": 5e-06, "epoch": 1.035598705501618, "percentage": 34.52, "elapsed_time": "0:33:12", "remaining_time": "1:02:58"}
{"current_steps": 330, "total_steps": 927, "loss": 0.661, "learning_rate": 5e-06, "epoch": 1.0679611650485437, "percentage": 35.6, "elapsed_time": "0:34:09", "remaining_time": "1:01:48"}
{"current_steps": 340, "total_steps": 927, "loss": 0.6575, "learning_rate": 5e-06, "epoch": 1.1003236245954693, "percentage": 36.68, "elapsed_time": "0:35:08", "remaining_time": "1:00:39"}
{"current_steps": 350, "total_steps": 927, "loss": 0.6677, "learning_rate": 5e-06, "epoch": 1.132686084142395, "percentage": 37.76, "elapsed_time": "0:36:06", "remaining_time": "0:59:30"}
{"current_steps": 360, "total_steps": 927, "loss": 0.6611, "learning_rate": 5e-06, "epoch": 1.1650485436893203, "percentage": 38.83, "elapsed_time": "0:37:03", "remaining_time": "0:58:22"}
{"current_steps": 370, "total_steps": 927, "loss": 0.6637, "learning_rate": 5e-06, "epoch": 1.197411003236246, "percentage": 39.91, "elapsed_time": "0:38:01", "remaining_time": "0:57:15"}
{"current_steps": 380, "total_steps": 927, "loss": 0.6564, "learning_rate": 5e-06, "epoch": 1.2297734627831716, "percentage": 40.99, "elapsed_time": "0:38:59", "remaining_time": "0:56:08"}
{"current_steps": 390, "total_steps": 927, "loss": 0.6659, "learning_rate": 5e-06, "epoch": 1.262135922330097, "percentage": 42.07, "elapsed_time": "0:39:58", "remaining_time": "0:55:01"}
{"current_steps": 400, "total_steps": 927, "loss": 0.6591, "learning_rate": 5e-06, "epoch": 1.2944983818770226, "percentage": 43.15, "elapsed_time": "0:40:56", "remaining_time": "0:53:55"}
{"current_steps": 410, "total_steps": 927, "loss": 0.6632, "learning_rate": 5e-06, "epoch": 1.3268608414239482, "percentage": 44.23, "elapsed_time": "0:41:54", "remaining_time": "0:52:50"}
{"current_steps": 420, "total_steps": 927, "loss": 0.6651, "learning_rate": 5e-06, "epoch": 1.3592233009708738, "percentage": 45.31, "elapsed_time": "0:42:52", "remaining_time": "0:51:44"}
{"current_steps": 430, "total_steps": 927, "loss": 0.6671, "learning_rate": 5e-06, "epoch": 1.3915857605177995, "percentage": 46.39, "elapsed_time": "0:43:50", "remaining_time": "0:50:39"}
{"current_steps": 440, "total_steps": 927, "loss": 0.656, "learning_rate": 5e-06, "epoch": 1.4239482200647249, "percentage": 47.46, "elapsed_time": "0:44:48", "remaining_time": "0:49:35"}
{"current_steps": 450, "total_steps": 927, "loss": 0.6596, "learning_rate": 5e-06, "epoch": 1.4563106796116505, "percentage": 48.54, "elapsed_time": "0:45:46", "remaining_time": "0:48:31"}
{"current_steps": 460, "total_steps": 927, "loss": 0.6595, "learning_rate": 5e-06, "epoch": 1.4886731391585761, "percentage": 49.62, "elapsed_time": "0:46:45", "remaining_time": "0:47:27"}
{"current_steps": 470, "total_steps": 927, "loss": 0.6628, "learning_rate": 5e-06, "epoch": 1.5210355987055015, "percentage": 50.7, "elapsed_time": "0:47:43", "remaining_time": "0:46:23"}
{"current_steps": 480, "total_steps": 927, "loss": 0.6638, "learning_rate": 5e-06, "epoch": 1.5533980582524272, "percentage": 51.78, "elapsed_time": "0:48:41", "remaining_time": "0:45:20"}
{"current_steps": 490, "total_steps": 927, "loss": 0.6682, "learning_rate": 5e-06, "epoch": 1.5857605177993528, "percentage": 52.86, "elapsed_time": "0:49:39", "remaining_time": "0:44:16"}
{"current_steps": 500, "total_steps": 927, "loss": 0.6612, "learning_rate": 5e-06, "epoch": 1.6181229773462782, "percentage": 53.94, "elapsed_time": "0:50:37", "remaining_time": "0:43:13"}
{"current_steps": 510, "total_steps": 927, "loss": 0.6576, "learning_rate": 5e-06, "epoch": 1.650485436893204, "percentage": 55.02, "elapsed_time": "0:51:35", "remaining_time": "0:42:10"}
{"current_steps": 520, "total_steps": 927, "loss": 0.6644, "learning_rate": 5e-06, "epoch": 1.6828478964401294, "percentage": 56.09, "elapsed_time": "0:52:33", "remaining_time": "0:41:07"}
{"current_steps": 530, "total_steps": 927, "loss": 0.6581, "learning_rate": 5e-06, "epoch": 1.715210355987055, "percentage": 57.17, "elapsed_time": "0:53:31", "remaining_time": "0:40:05"}
{"current_steps": 540, "total_steps": 927, "loss": 0.6583, "learning_rate": 5e-06, "epoch": 1.7475728155339807, "percentage": 58.25, "elapsed_time": "0:54:29", "remaining_time": "0:39:03"}
{"current_steps": 550, "total_steps": 927, "loss": 0.6598, "learning_rate": 5e-06, "epoch": 1.779935275080906, "percentage": 59.33, "elapsed_time": "0:55:27", "remaining_time": "0:38:00"}
{"current_steps": 560, "total_steps": 927, "loss": 0.6639, "learning_rate": 5e-06, "epoch": 1.8122977346278317, "percentage": 60.41, "elapsed_time": "0:56:25", "remaining_time": "0:36:58"}
{"current_steps": 570, "total_steps": 927, "loss": 0.6566, "learning_rate": 5e-06, "epoch": 1.8446601941747574, "percentage": 61.49, "elapsed_time": "0:57:23", "remaining_time": "0:35:56"}
{"current_steps": 580, "total_steps": 927, "loss": 0.6596, "learning_rate": 5e-06, "epoch": 1.8770226537216828, "percentage": 62.57, "elapsed_time": "0:58:21", "remaining_time": "0:34:54"}
{"current_steps": 590, "total_steps": 927, "loss": 0.6559, "learning_rate": 5e-06, "epoch": 1.9093851132686084, "percentage": 63.65, "elapsed_time": "0:59:19", "remaining_time": "0:33:53"}
{"current_steps": 600, "total_steps": 927, "loss": 0.6566, "learning_rate": 5e-06, "epoch": 1.941747572815534, "percentage": 64.72, "elapsed_time": "1:00:17", "remaining_time": "0:32:51"}
{"current_steps": 610, "total_steps": 927, "loss": 0.6579, "learning_rate": 5e-06, "epoch": 1.9741100323624594, "percentage": 65.8, "elapsed_time": "1:01:15", "remaining_time": "0:31:49"}
{"current_steps": 618, "total_steps": 927, "eval_loss": 0.7000192999839783, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:02:31", "remaining_time": "0:31:15"}
{"current_steps": 620, "total_steps": 927, "loss": 0.6475, "learning_rate": 5e-06, "epoch": 2.0064724919093853, "percentage": 66.88, "elapsed_time": "1:04:21", "remaining_time": "0:31:51"}
{"current_steps": 630, "total_steps": 927, "loss": 0.6054, "learning_rate": 5e-06, "epoch": 2.0388349514563107, "percentage": 67.96, "elapsed_time": "1:05:19", "remaining_time": "0:30:47"}
{"current_steps": 640, "total_steps": 927, "loss": 0.6071, "learning_rate": 5e-06, "epoch": 2.071197411003236, "percentage": 69.04, "elapsed_time": "1:06:17", "remaining_time": "0:29:43"}
{"current_steps": 650, "total_steps": 927, "loss": 0.6007, "learning_rate": 5e-06, "epoch": 2.103559870550162, "percentage": 70.12, "elapsed_time": "1:07:15", "remaining_time": "0:28:39"}
{"current_steps": 660, "total_steps": 927, "loss": 0.6064, "learning_rate": 5e-06, "epoch": 2.1359223300970873, "percentage": 71.2, "elapsed_time": "1:08:14", "remaining_time": "0:27:36"}
{"current_steps": 670, "total_steps": 927, "loss": 0.6036, "learning_rate": 5e-06, "epoch": 2.168284789644013, "percentage": 72.28, "elapsed_time": "1:09:12", "remaining_time": "0:26:32"}
{"current_steps": 680, "total_steps": 927, "loss": 0.6031, "learning_rate": 5e-06, "epoch": 2.2006472491909386, "percentage": 73.35, "elapsed_time": "1:10:10", "remaining_time": "0:25:29"}
{"current_steps": 690, "total_steps": 927, "loss": 0.6021, "learning_rate": 5e-06, "epoch": 2.233009708737864, "percentage": 74.43, "elapsed_time": "1:11:08", "remaining_time": "0:24:26"}
{"current_steps": 700, "total_steps": 927, "loss": 0.6054, "learning_rate": 5e-06, "epoch": 2.26537216828479, "percentage": 75.51, "elapsed_time": "1:12:06", "remaining_time": "0:23:22"}
{"current_steps": 710, "total_steps": 927, "loss": 0.606, "learning_rate": 5e-06, "epoch": 2.2977346278317152, "percentage": 76.59, "elapsed_time": "1:13:04", "remaining_time": "0:22:20"}
{"current_steps": 720, "total_steps": 927, "loss": 0.6083, "learning_rate": 5e-06, "epoch": 2.3300970873786406, "percentage": 77.67, "elapsed_time": "1:14:02", "remaining_time": "0:21:17"}
{"current_steps": 730, "total_steps": 927, "loss": 0.6128, "learning_rate": 5e-06, "epoch": 2.3624595469255665, "percentage": 78.75, "elapsed_time": "1:15:00", "remaining_time": "0:20:14"}
{"current_steps": 740, "total_steps": 927, "loss": 0.6112, "learning_rate": 5e-06, "epoch": 2.394822006472492, "percentage": 79.83, "elapsed_time": "1:15:58", "remaining_time": "0:19:11"}
{"current_steps": 750, "total_steps": 927, "loss": 0.6054, "learning_rate": 5e-06, "epoch": 2.4271844660194173, "percentage": 80.91, "elapsed_time": "1:16:56", "remaining_time": "0:18:09"}
{"current_steps": 760, "total_steps": 927, "loss": 0.6035, "learning_rate": 5e-06, "epoch": 2.459546925566343, "percentage": 81.98, "elapsed_time": "1:17:54", "remaining_time": "0:17:07"}
{"current_steps": 770, "total_steps": 927, "loss": 0.6094, "learning_rate": 5e-06, "epoch": 2.4919093851132685, "percentage": 83.06, "elapsed_time": "1:18:52", "remaining_time": "0:16:04"}
{"current_steps": 780, "total_steps": 927, "loss": 0.6051, "learning_rate": 5e-06, "epoch": 2.524271844660194, "percentage": 84.14, "elapsed_time": "1:19:50", "remaining_time": "0:15:02"}
{"current_steps": 790, "total_steps": 927, "loss": 0.6031, "learning_rate": 5e-06, "epoch": 2.55663430420712, "percentage": 85.22, "elapsed_time": "1:20:48", "remaining_time": "0:14:00"}
{"current_steps": 800, "total_steps": 927, "loss": 0.6105, "learning_rate": 5e-06, "epoch": 2.588996763754045, "percentage": 86.3, "elapsed_time": "1:21:47", "remaining_time": "0:12:58"}
{"current_steps": 810, "total_steps": 927, "loss": 0.6126, "learning_rate": 5e-06, "epoch": 2.6213592233009706, "percentage": 87.38, "elapsed_time": "1:22:45", "remaining_time": "0:11:57"}
{"current_steps": 820, "total_steps": 927, "loss": 0.6123, "learning_rate": 5e-06, "epoch": 2.6537216828478964, "percentage": 88.46, "elapsed_time": "1:23:43", "remaining_time": "0:10:55"}
{"current_steps": 830, "total_steps": 927, "loss": 0.6154, "learning_rate": 5e-06, "epoch": 2.686084142394822, "percentage": 89.54, "elapsed_time": "1:24:41", "remaining_time": "0:09:53"}
{"current_steps": 840, "total_steps": 927, "loss": 0.6112, "learning_rate": 5e-06, "epoch": 2.7184466019417477, "percentage": 90.61, "elapsed_time": "1:25:39", "remaining_time": "0:08:52"}
{"current_steps": 850, "total_steps": 927, "loss": 0.6094, "learning_rate": 5e-06, "epoch": 2.750809061488673, "percentage": 91.69, "elapsed_time": "1:26:37", "remaining_time": "0:07:50"}
{"current_steps": 860, "total_steps": 927, "loss": 0.6073, "learning_rate": 5e-06, "epoch": 2.783171521035599, "percentage": 92.77, "elapsed_time": "1:27:35", "remaining_time": "0:06:49"}
{"current_steps": 870, "total_steps": 927, "loss": 0.6074, "learning_rate": 5e-06, "epoch": 2.8155339805825244, "percentage": 93.85, "elapsed_time": "1:28:33", "remaining_time": "0:05:48"}
{"current_steps": 880, "total_steps": 927, "loss": 0.615, "learning_rate": 5e-06, "epoch": 2.8478964401294498, "percentage": 94.93, "elapsed_time": "1:29:31", "remaining_time": "0:04:46"}
{"current_steps": 890, "total_steps": 927, "loss": 0.6121, "learning_rate": 5e-06, "epoch": 2.8802588996763756, "percentage": 96.01, "elapsed_time": "1:30:29", "remaining_time": "0:03:45"}
{"current_steps": 900, "total_steps": 927, "loss": 0.609, "learning_rate": 5e-06, "epoch": 2.912621359223301, "percentage": 97.09, "elapsed_time": "1:31:27", "remaining_time": "0:02:44"}
{"current_steps": 910, "total_steps": 927, "loss": 0.613, "learning_rate": 5e-06, "epoch": 2.9449838187702264, "percentage": 98.17, "elapsed_time": "1:32:26", "remaining_time": "0:01:43"}
{"current_steps": 920, "total_steps": 927, "loss": 0.6131, "learning_rate": 5e-06, "epoch": 2.9773462783171523, "percentage": 99.24, "elapsed_time": "1:33:24", "remaining_time": "0:00:42"}
{"current_steps": 927, "total_steps": 927, "eval_loss": 0.7055738568305969, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:36:20", "remaining_time": "0:00:00"}
{"current_steps": 927, "total_steps": 927, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:37:53", "remaining_time": "0:00:00"}