sedrickkeh's picture
Training in progress, epoch 2
17d9b08 verified
{"current_steps": 10, "total_steps": 672, "loss": 0.7727, "lr": 5e-06, "epoch": 0.04449388209121246, "percentage": 1.49, "elapsed_time": "0:09:47", "remaining_time": "10:48:09"}
{"current_steps": 20, "total_steps": 672, "loss": 0.7067, "lr": 5e-06, "epoch": 0.08898776418242492, "percentage": 2.98, "elapsed_time": "0:19:28", "remaining_time": "10:34:52"}
{"current_steps": 30, "total_steps": 672, "loss": 0.6732, "lr": 5e-06, "epoch": 0.13348164627363737, "percentage": 4.46, "elapsed_time": "0:29:10", "remaining_time": "10:24:28"}
{"current_steps": 40, "total_steps": 672, "loss": 0.6514, "lr": 5e-06, "epoch": 0.17797552836484984, "percentage": 5.95, "elapsed_time": "0:38:53", "remaining_time": "10:14:24"}
{"current_steps": 50, "total_steps": 672, "loss": 0.6433, "lr": 5e-06, "epoch": 0.22246941045606228, "percentage": 7.44, "elapsed_time": "0:48:35", "remaining_time": "10:04:24"}
{"current_steps": 60, "total_steps": 672, "loss": 0.6295, "lr": 5e-06, "epoch": 0.26696329254727474, "percentage": 8.93, "elapsed_time": "0:58:16", "remaining_time": "9:54:29"}
{"current_steps": 70, "total_steps": 672, "loss": 0.615, "lr": 5e-06, "epoch": 0.3114571746384872, "percentage": 10.42, "elapsed_time": "1:07:58", "remaining_time": "9:44:36"}
{"current_steps": 80, "total_steps": 672, "loss": 0.6111, "lr": 5e-06, "epoch": 0.3559510567296997, "percentage": 11.9, "elapsed_time": "1:17:40", "remaining_time": "9:34:47"}
{"current_steps": 90, "total_steps": 672, "loss": 0.6, "lr": 5e-06, "epoch": 0.40044493882091214, "percentage": 13.39, "elapsed_time": "1:27:21", "remaining_time": "9:24:54"}
{"current_steps": 100, "total_steps": 672, "loss": 0.6087, "lr": 5e-06, "epoch": 0.44493882091212456, "percentage": 14.88, "elapsed_time": "1:37:02", "remaining_time": "9:15:05"}
{"current_steps": 110, "total_steps": 672, "loss": 0.5983, "lr": 5e-06, "epoch": 0.489432703003337, "percentage": 16.37, "elapsed_time": "1:46:43", "remaining_time": "9:05:18"}
{"current_steps": 120, "total_steps": 672, "loss": 0.6023, "lr": 5e-06, "epoch": 0.5339265850945495, "percentage": 17.86, "elapsed_time": "1:56:27", "remaining_time": "8:55:41"}
{"current_steps": 130, "total_steps": 672, "loss": 0.5919, "lr": 5e-06, "epoch": 0.578420467185762, "percentage": 19.35, "elapsed_time": "2:06:10", "remaining_time": "8:46:03"}
{"current_steps": 140, "total_steps": 672, "loss": 0.5974, "lr": 5e-06, "epoch": 0.6229143492769744, "percentage": 20.83, "elapsed_time": "2:15:51", "remaining_time": "8:36:15"}
{"current_steps": 150, "total_steps": 672, "loss": 0.5945, "lr": 5e-06, "epoch": 0.6674082313681868, "percentage": 22.32, "elapsed_time": "2:25:34", "remaining_time": "8:26:34"}
{"current_steps": 160, "total_steps": 672, "loss": 0.5892, "lr": 5e-06, "epoch": 0.7119021134593994, "percentage": 23.81, "elapsed_time": "2:35:16", "remaining_time": "8:16:53"}
{"current_steps": 170, "total_steps": 672, "loss": 0.5856, "lr": 5e-06, "epoch": 0.7563959955506118, "percentage": 25.3, "elapsed_time": "2:45:00", "remaining_time": "8:07:14"}
{"current_steps": 180, "total_steps": 672, "loss": 0.5879, "lr": 5e-06, "epoch": 0.8008898776418243, "percentage": 26.79, "elapsed_time": "2:54:42", "remaining_time": "7:57:33"}
{"current_steps": 190, "total_steps": 672, "loss": 0.5897, "lr": 5e-06, "epoch": 0.8453837597330367, "percentage": 28.27, "elapsed_time": "3:04:25", "remaining_time": "7:47:52"}
{"current_steps": 200, "total_steps": 672, "loss": 0.5754, "lr": 5e-06, "epoch": 0.8898776418242491, "percentage": 29.76, "elapsed_time": "3:14:08", "remaining_time": "7:38:11"}
{"current_steps": 210, "total_steps": 672, "loss": 0.5821, "lr": 5e-06, "epoch": 0.9343715239154616, "percentage": 31.25, "elapsed_time": "3:23:50", "remaining_time": "7:28:27"}
{"current_steps": 220, "total_steps": 672, "loss": 0.581, "lr": 5e-06, "epoch": 0.978865406006674, "percentage": 32.74, "elapsed_time": "3:33:32", "remaining_time": "7:18:44"}
{"current_steps": 224, "total_steps": 672, "eval_loss": 0.5854274034500122, "epoch": 0.996662958843159, "percentage": 33.33, "elapsed_time": "3:42:02", "remaining_time": "7:24:05"}
{"current_steps": 230, "total_steps": 672, "loss": 0.5763, "lr": 5e-06, "epoch": 1.0239154616240267, "percentage": 34.23, "elapsed_time": "3:48:29", "remaining_time": "7:19:06"}
{"current_steps": 240, "total_steps": 672, "loss": 0.5449, "lr": 5e-06, "epoch": 1.068409343715239, "percentage": 35.71, "elapsed_time": "3:58:13", "remaining_time": "7:08:47"}
{"current_steps": 250, "total_steps": 672, "loss": 0.5301, "lr": 5e-06, "epoch": 1.1129032258064515, "percentage": 37.2, "elapsed_time": "4:07:57", "remaining_time": "6:58:32"}
{"current_steps": 260, "total_steps": 672, "loss": 0.5374, "lr": 5e-06, "epoch": 1.1573971078976641, "percentage": 38.69, "elapsed_time": "4:17:41", "remaining_time": "6:48:20"}
{"current_steps": 270, "total_steps": 672, "loss": 0.5314, "lr": 5e-06, "epoch": 1.2018909899888766, "percentage": 40.18, "elapsed_time": "4:27:24", "remaining_time": "6:38:09"}
{"current_steps": 280, "total_steps": 672, "loss": 0.5371, "lr": 5e-06, "epoch": 1.246384872080089, "percentage": 41.67, "elapsed_time": "4:37:07", "remaining_time": "6:27:58"}
{"current_steps": 290, "total_steps": 672, "loss": 0.5393, "lr": 5e-06, "epoch": 1.2908787541713014, "percentage": 43.15, "elapsed_time": "4:46:51", "remaining_time": "6:17:51"}
{"current_steps": 300, "total_steps": 672, "loss": 0.5361, "lr": 5e-06, "epoch": 1.3353726362625138, "percentage": 44.64, "elapsed_time": "4:56:34", "remaining_time": "6:07:45"}
{"current_steps": 310, "total_steps": 672, "loss": 0.5353, "lr": 5e-06, "epoch": 1.3798665183537264, "percentage": 46.13, "elapsed_time": "5:06:18", "remaining_time": "5:57:41"}
{"current_steps": 320, "total_steps": 672, "loss": 0.5316, "lr": 5e-06, "epoch": 1.4243604004449388, "percentage": 47.62, "elapsed_time": "5:16:02", "remaining_time": "5:47:38"}
{"current_steps": 330, "total_steps": 672, "loss": 0.5352, "lr": 5e-06, "epoch": 1.4688542825361512, "percentage": 49.11, "elapsed_time": "5:25:47", "remaining_time": "5:37:37"}
{"current_steps": 340, "total_steps": 672, "loss": 0.5415, "lr": 5e-06, "epoch": 1.5133481646273639, "percentage": 50.6, "elapsed_time": "5:35:30", "remaining_time": "5:27:36"}
{"current_steps": 350, "total_steps": 672, "loss": 0.5339, "lr": 5e-06, "epoch": 1.557842046718576, "percentage": 52.08, "elapsed_time": "5:45:14", "remaining_time": "5:17:36"}
{"current_steps": 360, "total_steps": 672, "loss": 0.5295, "lr": 5e-06, "epoch": 1.6023359288097887, "percentage": 53.57, "elapsed_time": "5:54:57", "remaining_time": "5:07:37"}
{"current_steps": 370, "total_steps": 672, "loss": 0.5333, "lr": 5e-06, "epoch": 1.6468298109010011, "percentage": 55.06, "elapsed_time": "6:04:41", "remaining_time": "4:57:40"}
{"current_steps": 380, "total_steps": 672, "loss": 0.5347, "lr": 5e-06, "epoch": 1.6913236929922135, "percentage": 56.55, "elapsed_time": "6:14:26", "remaining_time": "4:47:43"}
{"current_steps": 390, "total_steps": 672, "loss": 0.5338, "lr": 5e-06, "epoch": 1.7358175750834262, "percentage": 58.04, "elapsed_time": "6:24:11", "remaining_time": "4:37:47"}
{"current_steps": 400, "total_steps": 672, "loss": 0.5392, "lr": 5e-06, "epoch": 1.7803114571746383, "percentage": 59.52, "elapsed_time": "6:33:55", "remaining_time": "4:27:52"}
{"current_steps": 410, "total_steps": 672, "loss": 0.52, "lr": 5e-06, "epoch": 1.824805339265851, "percentage": 61.01, "elapsed_time": "6:43:39", "remaining_time": "4:17:57"}
{"current_steps": 420, "total_steps": 672, "loss": 0.5306, "lr": 5e-06, "epoch": 1.8692992213570634, "percentage": 62.5, "elapsed_time": "6:53:23", "remaining_time": "4:08:02"}
{"current_steps": 430, "total_steps": 672, "loss": 0.5369, "lr": 5e-06, "epoch": 1.9137931034482758, "percentage": 63.99, "elapsed_time": "7:03:06", "remaining_time": "3:58:07"}
{"current_steps": 440, "total_steps": 672, "loss": 0.5298, "lr": 5e-06, "epoch": 1.9582869855394884, "percentage": 65.48, "elapsed_time": "7:12:50", "remaining_time": "3:48:13"}
{"current_steps": 449, "total_steps": 672, "eval_loss": 0.5757958889007568, "epoch": 1.9983314794215796, "percentage": 66.82, "elapsed_time": "7:25:45", "remaining_time": "3:41:23"}
{"current_steps": 450, "total_steps": 672, "loss": 0.5412, "lr": 5e-06, "epoch": 2.0033370411568407, "percentage": 66.96, "elapsed_time": "7:27:43", "remaining_time": "3:40:52"}
{"current_steps": 460, "total_steps": 672, "loss": 0.4782, "lr": 5e-06, "epoch": 2.0478309232480534, "percentage": 68.45, "elapsed_time": "7:37:25", "remaining_time": "3:30:48"}
{"current_steps": 470, "total_steps": 672, "loss": 0.4801, "lr": 5e-06, "epoch": 2.092324805339266, "percentage": 69.94, "elapsed_time": "7:47:08", "remaining_time": "3:20:46"}
{"current_steps": 480, "total_steps": 672, "loss": 0.4753, "lr": 5e-06, "epoch": 2.136818687430478, "percentage": 71.43, "elapsed_time": "7:56:48", "remaining_time": "3:10:43"}
{"current_steps": 490, "total_steps": 672, "loss": 0.4844, "lr": 5e-06, "epoch": 2.181312569521691, "percentage": 72.92, "elapsed_time": "8:06:33", "remaining_time": "3:00:43"}
{"current_steps": 500, "total_steps": 672, "loss": 0.4822, "lr": 5e-06, "epoch": 2.225806451612903, "percentage": 74.4, "elapsed_time": "8:16:17", "remaining_time": "2:50:43"}
{"current_steps": 510, "total_steps": 672, "loss": 0.4899, "lr": 5e-06, "epoch": 2.2703003337041157, "percentage": 75.89, "elapsed_time": "8:26:01", "remaining_time": "2:40:44"}
{"current_steps": 520, "total_steps": 672, "loss": 0.4939, "lr": 5e-06, "epoch": 2.3147942157953283, "percentage": 77.38, "elapsed_time": "8:35:43", "remaining_time": "2:30:45"}
{"current_steps": 530, "total_steps": 672, "loss": 0.4835, "lr": 5e-06, "epoch": 2.3592880978865405, "percentage": 78.87, "elapsed_time": "8:45:27", "remaining_time": "2:20:46"}
{"current_steps": 540, "total_steps": 672, "loss": 0.4889, "lr": 5e-06, "epoch": 2.403781979977753, "percentage": 80.36, "elapsed_time": "8:55:10", "remaining_time": "2:10:49"}
{"current_steps": 550, "total_steps": 672, "loss": 0.4865, "lr": 5e-06, "epoch": 2.4482758620689653, "percentage": 81.85, "elapsed_time": "9:04:54", "remaining_time": "2:00:52"}
{"current_steps": 560, "total_steps": 672, "loss": 0.483, "lr": 5e-06, "epoch": 2.492769744160178, "percentage": 83.33, "elapsed_time": "9:14:37", "remaining_time": "1:50:55"}
{"current_steps": 570, "total_steps": 672, "loss": 0.4797, "lr": 5e-06, "epoch": 2.5372636262513906, "percentage": 84.82, "elapsed_time": "9:24:18", "remaining_time": "1:40:58"}
{"current_steps": 580, "total_steps": 672, "loss": 0.477, "lr": 5e-06, "epoch": 2.5817575083426028, "percentage": 86.31, "elapsed_time": "9:34:00", "remaining_time": "1:31:03"}
{"current_steps": 590, "total_steps": 672, "loss": 0.4833, "lr": 5e-06, "epoch": 2.6262513904338154, "percentage": 87.8, "elapsed_time": "9:43:42", "remaining_time": "1:21:07"}
{"current_steps": 600, "total_steps": 672, "loss": 0.4897, "lr": 5e-06, "epoch": 2.6707452725250276, "percentage": 89.29, "elapsed_time": "9:53:25", "remaining_time": "1:11:12"}
{"current_steps": 610, "total_steps": 672, "loss": 0.4893, "lr": 5e-06, "epoch": 2.71523915461624, "percentage": 90.77, "elapsed_time": "10:03:07", "remaining_time": "1:01:18"}
{"current_steps": 620, "total_steps": 672, "loss": 0.4809, "lr": 5e-06, "epoch": 2.759733036707453, "percentage": 92.26, "elapsed_time": "10:12:50", "remaining_time": "0:51:23"}
{"current_steps": 630, "total_steps": 672, "loss": 0.4888, "lr": 5e-06, "epoch": 2.804226918798665, "percentage": 93.75, "elapsed_time": "10:22:30", "remaining_time": "0:41:30"}
{"current_steps": 640, "total_steps": 672, "loss": 0.4844, "lr": 5e-06, "epoch": 2.8487208008898777, "percentage": 95.24, "elapsed_time": "10:32:12", "remaining_time": "0:31:36"}
{"current_steps": 650, "total_steps": 672, "loss": 0.4836, "lr": 5e-06, "epoch": 2.89321468298109, "percentage": 96.73, "elapsed_time": "10:41:54", "remaining_time": "0:21:43"}
{"current_steps": 660, "total_steps": 672, "loss": 0.4916, "lr": 5e-06, "epoch": 2.9377085650723025, "percentage": 98.21, "elapsed_time": "10:51:37", "remaining_time": "0:11:50"}
{"current_steps": 670, "total_steps": 672, "loss": 0.483, "lr": 5e-06, "epoch": 2.982202447163515, "percentage": 99.7, "elapsed_time": "11:01:20", "remaining_time": "0:01:58"}
{"current_steps": 672, "total_steps": 672, "eval_loss": 0.5784014463424683, "epoch": 2.9911012235817576, "percentage": 100.0, "elapsed_time": "11:08:33", "remaining_time": "0:00:00"}
{"current_steps": 672, "total_steps": 672, "epoch": 2.9911012235817576, "percentage": 100.0, "elapsed_time": "11:10:02", "remaining_time": "0:00:00"}