TS-Reasoner-7B / trainer_log.jsonl
ParadiseYu's picture
Upload folder using huggingface_hub
808dbb6 verified
{"current_steps": 1, "total_steps": 780, "loss": 1.3849, "lr": 1.25e-06, "epoch": 0.00256, "percentage": 0.13, "elapsed_time": "0:00:39", "remaining_time": "8:26:54"}
{"current_steps": 2, "total_steps": 780, "loss": 1.4809, "lr": 2.5e-06, "epoch": 0.00512, "percentage": 0.26, "elapsed_time": "0:01:13", "remaining_time": "7:55:30"}
{"current_steps": 3, "total_steps": 780, "loss": 1.3488, "lr": 3.7500000000000005e-06, "epoch": 0.00768, "percentage": 0.38, "elapsed_time": "0:01:47", "remaining_time": "7:44:18"}
{"current_steps": 4, "total_steps": 780, "loss": 1.1901, "lr": 5e-06, "epoch": 0.01024, "percentage": 0.51, "elapsed_time": "0:02:22", "remaining_time": "7:39:41"}
{"current_steps": 5, "total_steps": 780, "loss": 1.1539, "lr": 6.25e-06, "epoch": 0.0128, "percentage": 0.64, "elapsed_time": "0:02:55", "remaining_time": "7:34:16"}
{"current_steps": 6, "total_steps": 780, "loss": 1.0821, "lr": 7.500000000000001e-06, "epoch": 0.01536, "percentage": 0.77, "elapsed_time": "0:03:31", "remaining_time": "7:34:16"}
{"current_steps": 7, "total_steps": 780, "loss": 0.9753, "lr": 8.750000000000001e-06, "epoch": 0.01792, "percentage": 0.9, "elapsed_time": "0:04:06", "remaining_time": "7:33:21"}
{"current_steps": 8, "total_steps": 780, "loss": 0.9717, "lr": 1e-05, "epoch": 0.02048, "percentage": 1.03, "elapsed_time": "0:04:43", "remaining_time": "7:35:21"}
{"current_steps": 9, "total_steps": 780, "loss": 0.9383, "lr": 1.125e-05, "epoch": 0.02304, "percentage": 1.15, "elapsed_time": "0:05:18", "remaining_time": "7:34:55"}
{"current_steps": 10, "total_steps": 780, "loss": 1.0224, "lr": 1.25e-05, "epoch": 0.0256, "percentage": 1.28, "elapsed_time": "0:05:52", "remaining_time": "7:32:17"}
{"current_steps": 11, "total_steps": 780, "loss": 0.8981, "lr": 1.375e-05, "epoch": 0.02816, "percentage": 1.41, "elapsed_time": "0:06:28", "remaining_time": "7:32:34"}
{"current_steps": 12, "total_steps": 780, "loss": 0.9254, "lr": 1.5000000000000002e-05, "epoch": 0.03072, "percentage": 1.54, "elapsed_time": "0:07:05", "remaining_time": "7:33:26"}
{"current_steps": 13, "total_steps": 780, "loss": 0.839, "lr": 1.6250000000000002e-05, "epoch": 0.03328, "percentage": 1.67, "elapsed_time": "0:07:38", "remaining_time": "7:30:43"}
{"current_steps": 14, "total_steps": 780, "loss": 0.8211, "lr": 1.7500000000000002e-05, "epoch": 0.03584, "percentage": 1.79, "elapsed_time": "0:08:12", "remaining_time": "7:28:59"}
{"current_steps": 15, "total_steps": 780, "loss": 0.7587, "lr": 1.8750000000000002e-05, "epoch": 0.0384, "percentage": 1.92, "elapsed_time": "0:08:47", "remaining_time": "7:28:36"}
{"current_steps": 16, "total_steps": 780, "loss": 0.8149, "lr": 2e-05, "epoch": 0.04096, "percentage": 2.05, "elapsed_time": "0:09:21", "remaining_time": "7:26:31"}
{"current_steps": 17, "total_steps": 780, "loss": 0.7836, "lr": 1.9999915456072218e-05, "epoch": 0.04352, "percentage": 2.18, "elapsed_time": "0:09:57", "remaining_time": "7:27:06"}
{"current_steps": 18, "total_steps": 780, "loss": 0.8128, "lr": 1.9999661825718408e-05, "epoch": 0.04608, "percentage": 2.31, "elapsed_time": "0:10:31", "remaining_time": "7:25:33"}
{"current_steps": 19, "total_steps": 780, "loss": 0.7667, "lr": 1.9999239113227146e-05, "epoch": 0.04864, "percentage": 2.44, "elapsed_time": "0:11:08", "remaining_time": "7:25:57"}
{"current_steps": 20, "total_steps": 780, "loss": 0.7523, "lr": 1.9998647325745995e-05, "epoch": 0.0512, "percentage": 2.56, "elapsed_time": "0:11:42", "remaining_time": "7:24:41"}
{"current_steps": 21, "total_steps": 780, "loss": 0.7988, "lr": 1.9997886473281355e-05, "epoch": 0.05376, "percentage": 2.69, "elapsed_time": "0:12:17", "remaining_time": "7:24:30"}
{"current_steps": 22, "total_steps": 780, "loss": 0.7527, "lr": 1.9996956568698325e-05, "epoch": 0.05632, "percentage": 2.82, "elapsed_time": "0:12:52", "remaining_time": "7:23:47"}
{"current_steps": 23, "total_steps": 780, "loss": 0.7438, "lr": 1.9995857627720456e-05, "epoch": 0.05888, "percentage": 2.95, "elapsed_time": "0:13:27", "remaining_time": "7:22:45"}
{"current_steps": 24, "total_steps": 780, "loss": 0.7248, "lr": 1.99945896689295e-05, "epoch": 0.06144, "percentage": 3.08, "elapsed_time": "0:14:00", "remaining_time": "7:21:04"}
{"current_steps": 25, "total_steps": 780, "loss": 0.6776, "lr": 1.9993152713765116e-05, "epoch": 0.064, "percentage": 3.21, "elapsed_time": "0:14:34", "remaining_time": "7:20:04"}
{"current_steps": 26, "total_steps": 780, "loss": 0.8218, "lr": 1.999154678652446e-05, "epoch": 0.06656, "percentage": 3.33, "elapsed_time": "0:15:10", "remaining_time": "7:20:15"}
{"current_steps": 27, "total_steps": 780, "loss": 0.7429, "lr": 1.998977191436181e-05, "epoch": 0.06912, "percentage": 3.46, "elapsed_time": "0:15:45", "remaining_time": "7:19:17"}
{"current_steps": 28, "total_steps": 780, "loss": 0.6964, "lr": 1.9987828127288105e-05, "epoch": 0.07168, "percentage": 3.59, "elapsed_time": "0:16:18", "remaining_time": "7:18:11"}
{"current_steps": 29, "total_steps": 780, "loss": 0.7901, "lr": 1.998571545817042e-05, "epoch": 0.07424, "percentage": 3.72, "elapsed_time": "0:16:52", "remaining_time": "7:16:53"}
{"current_steps": 30, "total_steps": 780, "loss": 0.6802, "lr": 1.9983433942731427e-05, "epoch": 0.0768, "percentage": 3.85, "elapsed_time": "0:17:27", "remaining_time": "7:16:28"}
{"current_steps": 31, "total_steps": 780, "loss": 0.7918, "lr": 1.998098361954878e-05, "epoch": 0.07936, "percentage": 3.97, "elapsed_time": "0:18:01", "remaining_time": "7:15:27"}
{"current_steps": 32, "total_steps": 780, "loss": 0.7565, "lr": 1.9978364530054465e-05, "epoch": 0.08192, "percentage": 4.1, "elapsed_time": "0:18:35", "remaining_time": "7:14:41"}
{"current_steps": 33, "total_steps": 780, "loss": 0.6984, "lr": 1.9975576718534105e-05, "epoch": 0.08448, "percentage": 4.23, "elapsed_time": "0:19:11", "remaining_time": "7:14:28"}
{"current_steps": 34, "total_steps": 780, "loss": 0.711, "lr": 1.9972620232126215e-05, "epoch": 0.08704, "percentage": 4.36, "elapsed_time": "0:19:46", "remaining_time": "7:13:44"}
{"current_steps": 35, "total_steps": 780, "loss": 0.7398, "lr": 1.996949512082138e-05, "epoch": 0.0896, "percentage": 4.49, "elapsed_time": "0:20:20", "remaining_time": "7:13:03"}
{"current_steps": 36, "total_steps": 780, "loss": 0.7466, "lr": 1.996620143746144e-05, "epoch": 0.09216, "percentage": 4.62, "elapsed_time": "0:20:56", "remaining_time": "7:12:54"}
{"current_steps": 37, "total_steps": 780, "loss": 0.7701, "lr": 1.9962739237738585e-05, "epoch": 0.09472, "percentage": 4.74, "elapsed_time": "0:21:31", "remaining_time": "7:12:13"}
{"current_steps": 38, "total_steps": 780, "loss": 0.765, "lr": 1.9959108580194403e-05, "epoch": 0.09728, "percentage": 4.87, "elapsed_time": "0:22:06", "remaining_time": "7:11:41"}
{"current_steps": 39, "total_steps": 780, "loss": 0.7029, "lr": 1.9955309526218903e-05, "epoch": 0.09984, "percentage": 5.0, "elapsed_time": "0:22:41", "remaining_time": "7:11:09"}
{"current_steps": 40, "total_steps": 780, "loss": 0.7248, "lr": 1.9951342140049483e-05, "epoch": 0.1024, "percentage": 5.13, "elapsed_time": "0:23:16", "remaining_time": "7:10:35"}
{"current_steps": 41, "total_steps": 780, "loss": 0.7326, "lr": 1.9947206488769812e-05, "epoch": 0.10496, "percentage": 5.26, "elapsed_time": "0:23:49", "remaining_time": "7:09:34"}
{"current_steps": 42, "total_steps": 780, "loss": 0.6941, "lr": 1.9942902642308737e-05, "epoch": 0.10752, "percentage": 5.38, "elapsed_time": "0:24:24", "remaining_time": "7:08:49"}
{"current_steps": 43, "total_steps": 780, "loss": 0.7328, "lr": 1.9938430673439075e-05, "epoch": 0.11008, "percentage": 5.51, "elapsed_time": "0:25:00", "remaining_time": "7:08:39"}
{"current_steps": 44, "total_steps": 780, "loss": 0.6695, "lr": 1.993379065777639e-05, "epoch": 0.11264, "percentage": 5.64, "elapsed_time": "0:25:35", "remaining_time": "7:08:04"}
{"current_steps": 45, "total_steps": 780, "loss": 0.6808, "lr": 1.9928982673777707e-05, "epoch": 0.1152, "percentage": 5.77, "elapsed_time": "0:26:09", "remaining_time": "7:07:08"}
{"current_steps": 46, "total_steps": 780, "loss": 0.692, "lr": 1.9924006802740203e-05, "epoch": 0.11776, "percentage": 5.9, "elapsed_time": "0:26:42", "remaining_time": "7:06:17"}
{"current_steps": 47, "total_steps": 780, "loss": 0.7251, "lr": 1.9918863128799805e-05, "epoch": 0.12032, "percentage": 6.03, "elapsed_time": "0:27:17", "remaining_time": "7:05:33"}
{"current_steps": 48, "total_steps": 780, "loss": 0.734, "lr": 1.9913551738929803e-05, "epoch": 0.12288, "percentage": 6.15, "elapsed_time": "0:27:51", "remaining_time": "7:04:50"}
{"current_steps": 49, "total_steps": 780, "loss": 0.6667, "lr": 1.9908072722939344e-05, "epoch": 0.12544, "percentage": 6.28, "elapsed_time": "0:28:25", "remaining_time": "7:04:02"}
{"current_steps": 50, "total_steps": 780, "loss": 0.7766, "lr": 1.9902426173471933e-05, "epoch": 0.128, "percentage": 6.41, "elapsed_time": "0:29:01", "remaining_time": "7:03:50"}
{"current_steps": 51, "total_steps": 780, "loss": 0.7355, "lr": 1.9896612186003866e-05, "epoch": 0.13056, "percentage": 6.54, "elapsed_time": "0:29:38", "remaining_time": "7:03:47"}
{"current_steps": 52, "total_steps": 780, "loss": 0.6743, "lr": 1.9890630858842614e-05, "epoch": 0.13312, "percentage": 6.67, "elapsed_time": "0:30:14", "remaining_time": "7:03:16"}
{"current_steps": 53, "total_steps": 780, "loss": 0.6261, "lr": 1.988448229312515e-05, "epoch": 0.13568, "percentage": 6.79, "elapsed_time": "0:30:48", "remaining_time": "7:02:41"}
{"current_steps": 54, "total_steps": 780, "loss": 0.7783, "lr": 1.9878166592816255e-05, "epoch": 0.13824, "percentage": 6.92, "elapsed_time": "0:31:23", "remaining_time": "7:02:09"}
{"current_steps": 55, "total_steps": 780, "loss": 0.6444, "lr": 1.9871683864706752e-05, "epoch": 0.1408, "percentage": 7.05, "elapsed_time": "0:31:58", "remaining_time": "7:01:32"}
{"current_steps": 56, "total_steps": 780, "loss": 0.6984, "lr": 1.9865034218411698e-05, "epoch": 0.14336, "percentage": 7.18, "elapsed_time": "0:32:33", "remaining_time": "7:00:56"}
{"current_steps": 57, "total_steps": 780, "loss": 0.7365, "lr": 1.9858217766368538e-05, "epoch": 0.14592, "percentage": 7.31, "elapsed_time": "0:33:08", "remaining_time": "7:00:21"}
{"current_steps": 58, "total_steps": 780, "loss": 0.7668, "lr": 1.98512346238352e-05, "epoch": 0.14848, "percentage": 7.44, "elapsed_time": "0:33:43", "remaining_time": "6:59:44"}
{"current_steps": 59, "total_steps": 780, "loss": 0.6806, "lr": 1.984408490888814e-05, "epoch": 0.15104, "percentage": 7.56, "elapsed_time": "0:34:17", "remaining_time": "6:59:06"}
{"current_steps": 60, "total_steps": 780, "loss": 0.7316, "lr": 1.9836768742420355e-05, "epoch": 0.1536, "percentage": 7.69, "elapsed_time": "0:34:52", "remaining_time": "6:58:24"}
{"current_steps": 61, "total_steps": 780, "loss": 0.8413, "lr": 1.9829286248139334e-05, "epoch": 0.15616, "percentage": 7.82, "elapsed_time": "0:35:27", "remaining_time": "6:57:51"}
{"current_steps": 62, "total_steps": 780, "loss": 0.7118, "lr": 1.9821637552564973e-05, "epoch": 0.15872, "percentage": 7.95, "elapsed_time": "0:36:03", "remaining_time": "6:57:36"}
{"current_steps": 63, "total_steps": 780, "loss": 0.8131, "lr": 1.9813822785027422e-05, "epoch": 0.16128, "percentage": 8.08, "elapsed_time": "0:36:36", "remaining_time": "6:56:34"}
{"current_steps": 64, "total_steps": 780, "loss": 0.7301, "lr": 1.9805842077664913e-05, "epoch": 0.16384, "percentage": 8.21, "elapsed_time": "0:37:11", "remaining_time": "6:56:05"}
{"current_steps": 65, "total_steps": 780, "loss": 0.7323, "lr": 1.9797695565421507e-05, "epoch": 0.1664, "percentage": 8.33, "elapsed_time": "0:37:45", "remaining_time": "6:55:17"}
{"current_steps": 66, "total_steps": 780, "loss": 0.6715, "lr": 1.978938338604484e-05, "epoch": 0.16896, "percentage": 8.46, "elapsed_time": "0:38:21", "remaining_time": "6:54:52"}
{"current_steps": 67, "total_steps": 780, "loss": 0.685, "lr": 1.978090568008377e-05, "epoch": 0.17152, "percentage": 8.59, "elapsed_time": "0:38:55", "remaining_time": "6:54:13"}
{"current_steps": 68, "total_steps": 780, "loss": 0.6869, "lr": 1.9772262590886006e-05, "epoch": 0.17408, "percentage": 8.72, "elapsed_time": "0:39:29", "remaining_time": "6:53:26"}
{"current_steps": 69, "total_steps": 780, "loss": 0.8062, "lr": 1.9763454264595694e-05, "epoch": 0.17664, "percentage": 8.85, "elapsed_time": "0:40:04", "remaining_time": "6:53:00"}
{"current_steps": 70, "total_steps": 780, "loss": 0.727, "lr": 1.975448085015093e-05, "epoch": 0.1792, "percentage": 8.97, "elapsed_time": "0:40:41", "remaining_time": "6:52:44"}
{"current_steps": 71, "total_steps": 780, "loss": 0.7087, "lr": 1.9745342499281254e-05, "epoch": 0.18176, "percentage": 9.1, "elapsed_time": "0:41:17", "remaining_time": "6:52:23"}
{"current_steps": 72, "total_steps": 780, "loss": 0.6602, "lr": 1.9736039366505087e-05, "epoch": 0.18432, "percentage": 9.23, "elapsed_time": "0:41:51", "remaining_time": "6:51:38"}
{"current_steps": 73, "total_steps": 780, "loss": 0.7275, "lr": 1.9726571609127097e-05, "epoch": 0.18688, "percentage": 9.36, "elapsed_time": "0:42:27", "remaining_time": "6:51:12"}
{"current_steps": 74, "total_steps": 780, "loss": 0.6976, "lr": 1.9716939387235573e-05, "epoch": 0.18944, "percentage": 9.49, "elapsed_time": "0:43:01", "remaining_time": "6:50:32"}
{"current_steps": 75, "total_steps": 780, "loss": 0.6665, "lr": 1.9707142863699687e-05, "epoch": 0.192, "percentage": 9.62, "elapsed_time": "0:43:36", "remaining_time": "6:49:53"}
{"current_steps": 76, "total_steps": 780, "loss": 0.6817, "lr": 1.969718220416675e-05, "epoch": 0.19456, "percentage": 9.74, "elapsed_time": "0:44:12", "remaining_time": "6:49:27"}
{"current_steps": 77, "total_steps": 780, "loss": 0.7231, "lr": 1.9687057577059422e-05, "epoch": 0.19712, "percentage": 9.87, "elapsed_time": "0:44:47", "remaining_time": "6:48:52"}
{"current_steps": 78, "total_steps": 780, "loss": 0.6697, "lr": 1.9676769153572853e-05, "epoch": 0.19968, "percentage": 10.0, "elapsed_time": "0:45:22", "remaining_time": "6:48:26"}
{"current_steps": 79, "total_steps": 780, "loss": 0.6854, "lr": 1.966631710767178e-05, "epoch": 0.20224, "percentage": 10.13, "elapsed_time": "0:45:59", "remaining_time": "6:48:02"}
{"current_steps": 80, "total_steps": 780, "loss": 0.6902, "lr": 1.965570161608762e-05, "epoch": 0.2048, "percentage": 10.26, "elapsed_time": "0:46:34", "remaining_time": "6:47:28"}
{"current_steps": 81, "total_steps": 780, "loss": 0.6949, "lr": 1.9644922858315432e-05, "epoch": 0.20736, "percentage": 10.38, "elapsed_time": "0:47:08", "remaining_time": "6:46:51"}
{"current_steps": 82, "total_steps": 780, "loss": 0.6668, "lr": 1.9633981016610926e-05, "epoch": 0.20992, "percentage": 10.51, "elapsed_time": "0:47:42", "remaining_time": "6:46:09"}
{"current_steps": 83, "total_steps": 780, "loss": 0.7303, "lr": 1.9622876275987355e-05, "epoch": 0.21248, "percentage": 10.64, "elapsed_time": "0:48:17", "remaining_time": "6:45:28"}
{"current_steps": 84, "total_steps": 780, "loss": 0.7113, "lr": 1.9611608824212395e-05, "epoch": 0.21504, "percentage": 10.77, "elapsed_time": "0:48:50", "remaining_time": "6:44:45"}
{"current_steps": 85, "total_steps": 780, "loss": 0.7382, "lr": 1.9600178851804977e-05, "epoch": 0.2176, "percentage": 10.9, "elapsed_time": "0:49:26", "remaining_time": "6:44:14"}
{"current_steps": 86, "total_steps": 780, "loss": 0.6784, "lr": 1.958858655203205e-05, "epoch": 0.22016, "percentage": 11.03, "elapsed_time": "0:50:00", "remaining_time": "6:43:34"}
{"current_steps": 87, "total_steps": 780, "loss": 0.7523, "lr": 1.9576832120905323e-05, "epoch": 0.22272, "percentage": 11.15, "elapsed_time": "0:50:35", "remaining_time": "6:43:03"}
{"current_steps": 88, "total_steps": 780, "loss": 0.6191, "lr": 1.9564915757177955e-05, "epoch": 0.22528, "percentage": 11.28, "elapsed_time": "0:51:11", "remaining_time": "6:42:32"}
{"current_steps": 89, "total_steps": 780, "loss": 0.6708, "lr": 1.9552837662341182e-05, "epoch": 0.22784, "percentage": 11.41, "elapsed_time": "0:51:46", "remaining_time": "6:42:02"}
{"current_steps": 90, "total_steps": 780, "loss": 0.677, "lr": 1.954059804062092e-05, "epoch": 0.2304, "percentage": 11.54, "elapsed_time": "0:52:23", "remaining_time": "6:41:41"}
{"current_steps": 91, "total_steps": 780, "loss": 0.6866, "lr": 1.952819709897431e-05, "epoch": 0.23296, "percentage": 11.67, "elapsed_time": "0:52:59", "remaining_time": "6:41:12"}
{"current_steps": 92, "total_steps": 780, "loss": 0.5733, "lr": 1.951563504708622e-05, "epoch": 0.23552, "percentage": 11.79, "elapsed_time": "0:53:34", "remaining_time": "6:40:39"}
{"current_steps": 93, "total_steps": 780, "loss": 0.6838, "lr": 1.9502912097365677e-05, "epoch": 0.23808, "percentage": 11.92, "elapsed_time": "0:54:10", "remaining_time": "6:40:09"}
{"current_steps": 94, "total_steps": 780, "loss": 0.6759, "lr": 1.9490028464942322e-05, "epoch": 0.24064, "percentage": 12.05, "elapsed_time": "0:54:44", "remaining_time": "6:39:31"}
{"current_steps": 95, "total_steps": 780, "loss": 0.6187, "lr": 1.9476984367662724e-05, "epoch": 0.2432, "percentage": 12.18, "elapsed_time": "0:55:18", "remaining_time": "6:38:44"}
{"current_steps": 96, "total_steps": 780, "loss": 0.7569, "lr": 1.9463780026086735e-05, "epoch": 0.24576, "percentage": 12.31, "elapsed_time": "0:55:52", "remaining_time": "6:38:09"}
{"current_steps": 97, "total_steps": 780, "loss": 0.6306, "lr": 1.9450415663483734e-05, "epoch": 0.24832, "percentage": 12.44, "elapsed_time": "0:56:28", "remaining_time": "6:37:36"}
{"current_steps": 98, "total_steps": 780, "loss": 0.743, "lr": 1.9436891505828854e-05, "epoch": 0.25088, "percentage": 12.56, "elapsed_time": "0:57:04", "remaining_time": "6:37:10"}
{"current_steps": 99, "total_steps": 780, "loss": 0.6156, "lr": 1.9423207781799186e-05, "epoch": 0.25344, "percentage": 12.69, "elapsed_time": "0:57:39", "remaining_time": "6:36:35"}
{"current_steps": 100, "total_steps": 780, "loss": 0.6749, "lr": 1.9409364722769882e-05, "epoch": 0.256, "percentage": 12.82, "elapsed_time": "0:58:14", "remaining_time": "6:36:01"}
{"current_steps": 101, "total_steps": 780, "loss": 0.7428, "lr": 1.939536256281026e-05, "epoch": 0.25856, "percentage": 12.95, "elapsed_time": "0:58:48", "remaining_time": "6:35:21"}
{"current_steps": 102, "total_steps": 780, "loss": 0.7159, "lr": 1.938120153867983e-05, "epoch": 0.26112, "percentage": 13.08, "elapsed_time": "0:59:23", "remaining_time": "6:34:46"}
{"current_steps": 103, "total_steps": 780, "loss": 0.7103, "lr": 1.936688188982433e-05, "epoch": 0.26368, "percentage": 13.21, "elapsed_time": "0:59:57", "remaining_time": "6:34:06"}
{"current_steps": 104, "total_steps": 780, "loss": 0.6595, "lr": 1.9352403858371618e-05, "epoch": 0.26624, "percentage": 13.33, "elapsed_time": "1:00:33", "remaining_time": "6:33:40"}
{"current_steps": 105, "total_steps": 780, "loss": 0.6411, "lr": 1.9337767689127628e-05, "epoch": 0.2688, "percentage": 13.46, "elapsed_time": "1:01:08", "remaining_time": "6:33:04"}
{"current_steps": 106, "total_steps": 780, "loss": 0.6819, "lr": 1.9322973629572207e-05, "epoch": 0.27136, "percentage": 13.59, "elapsed_time": "1:01:44", "remaining_time": "6:32:32"}
{"current_steps": 107, "total_steps": 780, "loss": 0.6587, "lr": 1.9308021929854934e-05, "epoch": 0.27392, "percentage": 13.72, "elapsed_time": "1:02:20", "remaining_time": "6:32:06"}
{"current_steps": 108, "total_steps": 780, "loss": 0.7157, "lr": 1.9292912842790893e-05, "epoch": 0.27648, "percentage": 13.85, "elapsed_time": "1:02:54", "remaining_time": "6:31:28"}
{"current_steps": 109, "total_steps": 780, "loss": 0.6943, "lr": 1.92776466238564e-05, "epoch": 0.27904, "percentage": 13.97, "elapsed_time": "1:03:30", "remaining_time": "6:30:58"}
{"current_steps": 110, "total_steps": 780, "loss": 0.6259, "lr": 1.9262223531184678e-05, "epoch": 0.2816, "percentage": 14.1, "elapsed_time": "1:04:05", "remaining_time": "6:30:23"}
{"current_steps": 111, "total_steps": 780, "loss": 0.6057, "lr": 1.924664382556149e-05, "epoch": 0.28416, "percentage": 14.23, "elapsed_time": "1:04:39", "remaining_time": "6:29:39"}
{"current_steps": 112, "total_steps": 780, "loss": 0.6625, "lr": 1.9230907770420737e-05, "epoch": 0.28672, "percentage": 14.36, "elapsed_time": "1:05:14", "remaining_time": "6:29:04"}
{"current_steps": 113, "total_steps": 780, "loss": 0.6164, "lr": 1.9215015631840005e-05, "epoch": 0.28928, "percentage": 14.49, "elapsed_time": "1:05:48", "remaining_time": "6:28:27"}
{"current_steps": 114, "total_steps": 780, "loss": 0.6616, "lr": 1.9198967678536054e-05, "epoch": 0.29184, "percentage": 14.62, "elapsed_time": "1:06:25", "remaining_time": "6:28:01"}
{"current_steps": 115, "total_steps": 780, "loss": 0.6494, "lr": 1.918276418186028e-05, "epoch": 0.2944, "percentage": 14.74, "elapsed_time": "1:07:00", "remaining_time": "6:27:27"}
{"current_steps": 116, "total_steps": 780, "loss": 0.65, "lr": 1.916640541579415e-05, "epoch": 0.29696, "percentage": 14.87, "elapsed_time": "1:07:34", "remaining_time": "6:26:49"}
{"current_steps": 117, "total_steps": 780, "loss": 0.6374, "lr": 1.9149891656944513e-05, "epoch": 0.29952, "percentage": 15.0, "elapsed_time": "1:08:09", "remaining_time": "6:26:13"}
{"current_steps": 118, "total_steps": 780, "loss": 0.699, "lr": 1.913322318453899e-05, "epoch": 0.30208, "percentage": 15.13, "elapsed_time": "1:08:43", "remaining_time": "6:25:32"}
{"current_steps": 119, "total_steps": 780, "loss": 0.6088, "lr": 1.9116400280421196e-05, "epoch": 0.30464, "percentage": 15.26, "elapsed_time": "1:09:19", "remaining_time": "6:25:04"}
{"current_steps": 120, "total_steps": 780, "loss": 0.752, "lr": 1.9099423229046015e-05, "epoch": 0.3072, "percentage": 15.38, "elapsed_time": "1:09:54", "remaining_time": "6:24:27"}
{"current_steps": 121, "total_steps": 780, "loss": 0.6185, "lr": 1.9082292317474766e-05, "epoch": 0.30976, "percentage": 15.51, "elapsed_time": "1:10:29", "remaining_time": "6:23:52"}
{"current_steps": 122, "total_steps": 780, "loss": 0.7374, "lr": 1.9065007835370358e-05, "epoch": 0.31232, "percentage": 15.64, "elapsed_time": "1:11:06", "remaining_time": "6:23:32"}
{"current_steps": 123, "total_steps": 780, "loss": 0.672, "lr": 1.90475700749924e-05, "epoch": 0.31488, "percentage": 15.77, "elapsed_time": "1:11:40", "remaining_time": "6:22:51"}
{"current_steps": 124, "total_steps": 780, "loss": 0.7168, "lr": 1.902997933119223e-05, "epoch": 0.31744, "percentage": 15.9, "elapsed_time": "1:12:14", "remaining_time": "6:22:11"}
{"current_steps": 125, "total_steps": 780, "loss": 0.6724, "lr": 1.9012235901407976e-05, "epoch": 0.32, "percentage": 16.03, "elapsed_time": "1:12:49", "remaining_time": "6:21:35"}
{"current_steps": 126, "total_steps": 780, "loss": 0.6165, "lr": 1.8994340085659474e-05, "epoch": 0.32256, "percentage": 16.15, "elapsed_time": "1:13:24", "remaining_time": "6:21:03"}
{"current_steps": 127, "total_steps": 780, "loss": 0.6733, "lr": 1.897629218654325e-05, "epoch": 0.32512, "percentage": 16.28, "elapsed_time": "1:14:00", "remaining_time": "6:20:32"}
{"current_steps": 128, "total_steps": 780, "loss": 0.6036, "lr": 1.8958092509227347e-05, "epoch": 0.32768, "percentage": 16.41, "elapsed_time": "1:14:35", "remaining_time": "6:19:59"}
{"current_steps": 129, "total_steps": 780, "loss": 0.581, "lr": 1.8939741361446207e-05, "epoch": 0.33024, "percentage": 16.54, "elapsed_time": "1:15:12", "remaining_time": "6:19:33"}
{"current_steps": 130, "total_steps": 780, "loss": 0.7016, "lr": 1.8921239053495465e-05, "epoch": 0.3328, "percentage": 16.67, "elapsed_time": "1:15:47", "remaining_time": "6:18:55"}
{"current_steps": 131, "total_steps": 780, "loss": 0.6983, "lr": 1.8902585898226663e-05, "epoch": 0.33536, "percentage": 16.79, "elapsed_time": "1:16:23", "remaining_time": "6:18:27"}
{"current_steps": 132, "total_steps": 780, "loss": 0.724, "lr": 1.888378221104201e-05, "epoch": 0.33792, "percentage": 16.92, "elapsed_time": "1:16:57", "remaining_time": "6:17:47"}
{"current_steps": 133, "total_steps": 780, "loss": 0.6245, "lr": 1.8864828309889022e-05, "epoch": 0.34048, "percentage": 17.05, "elapsed_time": "1:17:32", "remaining_time": "6:17:14"}
{"current_steps": 134, "total_steps": 780, "loss": 0.6611, "lr": 1.8845724515255147e-05, "epoch": 0.34304, "percentage": 17.18, "elapsed_time": "1:18:07", "remaining_time": "6:16:39"}
{"current_steps": 135, "total_steps": 780, "loss": 0.6202, "lr": 1.8826471150162354e-05, "epoch": 0.3456, "percentage": 17.31, "elapsed_time": "1:18:43", "remaining_time": "6:16:05"}
{"current_steps": 136, "total_steps": 780, "loss": 0.714, "lr": 1.880706854016166e-05, "epoch": 0.34816, "percentage": 17.44, "elapsed_time": "1:19:16", "remaining_time": "6:15:24"}
{"current_steps": 137, "total_steps": 780, "loss": 0.6921, "lr": 1.8787517013327642e-05, "epoch": 0.35072, "percentage": 17.56, "elapsed_time": "1:19:50", "remaining_time": "6:14:46"}
{"current_steps": 138, "total_steps": 780, "loss": 0.6242, "lr": 1.876781690025287e-05, "epoch": 0.35328, "percentage": 17.69, "elapsed_time": "1:20:25", "remaining_time": "6:14:09"}
{"current_steps": 139, "total_steps": 780, "loss": 0.685, "lr": 1.8747968534042333e-05, "epoch": 0.35584, "percentage": 17.82, "elapsed_time": "1:21:01", "remaining_time": "6:13:37"}
{"current_steps": 140, "total_steps": 780, "loss": 0.6191, "lr": 1.87279722503078e-05, "epoch": 0.3584, "percentage": 17.95, "elapsed_time": "1:21:36", "remaining_time": "6:13:03"}
{"current_steps": 141, "total_steps": 780, "loss": 0.6209, "lr": 1.8707828387162145e-05, "epoch": 0.36096, "percentage": 18.08, "elapsed_time": "1:22:12", "remaining_time": "6:12:34"}
{"current_steps": 142, "total_steps": 780, "loss": 0.6007, "lr": 1.8687537285213627e-05, "epoch": 0.36352, "percentage": 18.21, "elapsed_time": "1:22:46", "remaining_time": "6:11:56"}
{"current_steps": 143, "total_steps": 780, "loss": 0.6939, "lr": 1.866709928756014e-05, "epoch": 0.36608, "percentage": 18.33, "elapsed_time": "1:23:20", "remaining_time": "6:11:16"}
{"current_steps": 144, "total_steps": 780, "loss": 0.6719, "lr": 1.8646514739783404e-05, "epoch": 0.36864, "percentage": 18.46, "elapsed_time": "1:23:56", "remaining_time": "6:10:43"}
{"current_steps": 145, "total_steps": 780, "loss": 0.6735, "lr": 1.8625783989943124e-05, "epoch": 0.3712, "percentage": 18.59, "elapsed_time": "1:24:32", "remaining_time": "6:10:14"}
{"current_steps": 146, "total_steps": 780, "loss": 0.6737, "lr": 1.8604907388571097e-05, "epoch": 0.37376, "percentage": 18.72, "elapsed_time": "1:25:09", "remaining_time": "6:09:47"}
{"current_steps": 147, "total_steps": 780, "loss": 0.7013, "lr": 1.8583885288665307e-05, "epoch": 0.37632, "percentage": 18.85, "elapsed_time": "1:25:44", "remaining_time": "6:09:11"}
{"current_steps": 148, "total_steps": 780, "loss": 0.6418, "lr": 1.8562718045683933e-05, "epoch": 0.37888, "percentage": 18.97, "elapsed_time": "1:26:18", "remaining_time": "6:08:32"}
{"current_steps": 149, "total_steps": 780, "loss": 0.6588, "lr": 1.854140601753934e-05, "epoch": 0.38144, "percentage": 19.1, "elapsed_time": "1:26:53", "remaining_time": "6:07:59"}
{"current_steps": 150, "total_steps": 780, "loss": 0.6395, "lr": 1.8519949564592047e-05, "epoch": 0.384, "percentage": 19.23, "elapsed_time": "1:27:29", "remaining_time": "6:07:27"}
{"current_steps": 151, "total_steps": 780, "loss": 0.7024, "lr": 1.8498349049644614e-05, "epoch": 0.38656, "percentage": 19.36, "elapsed_time": "1:28:03", "remaining_time": "6:06:49"}
{"current_steps": 152, "total_steps": 780, "loss": 0.6104, "lr": 1.8476604837935515e-05, "epoch": 0.38912, "percentage": 19.49, "elapsed_time": "1:28:37", "remaining_time": "6:06:08"}
{"current_steps": 153, "total_steps": 780, "loss": 0.6368, "lr": 1.8454717297132966e-05, "epoch": 0.39168, "percentage": 19.62, "elapsed_time": "1:29:12", "remaining_time": "6:05:34"}
{"current_steps": 154, "total_steps": 780, "loss": 0.7267, "lr": 1.8432686797328697e-05, "epoch": 0.39424, "percentage": 19.74, "elapsed_time": "1:29:49", "remaining_time": "6:05:06"}
{"current_steps": 155, "total_steps": 780, "loss": 0.6158, "lr": 1.8410513711031713e-05, "epoch": 0.3968, "percentage": 19.87, "elapsed_time": "1:30:25", "remaining_time": "6:04:35"}
{"current_steps": 156, "total_steps": 780, "loss": 0.5699, "lr": 1.8388198413161962e-05, "epoch": 0.39936, "percentage": 20.0, "elapsed_time": "1:30:59", "remaining_time": "6:03:59"}
{"current_steps": 157, "total_steps": 780, "loss": 0.6232, "lr": 1.8365741281044046e-05, "epoch": 0.40192, "percentage": 20.13, "elapsed_time": "1:31:33", "remaining_time": "6:03:18"}
{"current_steps": 158, "total_steps": 780, "loss": 0.6156, "lr": 1.8343142694400784e-05, "epoch": 0.40448, "percentage": 20.26, "elapsed_time": "1:32:08", "remaining_time": "6:02:43"}
{"current_steps": 159, "total_steps": 780, "loss": 0.7054, "lr": 1.8320403035346834e-05, "epoch": 0.40704, "percentage": 20.38, "elapsed_time": "1:32:44", "remaining_time": "6:02:11"}
{"current_steps": 160, "total_steps": 780, "loss": 0.6445, "lr": 1.829752268838222e-05, "epoch": 0.4096, "percentage": 20.51, "elapsed_time": "1:33:18", "remaining_time": "6:01:34"}
{"current_steps": 161, "total_steps": 780, "loss": 0.5156, "lr": 1.8274502040385814e-05, "epoch": 0.41216, "percentage": 20.64, "elapsed_time": "1:33:53", "remaining_time": "6:01:01"}
{"current_steps": 162, "total_steps": 780, "loss": 0.6786, "lr": 1.8251341480608823e-05, "epoch": 0.41472, "percentage": 20.77, "elapsed_time": "1:34:28", "remaining_time": "6:00:23"}
{"current_steps": 163, "total_steps": 780, "loss": 0.6856, "lr": 1.8228041400668185e-05, "epoch": 0.41728, "percentage": 20.9, "elapsed_time": "1:35:03", "remaining_time": "5:59:48"}
{"current_steps": 164, "total_steps": 780, "loss": 0.6883, "lr": 1.8204602194539948e-05, "epoch": 0.41984, "percentage": 21.03, "elapsed_time": "1:35:38", "remaining_time": "5:59:12"}
{"current_steps": 165, "total_steps": 780, "loss": 0.651, "lr": 1.8181024258552633e-05, "epoch": 0.4224, "percentage": 21.15, "elapsed_time": "1:36:13", "remaining_time": "5:58:40"}
{"current_steps": 166, "total_steps": 780, "loss": 0.63, "lr": 1.8157307991380496e-05, "epoch": 0.42496, "percentage": 21.28, "elapsed_time": "1:36:48", "remaining_time": "5:58:04"}
{"current_steps": 167, "total_steps": 780, "loss": 0.5996, "lr": 1.8133453794036816e-05, "epoch": 0.42752, "percentage": 21.41, "elapsed_time": "1:37:21", "remaining_time": "5:57:23"}
{"current_steps": 168, "total_steps": 780, "loss": 0.68, "lr": 1.81094620698671e-05, "epoch": 0.43008, "percentage": 21.54, "elapsed_time": "1:37:56", "remaining_time": "5:56:48"}
{"current_steps": 169, "total_steps": 780, "loss": 0.6587, "lr": 1.8085333224542263e-05, "epoch": 0.43264, "percentage": 21.67, "elapsed_time": "1:38:31", "remaining_time": "5:56:10"}
{"current_steps": 170, "total_steps": 780, "loss": 0.6543, "lr": 1.806106766605178e-05, "epoch": 0.4352, "percentage": 21.79, "elapsed_time": "1:39:06", "remaining_time": "5:55:38"}
{"current_steps": 171, "total_steps": 780, "loss": 0.7058, "lr": 1.8036665804696777e-05, "epoch": 0.43776, "percentage": 21.92, "elapsed_time": "1:39:40", "remaining_time": "5:54:59"}
{"current_steps": 172, "total_steps": 780, "loss": 0.6896, "lr": 1.8012128053083097e-05, "epoch": 0.44032, "percentage": 22.05, "elapsed_time": "1:40:15", "remaining_time": "5:54:23"}
{"current_steps": 173, "total_steps": 780, "loss": 0.6617, "lr": 1.798745482611431e-05, "epoch": 0.44288, "percentage": 22.18, "elapsed_time": "1:40:51", "remaining_time": "5:53:51"}
{"current_steps": 174, "total_steps": 780, "loss": 0.6053, "lr": 1.7962646540984733e-05, "epoch": 0.44544, "percentage": 22.31, "elapsed_time": "1:41:27", "remaining_time": "5:53:21"}
{"current_steps": 175, "total_steps": 780, "loss": 0.5854, "lr": 1.7937703617172326e-05, "epoch": 0.448, "percentage": 22.44, "elapsed_time": "1:42:05", "remaining_time": "5:52:56"}
{"current_steps": 176, "total_steps": 780, "loss": 0.7031, "lr": 1.7912626476431648e-05, "epoch": 0.45056, "percentage": 22.56, "elapsed_time": "1:42:40", "remaining_time": "5:52:22"}
{"current_steps": 177, "total_steps": 780, "loss": 0.6616, "lr": 1.7887415542786694e-05, "epoch": 0.45312, "percentage": 22.69, "elapsed_time": "1:43:14", "remaining_time": "5:51:44"}
{"current_steps": 178, "total_steps": 780, "loss": 0.6539, "lr": 1.786207124252373e-05, "epoch": 0.45568, "percentage": 22.82, "elapsed_time": "1:43:48", "remaining_time": "5:51:04"}
{"current_steps": 179, "total_steps": 780, "loss": 0.6462, "lr": 1.7836594004184097e-05, "epoch": 0.45824, "percentage": 22.95, "elapsed_time": "1:44:24", "remaining_time": "5:50:32"}
{"current_steps": 180, "total_steps": 780, "loss": 0.6678, "lr": 1.7810984258556955e-05, "epoch": 0.4608, "percentage": 23.08, "elapsed_time": "1:45:00", "remaining_time": "5:50:01"}
{"current_steps": 181, "total_steps": 780, "loss": 0.654, "lr": 1.7785242438672002e-05, "epoch": 0.46336, "percentage": 23.21, "elapsed_time": "1:45:36", "remaining_time": "5:49:30"}
{"current_steps": 182, "total_steps": 780, "loss": 0.6092, "lr": 1.7759368979792145e-05, "epoch": 0.46592, "percentage": 23.33, "elapsed_time": "1:46:10", "remaining_time": "5:48:53"}
{"current_steps": 183, "total_steps": 780, "loss": 0.6942, "lr": 1.773336431940616e-05, "epoch": 0.46848, "percentage": 23.46, "elapsed_time": "1:46:45", "remaining_time": "5:48:18"}
{"current_steps": 184, "total_steps": 780, "loss": 0.6385, "lr": 1.770722889722126e-05, "epoch": 0.47104, "percentage": 23.59, "elapsed_time": "1:47:20", "remaining_time": "5:47:40"}
{"current_steps": 185, "total_steps": 780, "loss": 0.5967, "lr": 1.7680963155155712e-05, "epoch": 0.4736, "percentage": 23.72, "elapsed_time": "1:47:54", "remaining_time": "5:47:04"}
{"current_steps": 186, "total_steps": 780, "loss": 0.5712, "lr": 1.76545675373313e-05, "epoch": 0.47616, "percentage": 23.85, "elapsed_time": "1:48:29", "remaining_time": "5:46:29"}
{"current_steps": 187, "total_steps": 780, "loss": 0.6759, "lr": 1.7628042490065877e-05, "epoch": 0.47872, "percentage": 23.97, "elapsed_time": "1:49:05", "remaining_time": "5:45:55"}
{"current_steps": 188, "total_steps": 780, "loss": 0.6193, "lr": 1.760138846186577e-05, "epoch": 0.48128, "percentage": 24.1, "elapsed_time": "1:49:40", "remaining_time": "5:45:21"}
{"current_steps": 189, "total_steps": 780, "loss": 0.5843, "lr": 1.7574605903418226e-05, "epoch": 0.48384, "percentage": 24.23, "elapsed_time": "1:50:15", "remaining_time": "5:44:47"}
{"current_steps": 190, "total_steps": 780, "loss": 0.5822, "lr": 1.7547695267583794e-05, "epoch": 0.4864, "percentage": 24.36, "elapsed_time": "1:50:50", "remaining_time": "5:44:13"}
{"current_steps": 191, "total_steps": 780, "loss": 0.6215, "lr": 1.7520657009388634e-05, "epoch": 0.48896, "percentage": 24.49, "elapsed_time": "1:51:27", "remaining_time": "5:43:43"}
{"current_steps": 192, "total_steps": 780, "loss": 0.5839, "lr": 1.749349158601686e-05, "epoch": 0.49152, "percentage": 24.62, "elapsed_time": "1:52:02", "remaining_time": "5:43:06"}
{"current_steps": 193, "total_steps": 780, "loss": 0.5904, "lr": 1.7466199456802784e-05, "epoch": 0.49408, "percentage": 24.74, "elapsed_time": "1:52:37", "remaining_time": "5:42:33"}
{"current_steps": 194, "total_steps": 780, "loss": 0.526, "lr": 1.743878108322318e-05, "epoch": 0.49664, "percentage": 24.87, "elapsed_time": "1:53:12", "remaining_time": "5:41:56"}
{"current_steps": 195, "total_steps": 780, "loss": 0.6384, "lr": 1.741123692888943e-05, "epoch": 0.4992, "percentage": 25.0, "elapsed_time": "1:53:47", "remaining_time": "5:41:21"}
{"current_steps": 196, "total_steps": 780, "loss": 0.6999, "lr": 1.738356745953975e-05, "epoch": 0.50176, "percentage": 25.13, "elapsed_time": "1:54:25", "remaining_time": "5:40:55"}
{"current_steps": 197, "total_steps": 780, "loss": 0.6412, "lr": 1.7355773143031247e-05, "epoch": 0.50432, "percentage": 25.26, "elapsed_time": "1:54:59", "remaining_time": "5:40:17"}
{"current_steps": 198, "total_steps": 780, "loss": 0.5577, "lr": 1.7327854449332067e-05, "epoch": 0.50688, "percentage": 25.38, "elapsed_time": "1:55:34", "remaining_time": "5:39:42"}
{"current_steps": 199, "total_steps": 780, "loss": 0.6713, "lr": 1.729981185051342e-05, "epoch": 0.50944, "percentage": 25.51, "elapsed_time": "1:56:10", "remaining_time": "5:39:12"}
{"current_steps": 200, "total_steps": 780, "loss": 0.6577, "lr": 1.7271645820741586e-05, "epoch": 0.512, "percentage": 25.64, "elapsed_time": "1:56:46", "remaining_time": "5:38:38"}
{"current_steps": 201, "total_steps": 780, "loss": 0.6368, "lr": 1.7243356836269928e-05, "epoch": 0.51456, "percentage": 25.77, "elapsed_time": "1:57:20", "remaining_time": "5:38:01"}
{"current_steps": 202, "total_steps": 780, "loss": 0.6209, "lr": 1.7214945375430816e-05, "epoch": 0.51712, "percentage": 25.9, "elapsed_time": "1:57:55", "remaining_time": "5:37:26"}
{"current_steps": 203, "total_steps": 780, "loss": 0.6142, "lr": 1.718641191862755e-05, "epoch": 0.51968, "percentage": 26.03, "elapsed_time": "1:58:30", "remaining_time": "5:36:50"}
{"current_steps": 204, "total_steps": 780, "loss": 0.5725, "lr": 1.715775694832623e-05, "epoch": 0.52224, "percentage": 26.15, "elapsed_time": "1:59:03", "remaining_time": "5:36:10"}
{"current_steps": 205, "total_steps": 780, "loss": 0.5957, "lr": 1.7128980949047607e-05, "epoch": 0.5248, "percentage": 26.28, "elapsed_time": "1:59:39", "remaining_time": "5:35:37"}
{"current_steps": 206, "total_steps": 780, "loss": 0.673, "lr": 1.7100084407358882e-05, "epoch": 0.52736, "percentage": 26.41, "elapsed_time": "2:00:13", "remaining_time": "5:35:00"}
{"current_steps": 207, "total_steps": 780, "loss": 0.5983, "lr": 1.7071067811865477e-05, "epoch": 0.52992, "percentage": 26.54, "elapsed_time": "2:00:47", "remaining_time": "5:34:22"}
{"current_steps": 208, "total_steps": 780, "loss": 0.6069, "lr": 1.7041931653202788e-05, "epoch": 0.53248, "percentage": 26.67, "elapsed_time": "2:01:21", "remaining_time": "5:33:43"}
{"current_steps": 209, "total_steps": 780, "loss": 0.6489, "lr": 1.7012676424027873e-05, "epoch": 0.53504, "percentage": 26.79, "elapsed_time": "2:01:54", "remaining_time": "5:33:03"}
{"current_steps": 210, "total_steps": 780, "loss": 0.5801, "lr": 1.6983302619011125e-05, "epoch": 0.5376, "percentage": 26.92, "elapsed_time": "2:02:28", "remaining_time": "5:32:24"}
{"current_steps": 211, "total_steps": 780, "loss": 0.5935, "lr": 1.6953810734827917e-05, "epoch": 0.54016, "percentage": 27.05, "elapsed_time": "2:03:02", "remaining_time": "5:31:48"}
{"current_steps": 212, "total_steps": 780, "loss": 0.5463, "lr": 1.6924201270150194e-05, "epoch": 0.54272, "percentage": 27.18, "elapsed_time": "2:03:35", "remaining_time": "5:31:08"}
{"current_steps": 213, "total_steps": 780, "loss": 0.6044, "lr": 1.6894474725638043e-05, "epoch": 0.54528, "percentage": 27.31, "elapsed_time": "2:04:10", "remaining_time": "5:30:32"}
{"current_steps": 214, "total_steps": 780, "loss": 0.67, "lr": 1.686463160393123e-05, "epoch": 0.54784, "percentage": 27.44, "elapsed_time": "2:04:46", "remaining_time": "5:30:01"}
{"current_steps": 215, "total_steps": 780, "loss": 0.6429, "lr": 1.6834672409640705e-05, "epoch": 0.5504, "percentage": 27.56, "elapsed_time": "2:05:21", "remaining_time": "5:29:26"}
{"current_steps": 216, "total_steps": 780, "loss": 0.6335, "lr": 1.680459764934006e-05, "epoch": 0.55296, "percentage": 27.69, "elapsed_time": "2:05:57", "remaining_time": "5:28:53"}
{"current_steps": 217, "total_steps": 780, "loss": 0.6468, "lr": 1.677440783155696e-05, "epoch": 0.55552, "percentage": 27.82, "elapsed_time": "2:06:31", "remaining_time": "5:28:16"}
{"current_steps": 218, "total_steps": 780, "loss": 0.576, "lr": 1.6744103466764566e-05, "epoch": 0.55808, "percentage": 27.95, "elapsed_time": "2:07:05", "remaining_time": "5:27:37"}
{"current_steps": 219, "total_steps": 780, "loss": 0.6891, "lr": 1.671368506737288e-05, "epoch": 0.56064, "percentage": 28.08, "elapsed_time": "2:07:41", "remaining_time": "5:27:05"}
{"current_steps": 220, "total_steps": 780, "loss": 0.5747, "lr": 1.6683153147720098e-05, "epoch": 0.5632, "percentage": 28.21, "elapsed_time": "2:08:16", "remaining_time": "5:26:29"}
{"current_steps": 221, "total_steps": 780, "loss": 0.5986, "lr": 1.66525082240639e-05, "epoch": 0.56576, "percentage": 28.33, "elapsed_time": "2:08:51", "remaining_time": "5:25:55"}
{"current_steps": 222, "total_steps": 780, "loss": 0.5943, "lr": 1.6621750814572728e-05, "epoch": 0.56832, "percentage": 28.46, "elapsed_time": "2:09:25", "remaining_time": "5:25:19"}
{"current_steps": 223, "total_steps": 780, "loss": 0.6973, "lr": 1.6590881439317025e-05, "epoch": 0.57088, "percentage": 28.59, "elapsed_time": "2:10:00", "remaining_time": "5:24:43"}
{"current_steps": 224, "total_steps": 780, "loss": 0.6694, "lr": 1.6559900620260435e-05, "epoch": 0.57344, "percentage": 28.72, "elapsed_time": "2:10:35", "remaining_time": "5:24:07"}
{"current_steps": 225, "total_steps": 780, "loss": 0.6559, "lr": 1.6528808881250986e-05, "epoch": 0.576, "percentage": 28.85, "elapsed_time": "2:11:10", "remaining_time": "5:23:33"}
{"current_steps": 226, "total_steps": 780, "loss": 0.5997, "lr": 1.6497606748012227e-05, "epoch": 0.57856, "percentage": 28.97, "elapsed_time": "2:11:44", "remaining_time": "5:22:57"}
{"current_steps": 227, "total_steps": 780, "loss": 0.6631, "lr": 1.646629474813433e-05, "epoch": 0.58112, "percentage": 29.1, "elapsed_time": "2:12:19", "remaining_time": "5:22:22"}
{"current_steps": 228, "total_steps": 780, "loss": 0.6076, "lr": 1.64348734110652e-05, "epoch": 0.58368, "percentage": 29.23, "elapsed_time": "2:12:55", "remaining_time": "5:21:48"}
{"current_steps": 229, "total_steps": 780, "loss": 0.6892, "lr": 1.6403343268101476e-05, "epoch": 0.58624, "percentage": 29.36, "elapsed_time": "2:13:30", "remaining_time": "5:21:13"}
{"current_steps": 230, "total_steps": 780, "loss": 0.6187, "lr": 1.6371704852379587e-05, "epoch": 0.5888, "percentage": 29.49, "elapsed_time": "2:14:05", "remaining_time": "5:20:38"}
{"current_steps": 231, "total_steps": 780, "loss": 0.5672, "lr": 1.6339958698866716e-05, "epoch": 0.59136, "percentage": 29.62, "elapsed_time": "2:14:40", "remaining_time": "5:20:04"}
{"current_steps": 232, "total_steps": 780, "loss": 0.606, "lr": 1.6308105344351776e-05, "epoch": 0.59392, "percentage": 29.74, "elapsed_time": "2:15:14", "remaining_time": "5:19:27"}
{"current_steps": 233, "total_steps": 780, "loss": 0.5996, "lr": 1.6276145327436298e-05, "epoch": 0.59648, "percentage": 29.87, "elapsed_time": "2:15:48", "remaining_time": "5:18:50"}
{"current_steps": 234, "total_steps": 780, "loss": 0.5606, "lr": 1.6244079188525358e-05, "epoch": 0.59904, "percentage": 30.0, "elapsed_time": "2:16:25", "remaining_time": "5:18:18"}
{"current_steps": 235, "total_steps": 780, "loss": 0.5877, "lr": 1.621190746981842e-05, "epoch": 0.6016, "percentage": 30.13, "elapsed_time": "2:17:00", "remaining_time": "5:17:44"}
{"current_steps": 236, "total_steps": 780, "loss": 0.5617, "lr": 1.617963071530018e-05, "epoch": 0.60416, "percentage": 30.26, "elapsed_time": "2:17:36", "remaining_time": "5:17:11"}
{"current_steps": 237, "total_steps": 780, "loss": 0.5666, "lr": 1.6147249470731355e-05, "epoch": 0.60672, "percentage": 30.38, "elapsed_time": "2:18:11", "remaining_time": "5:16:36"}
{"current_steps": 238, "total_steps": 780, "loss": 0.5915, "lr": 1.6114764283639467e-05, "epoch": 0.60928, "percentage": 30.51, "elapsed_time": "2:18:47", "remaining_time": "5:16:05"}
{"current_steps": 239, "total_steps": 780, "loss": 0.6164, "lr": 1.608217570330958e-05, "epoch": 0.61184, "percentage": 30.64, "elapsed_time": "2:19:23", "remaining_time": "5:15:30"}
{"current_steps": 240, "total_steps": 780, "loss": 0.5671, "lr": 1.6049484280775012e-05, "epoch": 0.6144, "percentage": 30.77, "elapsed_time": "2:19:56", "remaining_time": "5:14:53"}
{"current_steps": 241, "total_steps": 780, "loss": 0.5998, "lr": 1.601669056880801e-05, "epoch": 0.61696, "percentage": 30.9, "elapsed_time": "2:20:32", "remaining_time": "5:14:19"}
{"current_steps": 242, "total_steps": 780, "loss": 0.5544, "lr": 1.598379512191042e-05, "epoch": 0.61952, "percentage": 31.03, "elapsed_time": "2:21:07", "remaining_time": "5:13:43"}
{"current_steps": 243, "total_steps": 780, "loss": 0.6324, "lr": 1.5950798496304303e-05, "epoch": 0.62208, "percentage": 31.15, "elapsed_time": "2:21:42", "remaining_time": "5:13:10"}
{"current_steps": 244, "total_steps": 780, "loss": 0.6248, "lr": 1.591770124992252e-05, "epoch": 0.62464, "percentage": 31.28, "elapsed_time": "2:22:16", "remaining_time": "5:12:32"}
{"current_steps": 245, "total_steps": 780, "loss": 0.537, "lr": 1.5884503942399314e-05, "epoch": 0.6272, "percentage": 31.41, "elapsed_time": "2:22:50", "remaining_time": "5:11:56"}
{"current_steps": 246, "total_steps": 780, "loss": 0.6311, "lr": 1.585120713506084e-05, "epoch": 0.62976, "percentage": 31.54, "elapsed_time": "2:23:26", "remaining_time": "5:11:22"}
{"current_steps": 247, "total_steps": 780, "loss": 0.6263, "lr": 1.5817811390915676e-05, "epoch": 0.63232, "percentage": 31.67, "elapsed_time": "2:24:00", "remaining_time": "5:10:46"}
{"current_steps": 248, "total_steps": 780, "loss": 0.5819, "lr": 1.5784317274645294e-05, "epoch": 0.63488, "percentage": 31.79, "elapsed_time": "2:24:37", "remaining_time": "5:10:13"}
{"current_steps": 249, "total_steps": 780, "loss": 0.5841, "lr": 1.575072535259452e-05, "epoch": 0.63744, "percentage": 31.92, "elapsed_time": "2:25:13", "remaining_time": "5:09:41"}
{"current_steps": 250, "total_steps": 780, "loss": 0.5926, "lr": 1.571703619276197e-05, "epoch": 0.64, "percentage": 32.05, "elapsed_time": "2:25:47", "remaining_time": "5:09:05"}
{"current_steps": 251, "total_steps": 780, "loss": 0.6193, "lr": 1.5683250364790415e-05, "epoch": 0.64256, "percentage": 32.18, "elapsed_time": "2:26:22", "remaining_time": "5:08:29"}
{"current_steps": 252, "total_steps": 780, "loss": 0.6108, "lr": 1.5649368439957182e-05, "epoch": 0.64512, "percentage": 32.31, "elapsed_time": "2:26:57", "remaining_time": "5:07:55"}
{"current_steps": 253, "total_steps": 780, "loss": 0.5812, "lr": 1.5615390991164465e-05, "epoch": 0.64768, "percentage": 32.44, "elapsed_time": "2:27:33", "remaining_time": "5:07:21"}
{"current_steps": 254, "total_steps": 780, "loss": 0.5771, "lr": 1.5581318592929665e-05, "epoch": 0.65024, "percentage": 32.56, "elapsed_time": "2:28:09", "remaining_time": "5:06:49"}
{"current_steps": 255, "total_steps": 780, "loss": 0.5901, "lr": 1.5547151821375654e-05, "epoch": 0.6528, "percentage": 32.69, "elapsed_time": "2:28:45", "remaining_time": "5:06:15"}
{"current_steps": 256, "total_steps": 780, "loss": 0.5727, "lr": 1.5512891254221046e-05, "epoch": 0.65536, "percentage": 32.82, "elapsed_time": "2:29:20", "remaining_time": "5:05:41"}
{"current_steps": 257, "total_steps": 780, "loss": 0.5859, "lr": 1.5478537470770425e-05, "epoch": 0.65792, "percentage": 32.95, "elapsed_time": "2:29:54", "remaining_time": "5:05:04"}
{"current_steps": 258, "total_steps": 780, "loss": 0.6468, "lr": 1.5444091051904545e-05, "epoch": 0.66048, "percentage": 33.08, "elapsed_time": "2:30:29", "remaining_time": "5:04:28"}
{"current_steps": 259, "total_steps": 780, "loss": 0.5418, "lr": 1.540955258007052e-05, "epoch": 0.66304, "percentage": 33.21, "elapsed_time": "2:31:05", "remaining_time": "5:03:55"}
{"current_steps": 260, "total_steps": 780, "loss": 0.5494, "lr": 1.537492263927196e-05, "epoch": 0.6656, "percentage": 33.33, "elapsed_time": "2:31:39", "remaining_time": "5:03:19"}
{"current_steps": 261, "total_steps": 780, "loss": 0.5393, "lr": 1.5340201815059116e-05, "epoch": 0.66816, "percentage": 33.46, "elapsed_time": "2:32:13", "remaining_time": "5:02:41"}
{"current_steps": 262, "total_steps": 780, "loss": 0.5406, "lr": 1.5305390694518953e-05, "epoch": 0.67072, "percentage": 33.59, "elapsed_time": "2:32:47", "remaining_time": "5:02:05"}
{"current_steps": 263, "total_steps": 780, "loss": 0.612, "lr": 1.5270489866265236e-05, "epoch": 0.67328, "percentage": 33.72, "elapsed_time": "2:33:23", "remaining_time": "5:01:31"}
{"current_steps": 264, "total_steps": 780, "loss": 0.5988, "lr": 1.52354999204286e-05, "epoch": 0.67584, "percentage": 33.85, "elapsed_time": "2:33:59", "remaining_time": "5:00:59"}
{"current_steps": 265, "total_steps": 780, "loss": 0.5714, "lr": 1.5200421448646525e-05, "epoch": 0.6784, "percentage": 33.97, "elapsed_time": "2:34:34", "remaining_time": "5:00:24"}
{"current_steps": 266, "total_steps": 780, "loss": 0.5977, "lr": 1.5165255044053373e-05, "epoch": 0.68096, "percentage": 34.1, "elapsed_time": "2:35:09", "remaining_time": "4:59:48"}
{"current_steps": 267, "total_steps": 780, "loss": 0.5617, "lr": 1.5130001301270334e-05, "epoch": 0.68352, "percentage": 34.23, "elapsed_time": "2:35:43", "remaining_time": "4:59:12"}
{"current_steps": 268, "total_steps": 780, "loss": 0.578, "lr": 1.509466081639539e-05, "epoch": 0.68608, "percentage": 34.36, "elapsed_time": "2:36:17", "remaining_time": "4:58:34"}
{"current_steps": 269, "total_steps": 780, "loss": 0.6552, "lr": 1.5059234186993217e-05, "epoch": 0.68864, "percentage": 34.49, "elapsed_time": "2:36:52", "remaining_time": "4:57:59"}
{"current_steps": 270, "total_steps": 780, "loss": 0.6026, "lr": 1.5023722012085098e-05, "epoch": 0.6912, "percentage": 34.62, "elapsed_time": "2:37:28", "remaining_time": "4:57:26"}
{"current_steps": 271, "total_steps": 780, "loss": 0.5201, "lr": 1.4988124892138782e-05, "epoch": 0.69376, "percentage": 34.74, "elapsed_time": "2:38:03", "remaining_time": "4:56:51"}
{"current_steps": 272, "total_steps": 780, "loss": 0.5915, "lr": 1.4952443429058334e-05, "epoch": 0.69632, "percentage": 34.87, "elapsed_time": "2:38:39", "remaining_time": "4:56:18"}
{"current_steps": 273, "total_steps": 780, "loss": 0.5461, "lr": 1.4916678226173966e-05, "epoch": 0.69888, "percentage": 35.0, "elapsed_time": "2:39:15", "remaining_time": "4:55:45"}
{"current_steps": 274, "total_steps": 780, "loss": 0.6289, "lr": 1.4880829888231818e-05, "epoch": 0.70144, "percentage": 35.13, "elapsed_time": "2:39:50", "remaining_time": "4:55:11"}
{"current_steps": 275, "total_steps": 780, "loss": 0.5839, "lr": 1.4844899021383756e-05, "epoch": 0.704, "percentage": 35.26, "elapsed_time": "2:40:24", "remaining_time": "4:54:34"}
{"current_steps": 276, "total_steps": 780, "loss": 0.608, "lr": 1.4808886233177096e-05, "epoch": 0.70656, "percentage": 35.38, "elapsed_time": "2:40:59", "remaining_time": "4:53:59"}
{"current_steps": 277, "total_steps": 780, "loss": 0.5602, "lr": 1.4772792132544354e-05, "epoch": 0.70912, "percentage": 35.51, "elapsed_time": "2:41:34", "remaining_time": "4:53:23"}
{"current_steps": 278, "total_steps": 780, "loss": 0.604, "lr": 1.4736617329792942e-05, "epoch": 0.71168, "percentage": 35.64, "elapsed_time": "2:42:08", "remaining_time": "4:52:47"}
{"current_steps": 279, "total_steps": 780, "loss": 0.5981, "lr": 1.4700362436594834e-05, "epoch": 0.71424, "percentage": 35.77, "elapsed_time": "2:42:42", "remaining_time": "4:52:11"}
{"current_steps": 280, "total_steps": 780, "loss": 0.5817, "lr": 1.4664028065976245e-05, "epoch": 0.7168, "percentage": 35.9, "elapsed_time": "2:43:17", "remaining_time": "4:51:36"}
{"current_steps": 281, "total_steps": 780, "loss": 0.6396, "lr": 1.4627614832307261e-05, "epoch": 0.71936, "percentage": 36.03, "elapsed_time": "2:43:51", "remaining_time": "4:50:58"}
{"current_steps": 282, "total_steps": 780, "loss": 0.6185, "lr": 1.459112335129144e-05, "epoch": 0.72192, "percentage": 36.15, "elapsed_time": "2:44:25", "remaining_time": "4:50:22"}
{"current_steps": 283, "total_steps": 780, "loss": 0.5979, "lr": 1.4554554239955412e-05, "epoch": 0.72448, "percentage": 36.28, "elapsed_time": "2:45:00", "remaining_time": "4:49:46"}
{"current_steps": 284, "total_steps": 780, "loss": 0.5926, "lr": 1.4517908116638433e-05, "epoch": 0.72704, "percentage": 36.41, "elapsed_time": "2:45:35", "remaining_time": "4:49:12"}
{"current_steps": 285, "total_steps": 780, "loss": 0.5807, "lr": 1.4481185600981945e-05, "epoch": 0.7296, "percentage": 36.54, "elapsed_time": "2:46:10", "remaining_time": "4:48:37"}
{"current_steps": 286, "total_steps": 780, "loss": 0.603, "lr": 1.4444387313919092e-05, "epoch": 0.73216, "percentage": 36.67, "elapsed_time": "2:46:46", "remaining_time": "4:48:04"}
{"current_steps": 287, "total_steps": 780, "loss": 0.5523, "lr": 1.440751387766422e-05, "epoch": 0.73472, "percentage": 36.79, "elapsed_time": "2:47:20", "remaining_time": "4:47:26"}
{"current_steps": 288, "total_steps": 780, "loss": 0.5853, "lr": 1.437056591570235e-05, "epoch": 0.73728, "percentage": 36.92, "elapsed_time": "2:47:53", "remaining_time": "4:46:48"}
{"current_steps": 289, "total_steps": 780, "loss": 0.6131, "lr": 1.4333544052778655e-05, "epoch": 0.73984, "percentage": 37.05, "elapsed_time": "2:48:29", "remaining_time": "4:46:14"}
{"current_steps": 290, "total_steps": 780, "loss": 0.5976, "lr": 1.4296448914887866e-05, "epoch": 0.7424, "percentage": 37.18, "elapsed_time": "2:49:04", "remaining_time": "4:45:41"}
{"current_steps": 291, "total_steps": 780, "loss": 0.527, "lr": 1.4259281129263727e-05, "epoch": 0.74496, "percentage": 37.31, "elapsed_time": "2:49:39", "remaining_time": "4:45:05"}
{"current_steps": 292, "total_steps": 780, "loss": 0.6473, "lr": 1.4222041324368347e-05, "epoch": 0.74752, "percentage": 37.44, "elapsed_time": "2:50:14", "remaining_time": "4:44:30"}
{"current_steps": 293, "total_steps": 780, "loss": 0.4679, "lr": 1.4184730129881601e-05, "epoch": 0.75008, "percentage": 37.56, "elapsed_time": "2:50:49", "remaining_time": "4:43:55"}
{"current_steps": 294, "total_steps": 780, "loss": 0.596, "lr": 1.4147348176690479e-05, "epoch": 0.75264, "percentage": 37.69, "elapsed_time": "2:51:26", "remaining_time": "4:43:24"}
{"current_steps": 295, "total_steps": 780, "loss": 0.6384, "lr": 1.4109896096878408e-05, "epoch": 0.7552, "percentage": 37.82, "elapsed_time": "2:52:01", "remaining_time": "4:42:49"}
{"current_steps": 296, "total_steps": 780, "loss": 0.5608, "lr": 1.4072374523714577e-05, "epoch": 0.75776, "percentage": 37.95, "elapsed_time": "2:52:37", "remaining_time": "4:42:15"}
{"current_steps": 297, "total_steps": 780, "loss": 0.5793, "lr": 1.4034784091643218e-05, "epoch": 0.76032, "percentage": 38.08, "elapsed_time": "2:53:13", "remaining_time": "4:41:42"}
{"current_steps": 298, "total_steps": 780, "loss": 0.6529, "lr": 1.399712543627289e-05, "epoch": 0.76288, "percentage": 38.21, "elapsed_time": "2:53:48", "remaining_time": "4:41:07"}
{"current_steps": 299, "total_steps": 780, "loss": 0.6056, "lr": 1.3959399194365712e-05, "epoch": 0.76544, "percentage": 38.33, "elapsed_time": "2:54:25", "remaining_time": "4:40:35"}
{"current_steps": 300, "total_steps": 780, "loss": 0.5853, "lr": 1.392160600382663e-05, "epoch": 0.768, "percentage": 38.46, "elapsed_time": "2:55:03", "remaining_time": "4:40:05"}
{"current_steps": 301, "total_steps": 780, "loss": 0.5898, "lr": 1.3883746503692587e-05, "epoch": 0.77056, "percentage": 38.59, "elapsed_time": "2:55:38", "remaining_time": "4:39:29"}
{"current_steps": 302, "total_steps": 780, "loss": 0.5624, "lr": 1.3845821334121763e-05, "epoch": 0.77312, "percentage": 38.72, "elapsed_time": "2:56:12", "remaining_time": "4:38:54"}
{"current_steps": 303, "total_steps": 780, "loss": 0.6462, "lr": 1.3807831136382706e-05, "epoch": 0.77568, "percentage": 38.85, "elapsed_time": "2:56:47", "remaining_time": "4:38:19"}
{"current_steps": 304, "total_steps": 780, "loss": 0.6181, "lr": 1.3769776552843532e-05, "epoch": 0.77824, "percentage": 38.97, "elapsed_time": "2:57:21", "remaining_time": "4:37:41"}
{"current_steps": 305, "total_steps": 780, "loss": 0.6303, "lr": 1.3731658226961031e-05, "epoch": 0.7808, "percentage": 39.1, "elapsed_time": "2:57:55", "remaining_time": "4:37:06"}
{"current_steps": 306, "total_steps": 780, "loss": 0.5916, "lr": 1.3693476803269799e-05, "epoch": 0.78336, "percentage": 39.23, "elapsed_time": "2:58:30", "remaining_time": "4:36:30"}
{"current_steps": 307, "total_steps": 780, "loss": 0.5691, "lr": 1.3655232927371342e-05, "epoch": 0.78592, "percentage": 39.36, "elapsed_time": "2:59:05", "remaining_time": "4:35:56"}
{"current_steps": 308, "total_steps": 780, "loss": 0.5378, "lr": 1.3616927245923157e-05, "epoch": 0.78848, "percentage": 39.49, "elapsed_time": "2:59:38", "remaining_time": "4:35:18"}
{"current_steps": 309, "total_steps": 780, "loss": 0.6176, "lr": 1.3578560406627798e-05, "epoch": 0.79104, "percentage": 39.62, "elapsed_time": "3:00:14", "remaining_time": "4:34:44"}
{"current_steps": 310, "total_steps": 780, "loss": 0.6209, "lr": 1.3540133058221927e-05, "epoch": 0.7936, "percentage": 39.74, "elapsed_time": "3:00:49", "remaining_time": "4:34:08"}
{"current_steps": 311, "total_steps": 780, "loss": 0.632, "lr": 1.3501645850465327e-05, "epoch": 0.79616, "percentage": 39.87, "elapsed_time": "3:01:24", "remaining_time": "4:33:34"}
{"current_steps": 312, "total_steps": 780, "loss": 0.5552, "lr": 1.346309943412995e-05, "epoch": 0.79872, "percentage": 40.0, "elapsed_time": "3:02:00", "remaining_time": "4:33:00"}
{"current_steps": 313, "total_steps": 780, "loss": 0.6063, "lr": 1.342449446098888e-05, "epoch": 0.80128, "percentage": 40.13, "elapsed_time": "3:02:36", "remaining_time": "4:32:27"}
{"current_steps": 314, "total_steps": 780, "loss": 0.5886, "lr": 1.3385831583805329e-05, "epoch": 0.80384, "percentage": 40.26, "elapsed_time": "3:03:12", "remaining_time": "4:31:53"}
{"current_steps": 315, "total_steps": 780, "loss": 0.5937, "lr": 1.33471114563216e-05, "epoch": 0.8064, "percentage": 40.38, "elapsed_time": "3:03:46", "remaining_time": "4:31:17"}
{"current_steps": 316, "total_steps": 780, "loss": 0.6594, "lr": 1.3308334733248019e-05, "epoch": 0.80896, "percentage": 40.51, "elapsed_time": "3:04:20", "remaining_time": "4:30:41"}
{"current_steps": 317, "total_steps": 780, "loss": 0.5555, "lr": 1.3269502070251885e-05, "epoch": 0.81152, "percentage": 40.64, "elapsed_time": "3:04:56", "remaining_time": "4:30:06"}
{"current_steps": 318, "total_steps": 780, "loss": 0.6004, "lr": 1.323061412394637e-05, "epoch": 0.81408, "percentage": 40.77, "elapsed_time": "3:05:31", "remaining_time": "4:29:32"}
{"current_steps": 319, "total_steps": 780, "loss": 0.5188, "lr": 1.3191671551879418e-05, "epoch": 0.81664, "percentage": 40.9, "elapsed_time": "3:06:07", "remaining_time": "4:28:58"}
{"current_steps": 320, "total_steps": 780, "loss": 0.6318, "lr": 1.3152675012522629e-05, "epoch": 0.8192, "percentage": 41.03, "elapsed_time": "3:06:42", "remaining_time": "4:28:22"}
{"current_steps": 321, "total_steps": 780, "loss": 0.6078, "lr": 1.311362516526012e-05, "epoch": 0.82176, "percentage": 41.15, "elapsed_time": "3:07:15", "remaining_time": "4:27:45"}
{"current_steps": 322, "total_steps": 780, "loss": 0.5636, "lr": 1.3074522670377392e-05, "epoch": 0.82432, "percentage": 41.28, "elapsed_time": "3:07:50", "remaining_time": "4:27:11"}
{"current_steps": 323, "total_steps": 780, "loss": 0.6282, "lr": 1.3035368189050142e-05, "epoch": 0.82688, "percentage": 41.41, "elapsed_time": "3:08:24", "remaining_time": "4:26:34"}
{"current_steps": 324, "total_steps": 780, "loss": 0.5353, "lr": 1.2996162383333097e-05, "epoch": 0.82944, "percentage": 41.54, "elapsed_time": "3:09:00", "remaining_time": "4:26:00"}
{"current_steps": 325, "total_steps": 780, "loss": 0.5553, "lr": 1.2956905916148821e-05, "epoch": 0.832, "percentage": 41.67, "elapsed_time": "3:09:34", "remaining_time": "4:25:23"}
{"current_steps": 326, "total_steps": 780, "loss": 0.5619, "lr": 1.2917599451276498e-05, "epoch": 0.83456, "percentage": 41.79, "elapsed_time": "3:10:11", "remaining_time": "4:24:51"}
{"current_steps": 327, "total_steps": 780, "loss": 0.5301, "lr": 1.2878243653340714e-05, "epoch": 0.83712, "percentage": 41.92, "elapsed_time": "3:10:44", "remaining_time": "4:24:13"}
{"current_steps": 328, "total_steps": 780, "loss": 0.5634, "lr": 1.2838839187800218e-05, "epoch": 0.83968, "percentage": 42.05, "elapsed_time": "3:11:18", "remaining_time": "4:23:37"}
{"current_steps": 329, "total_steps": 780, "loss": 0.565, "lr": 1.2799386720936663e-05, "epoch": 0.84224, "percentage": 42.18, "elapsed_time": "3:11:51", "remaining_time": "4:22:59"}
{"current_steps": 330, "total_steps": 780, "loss": 0.5487, "lr": 1.2759886919843354e-05, "epoch": 0.8448, "percentage": 42.31, "elapsed_time": "3:12:26", "remaining_time": "4:22:25"}
{"current_steps": 331, "total_steps": 780, "loss": 0.5313, "lr": 1.2720340452413962e-05, "epoch": 0.84736, "percentage": 42.44, "elapsed_time": "3:13:01", "remaining_time": "4:21:50"}
{"current_steps": 332, "total_steps": 780, "loss": 0.5445, "lr": 1.2680747987331215e-05, "epoch": 0.84992, "percentage": 42.56, "elapsed_time": "3:13:38", "remaining_time": "4:21:17"}
{"current_steps": 333, "total_steps": 780, "loss": 0.5699, "lr": 1.264111019405562e-05, "epoch": 0.85248, "percentage": 42.69, "elapsed_time": "3:14:12", "remaining_time": "4:20:42"}
{"current_steps": 334, "total_steps": 780, "loss": 0.5473, "lr": 1.2601427742814123e-05, "epoch": 0.85504, "percentage": 42.82, "elapsed_time": "3:14:46", "remaining_time": "4:20:05"}
{"current_steps": 335, "total_steps": 780, "loss": 0.5896, "lr": 1.2561701304588782e-05, "epoch": 0.8576, "percentage": 42.95, "elapsed_time": "3:15:21", "remaining_time": "4:19:30"}
{"current_steps": 336, "total_steps": 780, "loss": 0.5678, "lr": 1.2521931551105427e-05, "epoch": 0.86016, "percentage": 43.08, "elapsed_time": "3:15:57", "remaining_time": "4:18:56"}
{"current_steps": 337, "total_steps": 780, "loss": 0.5465, "lr": 1.248211915482228e-05, "epoch": 0.86272, "percentage": 43.21, "elapsed_time": "3:16:33", "remaining_time": "4:18:22"}
{"current_steps": 338, "total_steps": 780, "loss": 0.5568, "lr": 1.244226478891862e-05, "epoch": 0.86528, "percentage": 43.33, "elapsed_time": "3:17:09", "remaining_time": "4:17:48"}
{"current_steps": 339, "total_steps": 780, "loss": 0.5632, "lr": 1.2402369127283374e-05, "epoch": 0.86784, "percentage": 43.46, "elapsed_time": "3:17:43", "remaining_time": "4:17:12"}
{"current_steps": 340, "total_steps": 780, "loss": 0.5387, "lr": 1.2362432844503725e-05, "epoch": 0.8704, "percentage": 43.59, "elapsed_time": "3:18:19", "remaining_time": "4:16:39"}
{"current_steps": 341, "total_steps": 780, "loss": 0.6314, "lr": 1.2322456615853718e-05, "epoch": 0.87296, "percentage": 43.72, "elapsed_time": "3:18:55", "remaining_time": "4:16:05"}
{"current_steps": 342, "total_steps": 780, "loss": 0.54, "lr": 1.2282441117282831e-05, "epoch": 0.87552, "percentage": 43.85, "elapsed_time": "3:19:29", "remaining_time": "4:15:28"}
{"current_steps": 343, "total_steps": 780, "loss": 0.5748, "lr": 1.224238702540454e-05, "epoch": 0.87808, "percentage": 43.97, "elapsed_time": "3:20:05", "remaining_time": "4:14:55"}
{"current_steps": 344, "total_steps": 780, "loss": 0.595, "lr": 1.2202295017484911e-05, "epoch": 0.88064, "percentage": 44.1, "elapsed_time": "3:20:40", "remaining_time": "4:14:21"}
{"current_steps": 345, "total_steps": 780, "loss": 0.4816, "lr": 1.2162165771431094e-05, "epoch": 0.8832, "percentage": 44.23, "elapsed_time": "3:21:16", "remaining_time": "4:13:46"}
{"current_steps": 346, "total_steps": 780, "loss": 0.5548, "lr": 1.212199996577991e-05, "epoch": 0.88576, "percentage": 44.36, "elapsed_time": "3:21:51", "remaining_time": "4:13:12"}
{"current_steps": 347, "total_steps": 780, "loss": 0.5399, "lr": 1.2081798279686354e-05, "epoch": 0.88832, "percentage": 44.49, "elapsed_time": "3:22:25", "remaining_time": "4:12:35"}
{"current_steps": 348, "total_steps": 780, "loss": 0.5652, "lr": 1.2041561392912118e-05, "epoch": 0.89088, "percentage": 44.62, "elapsed_time": "3:23:02", "remaining_time": "4:12:02"}
{"current_steps": 349, "total_steps": 780, "loss": 0.5431, "lr": 1.2001289985814088e-05, "epoch": 0.89344, "percentage": 44.74, "elapsed_time": "3:23:35", "remaining_time": "4:11:25"}
{"current_steps": 350, "total_steps": 780, "loss": 0.5328, "lr": 1.1960984739332851e-05, "epoch": 0.896, "percentage": 44.87, "elapsed_time": "3:24:10", "remaining_time": "4:10:50"}
{"current_steps": 351, "total_steps": 780, "loss": 0.5948, "lr": 1.1920646334981176e-05, "epoch": 0.89856, "percentage": 45.0, "elapsed_time": "3:24:45", "remaining_time": "4:10:16"}
{"current_steps": 352, "total_steps": 780, "loss": 0.5214, "lr": 1.1880275454832493e-05, "epoch": 0.90112, "percentage": 45.13, "elapsed_time": "3:25:19", "remaining_time": "4:09:39"}
{"current_steps": 353, "total_steps": 780, "loss": 0.6008, "lr": 1.1839872781509358e-05, "epoch": 0.90368, "percentage": 45.26, "elapsed_time": "3:25:54", "remaining_time": "4:09:04"}
{"current_steps": 354, "total_steps": 780, "loss": 0.5804, "lr": 1.1799438998171909e-05, "epoch": 0.90624, "percentage": 45.38, "elapsed_time": "3:26:30", "remaining_time": "4:08:30"}
{"current_steps": 355, "total_steps": 780, "loss": 0.5801, "lr": 1.175897478850632e-05, "epoch": 0.9088, "percentage": 45.51, "elapsed_time": "3:27:05", "remaining_time": "4:07:56"}
{"current_steps": 356, "total_steps": 780, "loss": 0.5786, "lr": 1.1718480836713228e-05, "epoch": 0.91136, "percentage": 45.64, "elapsed_time": "3:27:41", "remaining_time": "4:07:21"}
{"current_steps": 357, "total_steps": 780, "loss": 0.5683, "lr": 1.1677957827496191e-05, "epoch": 0.91392, "percentage": 45.77, "elapsed_time": "3:28:17", "remaining_time": "4:06:48"}
{"current_steps": 358, "total_steps": 780, "loss": 0.5628, "lr": 1.1637406446050072e-05, "epoch": 0.91648, "percentage": 45.9, "elapsed_time": "3:28:53", "remaining_time": "4:06:13"}
{"current_steps": 359, "total_steps": 780, "loss": 0.5568, "lr": 1.1596827378049491e-05, "epoch": 0.91904, "percentage": 46.03, "elapsed_time": "3:29:27", "remaining_time": "4:05:37"}
{"current_steps": 360, "total_steps": 780, "loss": 0.5911, "lr": 1.1556221309637204e-05, "epoch": 0.9216, "percentage": 46.15, "elapsed_time": "3:30:01", "remaining_time": "4:05:02"}
{"current_steps": 361, "total_steps": 780, "loss": 0.4909, "lr": 1.1515588927412509e-05, "epoch": 0.92416, "percentage": 46.28, "elapsed_time": "3:30:37", "remaining_time": "4:04:27"}
{"current_steps": 362, "total_steps": 780, "loss": 0.4918, "lr": 1.147493091841965e-05, "epoch": 0.92672, "percentage": 46.41, "elapsed_time": "3:31:12", "remaining_time": "4:03:52"}
{"current_steps": 363, "total_steps": 780, "loss": 0.5299, "lr": 1.1434247970136188e-05, "epoch": 0.92928, "percentage": 46.54, "elapsed_time": "3:31:49", "remaining_time": "4:03:19"}
{"current_steps": 364, "total_steps": 780, "loss": 0.622, "lr": 1.1393540770461358e-05, "epoch": 0.93184, "percentage": 46.67, "elapsed_time": "3:32:24", "remaining_time": "4:02:44"}
{"current_steps": 365, "total_steps": 780, "loss": 0.5672, "lr": 1.1352810007704476e-05, "epoch": 0.9344, "percentage": 46.79, "elapsed_time": "3:33:00", "remaining_time": "4:02:11"}
{"current_steps": 366, "total_steps": 780, "loss": 0.4876, "lr": 1.1312056370573277e-05, "epoch": 0.93696, "percentage": 46.92, "elapsed_time": "3:33:36", "remaining_time": "4:01:37"}
{"current_steps": 367, "total_steps": 780, "loss": 0.5229, "lr": 1.127128054816227e-05, "epoch": 0.93952, "percentage": 47.05, "elapsed_time": "3:34:11", "remaining_time": "4:01:01"}
{"current_steps": 368, "total_steps": 780, "loss": 0.4969, "lr": 1.1230483229941092e-05, "epoch": 0.94208, "percentage": 47.18, "elapsed_time": "3:34:46", "remaining_time": "4:00:26"}
{"current_steps": 369, "total_steps": 780, "loss": 0.4973, "lr": 1.1189665105742846e-05, "epoch": 0.94464, "percentage": 47.31, "elapsed_time": "3:35:20", "remaining_time": "3:59:51"}
{"current_steps": 370, "total_steps": 780, "loss": 0.55, "lr": 1.1148826865752445e-05, "epoch": 0.9472, "percentage": 47.44, "elapsed_time": "3:35:57", "remaining_time": "3:59:18"}
{"current_steps": 371, "total_steps": 780, "loss": 0.5607, "lr": 1.1107969200494928e-05, "epoch": 0.94976, "percentage": 47.56, "elapsed_time": "3:36:33", "remaining_time": "3:58:44"}
{"current_steps": 372, "total_steps": 780, "loss": 0.5147, "lr": 1.1067092800823798e-05, "epoch": 0.95232, "percentage": 47.69, "elapsed_time": "3:37:08", "remaining_time": "3:58:09"}
{"current_steps": 373, "total_steps": 780, "loss": 0.5039, "lr": 1.1026198357909327e-05, "epoch": 0.95488, "percentage": 47.82, "elapsed_time": "3:37:43", "remaining_time": "3:57:33"}
{"current_steps": 374, "total_steps": 780, "loss": 0.5053, "lr": 1.0985286563226887e-05, "epoch": 0.95744, "percentage": 47.95, "elapsed_time": "3:38:18", "remaining_time": "3:56:59"}
{"current_steps": 375, "total_steps": 780, "loss": 0.5563, "lr": 1.0944358108545236e-05, "epoch": 0.96, "percentage": 48.08, "elapsed_time": "3:38:51", "remaining_time": "3:56:22"}
{"current_steps": 376, "total_steps": 780, "loss": 0.5866, "lr": 1.0903413685914843e-05, "epoch": 0.96256, "percentage": 48.21, "elapsed_time": "3:39:28", "remaining_time": "3:55:48"}
{"current_steps": 377, "total_steps": 780, "loss": 0.573, "lr": 1.0862453987656162e-05, "epoch": 0.96512, "percentage": 48.33, "elapsed_time": "3:40:04", "remaining_time": "3:55:15"}
{"current_steps": 378, "total_steps": 780, "loss": 0.4809, "lr": 1.0821479706347953e-05, "epoch": 0.96768, "percentage": 48.46, "elapsed_time": "3:40:39", "remaining_time": "3:54:40"}
{"current_steps": 379, "total_steps": 780, "loss": 0.5471, "lr": 1.0780491534815549e-05, "epoch": 0.97024, "percentage": 48.59, "elapsed_time": "3:41:13", "remaining_time": "3:54:03"}
{"current_steps": 380, "total_steps": 780, "loss": 0.5732, "lr": 1.0739490166119155e-05, "epoch": 0.9728, "percentage": 48.72, "elapsed_time": "3:41:49", "remaining_time": "3:53:30"}
{"current_steps": 381, "total_steps": 780, "loss": 0.5603, "lr": 1.0698476293542124e-05, "epoch": 0.97536, "percentage": 48.85, "elapsed_time": "3:42:24", "remaining_time": "3:52:54"}
{"current_steps": 382, "total_steps": 780, "loss": 0.5493, "lr": 1.0657450610579225e-05, "epoch": 0.97792, "percentage": 48.97, "elapsed_time": "3:42:58", "remaining_time": "3:52:19"}
{"current_steps": 383, "total_steps": 780, "loss": 0.5611, "lr": 1.0616413810924937e-05, "epoch": 0.98048, "percentage": 49.1, "elapsed_time": "3:43:33", "remaining_time": "3:51:43"}
{"current_steps": 384, "total_steps": 780, "loss": 0.5706, "lr": 1.057536658846171e-05, "epoch": 0.98304, "percentage": 49.23, "elapsed_time": "3:44:08", "remaining_time": "3:51:08"}
{"current_steps": 385, "total_steps": 780, "loss": 0.5511, "lr": 1.053430963724822e-05, "epoch": 0.9856, "percentage": 49.36, "elapsed_time": "3:44:42", "remaining_time": "3:50:32"}
{"current_steps": 386, "total_steps": 780, "loss": 0.4967, "lr": 1.0493243651507654e-05, "epoch": 0.98816, "percentage": 49.49, "elapsed_time": "3:45:17", "remaining_time": "3:49:57"}
{"current_steps": 387, "total_steps": 780, "loss": 0.5375, "lr": 1.0452169325615956e-05, "epoch": 0.99072, "percentage": 49.62, "elapsed_time": "3:45:52", "remaining_time": "3:49:22"}
{"current_steps": 388, "total_steps": 780, "loss": 0.52, "lr": 1.04110873540901e-05, "epoch": 0.99328, "percentage": 49.74, "elapsed_time": "3:46:26", "remaining_time": "3:48:46"}
{"current_steps": 389, "total_steps": 780, "loss": 0.6018, "lr": 1.0369998431576328e-05, "epoch": 0.99584, "percentage": 49.87, "elapsed_time": "3:47:02", "remaining_time": "3:48:12"}
{"current_steps": 390, "total_steps": 780, "loss": 0.5396, "lr": 1.0328903252838415e-05, "epoch": 0.9984, "percentage": 50.0, "elapsed_time": "3:47:37", "remaining_time": "3:47:37"}
{"current_steps": 391, "total_steps": 780, "loss": 0.3953, "lr": 1.0287802512745935e-05, "epoch": 1.00096, "percentage": 50.13, "elapsed_time": "3:48:13", "remaining_time": "3:47:03"}
{"current_steps": 392, "total_steps": 780, "loss": 0.3791, "lr": 1.0246696906262484e-05, "epoch": 1.00352, "percentage": 50.26, "elapsed_time": "3:48:47", "remaining_time": "3:46:27"}
{"current_steps": 393, "total_steps": 780, "loss": 0.3558, "lr": 1.0205587128433944e-05, "epoch": 1.00608, "percentage": 50.38, "elapsed_time": "3:49:22", "remaining_time": "3:45:52"}
{"current_steps": 394, "total_steps": 780, "loss": 0.3351, "lr": 1.016447387437674e-05, "epoch": 1.00864, "percentage": 50.51, "elapsed_time": "3:49:57", "remaining_time": "3:45:17"}
{"current_steps": 395, "total_steps": 780, "loss": 0.3327, "lr": 1.0123357839266066e-05, "epoch": 1.0112, "percentage": 50.64, "elapsed_time": "3:50:31", "remaining_time": "3:44:41"}
{"current_steps": 396, "total_steps": 780, "loss": 0.2687, "lr": 1.0082239718324136e-05, "epoch": 1.01376, "percentage": 50.77, "elapsed_time": "3:51:06", "remaining_time": "3:44:05"}
{"current_steps": 397, "total_steps": 780, "loss": 0.3138, "lr": 1.004112020680845e-05, "epoch": 1.01632, "percentage": 50.9, "elapsed_time": "3:51:43", "remaining_time": "3:43:33"}
{"current_steps": 398, "total_steps": 780, "loss": 0.3256, "lr": 1e-05, "epoch": 1.01888, "percentage": 51.03, "elapsed_time": "3:52:18", "remaining_time": "3:42:57"}
{"current_steps": 399, "total_steps": 780, "loss": 0.3138, "lr": 9.958879793191553e-06, "epoch": 1.02144, "percentage": 51.15, "elapsed_time": "3:52:53", "remaining_time": "3:42:23"}
{"current_steps": 400, "total_steps": 780, "loss": 0.3153, "lr": 9.917760281675867e-06, "epoch": 1.024, "percentage": 51.28, "elapsed_time": "3:53:29", "remaining_time": "3:41:49"}
{"current_steps": 401, "total_steps": 780, "loss": 0.3152, "lr": 9.876642160733937e-06, "epoch": 1.02656, "percentage": 51.41, "elapsed_time": "3:54:03", "remaining_time": "3:41:13"}
{"current_steps": 402, "total_steps": 780, "loss": 0.2928, "lr": 9.835526125623262e-06, "epoch": 1.02912, "percentage": 51.54, "elapsed_time": "3:54:38", "remaining_time": "3:40:38"}
{"current_steps": 403, "total_steps": 780, "loss": 0.3079, "lr": 9.794412871566057e-06, "epoch": 1.03168, "percentage": 51.67, "elapsed_time": "3:55:16", "remaining_time": "3:40:05"}
{"current_steps": 404, "total_steps": 780, "loss": 0.3421, "lr": 9.753303093737518e-06, "epoch": 1.03424, "percentage": 51.79, "elapsed_time": "3:55:51", "remaining_time": "3:39:30"}
{"current_steps": 405, "total_steps": 780, "loss": 0.3364, "lr": 9.71219748725407e-06, "epoch": 1.0368, "percentage": 51.92, "elapsed_time": "3:56:26", "remaining_time": "3:38:55"}
{"current_steps": 406, "total_steps": 780, "loss": 0.3168, "lr": 9.671096747161587e-06, "epoch": 1.03936, "percentage": 52.05, "elapsed_time": "3:57:02", "remaining_time": "3:38:21"}
{"current_steps": 407, "total_steps": 780, "loss": 0.2704, "lr": 9.630001568423677e-06, "epoch": 1.04192, "percentage": 52.18, "elapsed_time": "3:57:37", "remaining_time": "3:37:46"}
{"current_steps": 408, "total_steps": 780, "loss": 0.3153, "lr": 9.588912645909905e-06, "epoch": 1.04448, "percentage": 52.31, "elapsed_time": "3:58:11", "remaining_time": "3:37:10"}
{"current_steps": 409, "total_steps": 780, "loss": 0.3018, "lr": 9.547830674384043e-06, "epoch": 1.04704, "percentage": 52.44, "elapsed_time": "3:58:46", "remaining_time": "3:36:35"}
{"current_steps": 410, "total_steps": 780, "loss": 0.3026, "lr": 9.506756348492348e-06, "epoch": 1.0496, "percentage": 52.56, "elapsed_time": "3:59:21", "remaining_time": "3:36:00"}
{"current_steps": 411, "total_steps": 780, "loss": 0.3179, "lr": 9.465690362751781e-06, "epoch": 1.05216, "percentage": 52.69, "elapsed_time": "3:59:56", "remaining_time": "3:35:25"}
{"current_steps": 412, "total_steps": 780, "loss": 0.3629, "lr": 9.424633411538289e-06, "epoch": 1.05472, "percentage": 52.82, "elapsed_time": "4:00:30", "remaining_time": "3:34:49"}
{"current_steps": 413, "total_steps": 780, "loss": 0.3126, "lr": 9.383586189075065e-06, "epoch": 1.05728, "percentage": 52.95, "elapsed_time": "4:01:06", "remaining_time": "3:34:14"}
{"current_steps": 414, "total_steps": 780, "loss": 0.2997, "lr": 9.342549389420777e-06, "epoch": 1.05984, "percentage": 53.08, "elapsed_time": "4:01:41", "remaining_time": "3:33:39"}
{"current_steps": 415, "total_steps": 780, "loss": 0.2796, "lr": 9.30152370645788e-06, "epoch": 1.0624, "percentage": 53.21, "elapsed_time": "4:02:15", "remaining_time": "3:33:04"}
{"current_steps": 416, "total_steps": 780, "loss": 0.3676, "lr": 9.260509833880848e-06, "epoch": 1.06496, "percentage": 53.33, "elapsed_time": "4:02:51", "remaining_time": "3:32:30"}
{"current_steps": 417, "total_steps": 780, "loss": 0.2902, "lr": 9.21950846518445e-06, "epoch": 1.06752, "percentage": 53.46, "elapsed_time": "4:03:27", "remaining_time": "3:31:55"}
{"current_steps": 418, "total_steps": 780, "loss": 0.2951, "lr": 9.17852029365205e-06, "epoch": 1.07008, "percentage": 53.59, "elapsed_time": "4:04:01", "remaining_time": "3:31:19"}
{"current_steps": 419, "total_steps": 780, "loss": 0.3163, "lr": 9.13754601234384e-06, "epoch": 1.07264, "percentage": 53.72, "elapsed_time": "4:04:36", "remaining_time": "3:30:44"}
{"current_steps": 420, "total_steps": 780, "loss": 0.3362, "lr": 9.096586314085162e-06, "epoch": 1.0752, "percentage": 53.85, "elapsed_time": "4:05:12", "remaining_time": "3:30:10"}
{"current_steps": 421, "total_steps": 780, "loss": 0.284, "lr": 9.055641891454766e-06, "epoch": 1.07776, "percentage": 53.97, "elapsed_time": "4:05:46", "remaining_time": "3:29:34"}
{"current_steps": 422, "total_steps": 780, "loss": 0.3209, "lr": 9.014713436773114e-06, "epoch": 1.08032, "percentage": 54.1, "elapsed_time": "4:06:20", "remaining_time": "3:28:59"}
{"current_steps": 423, "total_steps": 780, "loss": 0.3283, "lr": 8.973801642090674e-06, "epoch": 1.08288, "percentage": 54.23, "elapsed_time": "4:06:57", "remaining_time": "3:28:25"}
{"current_steps": 424, "total_steps": 780, "loss": 0.2894, "lr": 8.932907199176206e-06, "epoch": 1.08544, "percentage": 54.36, "elapsed_time": "4:07:31", "remaining_time": "3:27:49"}
{"current_steps": 425, "total_steps": 780, "loss": 0.3071, "lr": 8.892030799505072e-06, "epoch": 1.088, "percentage": 54.49, "elapsed_time": "4:08:05", "remaining_time": "3:27:14"}
{"current_steps": 426, "total_steps": 780, "loss": 0.326, "lr": 8.85117313424756e-06, "epoch": 1.09056, "percentage": 54.62, "elapsed_time": "4:08:42", "remaining_time": "3:26:40"}
{"current_steps": 427, "total_steps": 780, "loss": 0.3218, "lr": 8.810334894257156e-06, "epoch": 1.09312, "percentage": 54.74, "elapsed_time": "4:09:17", "remaining_time": "3:26:05"}
{"current_steps": 428, "total_steps": 780, "loss": 0.3014, "lr": 8.769516770058915e-06, "epoch": 1.09568, "percentage": 54.87, "elapsed_time": "4:09:51", "remaining_time": "3:25:29"}
{"current_steps": 429, "total_steps": 780, "loss": 0.2813, "lr": 8.728719451837735e-06, "epoch": 1.09824, "percentage": 55.0, "elapsed_time": "4:10:26", "remaining_time": "3:24:54"}
{"current_steps": 430, "total_steps": 780, "loss": 0.2765, "lr": 8.687943629426725e-06, "epoch": 1.1008, "percentage": 55.13, "elapsed_time": "4:11:02", "remaining_time": "3:24:19"}
{"current_steps": 431, "total_steps": 780, "loss": 0.2862, "lr": 8.647189992295526e-06, "epoch": 1.10336, "percentage": 55.26, "elapsed_time": "4:11:38", "remaining_time": "3:23:45"}
{"current_steps": 432, "total_steps": 780, "loss": 0.3143, "lr": 8.606459229538645e-06, "epoch": 1.10592, "percentage": 55.38, "elapsed_time": "4:12:15", "remaining_time": "3:23:12"}
{"current_steps": 433, "total_steps": 780, "loss": 0.3091, "lr": 8.56575202986382e-06, "epoch": 1.10848, "percentage": 55.51, "elapsed_time": "4:12:49", "remaining_time": "3:22:36"}
{"current_steps": 434, "total_steps": 780, "loss": 0.3317, "lr": 8.525069081580351e-06, "epoch": 1.11104, "percentage": 55.64, "elapsed_time": "4:13:25", "remaining_time": "3:22:02"}
{"current_steps": 435, "total_steps": 780, "loss": 0.3065, "lr": 8.484411072587491e-06, "epoch": 1.1136, "percentage": 55.77, "elapsed_time": "4:13:58", "remaining_time": "3:21:26"}
{"current_steps": 436, "total_steps": 780, "loss": 0.2741, "lr": 8.443778690362801e-06, "epoch": 1.11616, "percentage": 55.9, "elapsed_time": "4:14:32", "remaining_time": "3:20:50"}
{"current_steps": 437, "total_steps": 780, "loss": 0.3058, "lr": 8.403172621950512e-06, "epoch": 1.11872, "percentage": 56.03, "elapsed_time": "4:15:06", "remaining_time": "3:20:14"}
{"current_steps": 438, "total_steps": 780, "loss": 0.2868, "lr": 8.362593553949926e-06, "epoch": 1.12128, "percentage": 56.15, "elapsed_time": "4:15:40", "remaining_time": "3:19:37"}
{"current_steps": 439, "total_steps": 780, "loss": 0.3129, "lr": 8.322042172503812e-06, "epoch": 1.12384, "percentage": 56.28, "elapsed_time": "4:16:15", "remaining_time": "3:19:02"}
{"current_steps": 440, "total_steps": 780, "loss": 0.287, "lr": 8.281519163286772e-06, "epoch": 1.1264, "percentage": 56.41, "elapsed_time": "4:16:50", "remaining_time": "3:18:27"}
{"current_steps": 441, "total_steps": 780, "loss": 0.3375, "lr": 8.241025211493684e-06, "epoch": 1.12896, "percentage": 56.54, "elapsed_time": "4:17:25", "remaining_time": "3:17:53"}
{"current_steps": 442, "total_steps": 780, "loss": 0.2843, "lr": 8.200561001828093e-06, "epoch": 1.13152, "percentage": 56.67, "elapsed_time": "4:18:00", "remaining_time": "3:17:17"}
{"current_steps": 443, "total_steps": 780, "loss": 0.3173, "lr": 8.160127218490643e-06, "epoch": 1.13408, "percentage": 56.79, "elapsed_time": "4:18:35", "remaining_time": "3:16:43"}
{"current_steps": 444, "total_steps": 780, "loss": 0.3022, "lr": 8.11972454516751e-06, "epoch": 1.13664, "percentage": 56.92, "elapsed_time": "4:19:11", "remaining_time": "3:16:08"}
{"current_steps": 445, "total_steps": 780, "loss": 0.3453, "lr": 8.079353665018827e-06, "epoch": 1.1392, "percentage": 57.05, "elapsed_time": "4:19:46", "remaining_time": "3:15:34"}
{"current_steps": 446, "total_steps": 780, "loss": 0.33, "lr": 8.039015260667154e-06, "epoch": 1.14176, "percentage": 57.18, "elapsed_time": "4:20:21", "remaining_time": "3:14:58"}
{"current_steps": 447, "total_steps": 780, "loss": 0.311, "lr": 7.998710014185916e-06, "epoch": 1.14432, "percentage": 57.31, "elapsed_time": "4:20:57", "remaining_time": "3:14:23"}
{"current_steps": 448, "total_steps": 780, "loss": 0.3124, "lr": 7.958438607087884e-06, "epoch": 1.14688, "percentage": 57.44, "elapsed_time": "4:21:33", "remaining_time": "3:13:49"}
{"current_steps": 449, "total_steps": 780, "loss": 0.3132, "lr": 7.918201720313648e-06, "epoch": 1.14944, "percentage": 57.56, "elapsed_time": "4:22:08", "remaining_time": "3:13:14"}
{"current_steps": 450, "total_steps": 780, "loss": 0.2898, "lr": 7.878000034220092e-06, "epoch": 1.152, "percentage": 57.69, "elapsed_time": "4:22:44", "remaining_time": "3:12:40"}
{"current_steps": 451, "total_steps": 780, "loss": 0.3116, "lr": 7.837834228568911e-06, "epoch": 1.15456, "percentage": 57.82, "elapsed_time": "4:23:19", "remaining_time": "3:12:05"}
{"current_steps": 452, "total_steps": 780, "loss": 0.3451, "lr": 7.797704982515094e-06, "epoch": 1.15712, "percentage": 57.95, "elapsed_time": "4:23:55", "remaining_time": "3:11:31"}
{"current_steps": 453, "total_steps": 780, "loss": 0.2923, "lr": 7.75761297459546e-06, "epoch": 1.15968, "percentage": 58.08, "elapsed_time": "4:24:29", "remaining_time": "3:10:55"}
{"current_steps": 454, "total_steps": 780, "loss": 0.3156, "lr": 7.717558882717175e-06, "epoch": 1.16224, "percentage": 58.21, "elapsed_time": "4:25:05", "remaining_time": "3:10:20"}
{"current_steps": 455, "total_steps": 780, "loss": 0.2967, "lr": 7.677543384146287e-06, "epoch": 1.1648, "percentage": 58.33, "elapsed_time": "4:25:42", "remaining_time": "3:09:47"}
{"current_steps": 456, "total_steps": 780, "loss": 0.3298, "lr": 7.637567155496277e-06, "epoch": 1.16736, "percentage": 58.46, "elapsed_time": "4:26:20", "remaining_time": "3:09:14"}
{"current_steps": 457, "total_steps": 780, "loss": 0.3067, "lr": 7.597630872716631e-06, "epoch": 1.16992, "percentage": 58.59, "elapsed_time": "4:26:54", "remaining_time": "3:08:38"}
{"current_steps": 458, "total_steps": 780, "loss": 0.3188, "lr": 7.5577352110813825e-06, "epoch": 1.17248, "percentage": 58.72, "elapsed_time": "4:27:29", "remaining_time": "3:08:03"}
{"current_steps": 459, "total_steps": 780, "loss": 0.3103, "lr": 7.517880845177725e-06, "epoch": 1.17504, "percentage": 58.85, "elapsed_time": "4:28:04", "remaining_time": "3:07:28"}
{"current_steps": 460, "total_steps": 780, "loss": 0.2854, "lr": 7.478068448894577e-06, "epoch": 1.1776, "percentage": 58.97, "elapsed_time": "4:28:39", "remaining_time": "3:06:53"}
{"current_steps": 461, "total_steps": 780, "loss": 0.2605, "lr": 7.438298695411218e-06, "epoch": 1.1801599999999999, "percentage": 59.1, "elapsed_time": "4:29:14", "remaining_time": "3:06:18"}
{"current_steps": 462, "total_steps": 780, "loss": 0.2627, "lr": 7.398572257185879e-06, "epoch": 1.18272, "percentage": 59.23, "elapsed_time": "4:29:51", "remaining_time": "3:05:44"}
{"current_steps": 463, "total_steps": 780, "loss": 0.2577, "lr": 7.358889805944383e-06, "epoch": 1.1852800000000001, "percentage": 59.36, "elapsed_time": "4:30:27", "remaining_time": "3:05:10"}
{"current_steps": 464, "total_steps": 780, "loss": 0.3328, "lr": 7.31925201266879e-06, "epoch": 1.18784, "percentage": 59.49, "elapsed_time": "4:31:02", "remaining_time": "3:04:35"}
{"current_steps": 465, "total_steps": 780, "loss": 0.2843, "lr": 7.2796595475860425e-06, "epoch": 1.1904, "percentage": 59.62, "elapsed_time": "4:31:37", "remaining_time": "3:04:00"}
{"current_steps": 466, "total_steps": 780, "loss": 0.3132, "lr": 7.240113080156646e-06, "epoch": 1.19296, "percentage": 59.74, "elapsed_time": "4:32:13", "remaining_time": "3:03:25"}
{"current_steps": 467, "total_steps": 780, "loss": 0.284, "lr": 7.200613279063341e-06, "epoch": 1.19552, "percentage": 59.87, "elapsed_time": "4:32:48", "remaining_time": "3:02:50"}
{"current_steps": 468, "total_steps": 780, "loss": 0.3379, "lr": 7.161160812199785e-06, "epoch": 1.19808, "percentage": 60.0, "elapsed_time": "4:33:22", "remaining_time": "3:02:15"}
{"current_steps": 469, "total_steps": 780, "loss": 0.3304, "lr": 7.121756346659292e-06, "epoch": 1.20064, "percentage": 60.13, "elapsed_time": "4:33:59", "remaining_time": "3:01:41"}
{"current_steps": 470, "total_steps": 780, "loss": 0.2773, "lr": 7.082400548723505e-06, "epoch": 1.2032, "percentage": 60.26, "elapsed_time": "4:34:34", "remaining_time": "3:01:06"}
{"current_steps": 471, "total_steps": 780, "loss": 0.3101, "lr": 7.043094083851181e-06, "epoch": 1.20576, "percentage": 60.38, "elapsed_time": "4:35:10", "remaining_time": "3:00:31"}
{"current_steps": 472, "total_steps": 780, "loss": 0.3011, "lr": 7.003837616666906e-06, "epoch": 1.20832, "percentage": 60.51, "elapsed_time": "4:35:45", "remaining_time": "2:59:56"}
{"current_steps": 473, "total_steps": 780, "loss": 0.2914, "lr": 6.96463181094986e-06, "epoch": 1.21088, "percentage": 60.64, "elapsed_time": "4:36:21", "remaining_time": "2:59:22"}
{"current_steps": 474, "total_steps": 780, "loss": 0.29, "lr": 6.925477329622609e-06, "epoch": 1.21344, "percentage": 60.77, "elapsed_time": "4:36:56", "remaining_time": "2:58:47"}
{"current_steps": 475, "total_steps": 780, "loss": 0.2565, "lr": 6.886374834739883e-06, "epoch": 1.216, "percentage": 60.9, "elapsed_time": "4:37:32", "remaining_time": "2:58:12"}
{"current_steps": 476, "total_steps": 780, "loss": 0.2811, "lr": 6.847324987477375e-06, "epoch": 1.21856, "percentage": 61.03, "elapsed_time": "4:38:06", "remaining_time": "2:57:36"}
{"current_steps": 477, "total_steps": 780, "loss": 0.3277, "lr": 6.808328448120588e-06, "epoch": 1.22112, "percentage": 61.15, "elapsed_time": "4:38:40", "remaining_time": "2:57:01"}
{"current_steps": 478, "total_steps": 780, "loss": 0.2918, "lr": 6.769385876053632e-06, "epoch": 1.2236799999999999, "percentage": 61.28, "elapsed_time": "4:39:15", "remaining_time": "2:56:26"}
{"current_steps": 479, "total_steps": 780, "loss": 0.3103, "lr": 6.730497929748116e-06, "epoch": 1.22624, "percentage": 61.41, "elapsed_time": "4:39:48", "remaining_time": "2:55:50"}
{"current_steps": 480, "total_steps": 780, "loss": 0.3211, "lr": 6.6916652667519855e-06, "epoch": 1.2288000000000001, "percentage": 61.54, "elapsed_time": "4:40:23", "remaining_time": "2:55:14"}
{"current_steps": 481, "total_steps": 780, "loss": 0.3331, "lr": 6.652888543678404e-06, "epoch": 1.23136, "percentage": 61.67, "elapsed_time": "4:40:57", "remaining_time": "2:54:39"}
{"current_steps": 482, "total_steps": 780, "loss": 0.2684, "lr": 6.614168416194674e-06, "epoch": 1.23392, "percentage": 61.79, "elapsed_time": "4:41:32", "remaining_time": "2:54:03"}
{"current_steps": 483, "total_steps": 780, "loss": 0.273, "lr": 6.575505539011123e-06, "epoch": 1.23648, "percentage": 61.92, "elapsed_time": "4:42:05", "remaining_time": "2:53:27"}
{"current_steps": 484, "total_steps": 780, "loss": 0.3324, "lr": 6.536900565870052e-06, "epoch": 1.23904, "percentage": 62.05, "elapsed_time": "4:42:42", "remaining_time": "2:52:53"}
{"current_steps": 485, "total_steps": 780, "loss": 0.2891, "lr": 6.498354149534677e-06, "epoch": 1.2416, "percentage": 62.18, "elapsed_time": "4:43:16", "remaining_time": "2:52:18"}
{"current_steps": 486, "total_steps": 780, "loss": 0.2847, "lr": 6.459866941778077e-06, "epoch": 1.24416, "percentage": 62.31, "elapsed_time": "4:43:51", "remaining_time": "2:51:43"}
{"current_steps": 487, "total_steps": 780, "loss": 0.2841, "lr": 6.421439593372201e-06, "epoch": 1.24672, "percentage": 62.44, "elapsed_time": "4:44:26", "remaining_time": "2:51:08"}
{"current_steps": 488, "total_steps": 780, "loss": 0.3086, "lr": 6.3830727540768445e-06, "epoch": 1.24928, "percentage": 62.56, "elapsed_time": "4:45:01", "remaining_time": "2:50:33"}
{"current_steps": 489, "total_steps": 780, "loss": 0.3166, "lr": 6.344767072628659e-06, "epoch": 1.25184, "percentage": 62.69, "elapsed_time": "4:45:38", "remaining_time": "2:49:58"}
{"current_steps": 490, "total_steps": 780, "loss": 0.279, "lr": 6.3065231967302055e-06, "epoch": 1.2544, "percentage": 62.82, "elapsed_time": "4:46:14", "remaining_time": "2:49:24"}
{"current_steps": 491, "total_steps": 780, "loss": 0.2752, "lr": 6.268341773038973e-06, "epoch": 1.25696, "percentage": 62.95, "elapsed_time": "4:46:47", "remaining_time": "2:48:48"}
{"current_steps": 492, "total_steps": 780, "loss": 0.2958, "lr": 6.230223447156469e-06, "epoch": 1.25952, "percentage": 63.08, "elapsed_time": "4:47:24", "remaining_time": "2:48:14"}
{"current_steps": 493, "total_steps": 780, "loss": 0.274, "lr": 6.1921688636172964e-06, "epoch": 1.26208, "percentage": 63.21, "elapsed_time": "4:47:58", "remaining_time": "2:47:38"}
{"current_steps": 494, "total_steps": 780, "loss": 0.2761, "lr": 6.154178665878241e-06, "epoch": 1.26464, "percentage": 63.33, "elapsed_time": "4:48:34", "remaining_time": "2:47:04"}
{"current_steps": 495, "total_steps": 780, "loss": 0.2883, "lr": 6.116253496307415e-06, "epoch": 1.2671999999999999, "percentage": 63.46, "elapsed_time": "4:49:09", "remaining_time": "2:46:29"}
{"current_steps": 496, "total_steps": 780, "loss": 0.2789, "lr": 6.078393996173375e-06, "epoch": 1.26976, "percentage": 63.59, "elapsed_time": "4:49:44", "remaining_time": "2:45:54"}
{"current_steps": 497, "total_steps": 780, "loss": 0.3174, "lr": 6.040600805634287e-06, "epoch": 1.2723200000000001, "percentage": 63.72, "elapsed_time": "4:50:20", "remaining_time": "2:45:19"}
{"current_steps": 498, "total_steps": 780, "loss": 0.2831, "lr": 6.002874563727116e-06, "epoch": 1.27488, "percentage": 63.85, "elapsed_time": "4:50:55", "remaining_time": "2:44:44"}
{"current_steps": 499, "total_steps": 780, "loss": 0.3047, "lr": 5.965215908356783e-06, "epoch": 1.27744, "percentage": 63.97, "elapsed_time": "4:51:30", "remaining_time": "2:44:09"}
{"current_steps": 500, "total_steps": 780, "loss": 0.2981, "lr": 5.927625476285426e-06, "epoch": 1.28, "percentage": 64.1, "elapsed_time": "4:52:05", "remaining_time": "2:43:34"}
{"current_steps": 501, "total_steps": 780, "loss": 0.3129, "lr": 5.890103903121593e-06, "epoch": 1.28256, "percentage": 64.23, "elapsed_time": "4:53:26", "remaining_time": "2:43:24"}
{"current_steps": 502, "total_steps": 780, "loss": 0.2928, "lr": 5.852651823309521e-06, "epoch": 1.28512, "percentage": 64.36, "elapsed_time": "4:54:03", "remaining_time": "2:42:50"}
{"current_steps": 503, "total_steps": 780, "loss": 0.2899, "lr": 5.815269870118403e-06, "epoch": 1.28768, "percentage": 64.49, "elapsed_time": "4:54:39", "remaining_time": "2:42:15"}
{"current_steps": 504, "total_steps": 780, "loss": 0.3004, "lr": 5.777958675631657e-06, "epoch": 1.29024, "percentage": 64.62, "elapsed_time": "4:55:14", "remaining_time": "2:41:41"}
{"current_steps": 505, "total_steps": 780, "loss": 0.2953, "lr": 5.740718870736272e-06, "epoch": 1.2928, "percentage": 64.74, "elapsed_time": "4:55:51", "remaining_time": "2:41:06"}
{"current_steps": 506, "total_steps": 780, "loss": 0.3021, "lr": 5.703551085112133e-06, "epoch": 1.29536, "percentage": 64.87, "elapsed_time": "4:56:24", "remaining_time": "2:40:30"}
{"current_steps": 507, "total_steps": 780, "loss": 0.2781, "lr": 5.6664559472213495e-06, "epoch": 1.29792, "percentage": 65.0, "elapsed_time": "4:56:57", "remaining_time": "2:39:54"}
{"current_steps": 508, "total_steps": 780, "loss": 0.3122, "lr": 5.629434084297654e-06, "epoch": 1.30048, "percentage": 65.13, "elapsed_time": "4:57:32", "remaining_time": "2:39:18"}
{"current_steps": 509, "total_steps": 780, "loss": 0.3498, "lr": 5.592486122335784e-06, "epoch": 1.30304, "percentage": 65.26, "elapsed_time": "4:58:08", "remaining_time": "2:38:43"}
{"current_steps": 510, "total_steps": 780, "loss": 0.3079, "lr": 5.555612686080909e-06, "epoch": 1.3056, "percentage": 65.38, "elapsed_time": "4:58:43", "remaining_time": "2:38:08"}
{"current_steps": 511, "total_steps": 780, "loss": 0.2685, "lr": 5.518814399018058e-06, "epoch": 1.30816, "percentage": 65.51, "elapsed_time": "4:59:17", "remaining_time": "2:37:33"}
{"current_steps": 512, "total_steps": 780, "loss": 0.2897, "lr": 5.482091883361571e-06, "epoch": 1.3107199999999999, "percentage": 65.64, "elapsed_time": "4:59:53", "remaining_time": "2:36:58"}
{"current_steps": 513, "total_steps": 780, "loss": 0.2751, "lr": 5.445445760044594e-06, "epoch": 1.31328, "percentage": 65.77, "elapsed_time": "5:00:28", "remaining_time": "2:36:23"}
{"current_steps": 514, "total_steps": 780, "loss": 0.2808, "lr": 5.408876648708561e-06, "epoch": 1.3158400000000001, "percentage": 65.9, "elapsed_time": "5:01:02", "remaining_time": "2:35:47"}
{"current_steps": 515, "total_steps": 780, "loss": 0.2751, "lr": 5.372385167692739e-06, "epoch": 1.3184, "percentage": 66.03, "elapsed_time": "5:01:37", "remaining_time": "2:35:12"}
{"current_steps": 516, "total_steps": 780, "loss": 0.2917, "lr": 5.335971934023757e-06, "epoch": 1.32096, "percentage": 66.15, "elapsed_time": "5:02:12", "remaining_time": "2:34:37"}
{"current_steps": 517, "total_steps": 780, "loss": 0.2997, "lr": 5.299637563405169e-06, "epoch": 1.32352, "percentage": 66.28, "elapsed_time": "5:02:48", "remaining_time": "2:34:02"}
{"current_steps": 518, "total_steps": 780, "loss": 0.2627, "lr": 5.263382670207063e-06, "epoch": 1.32608, "percentage": 66.41, "elapsed_time": "5:03:23", "remaining_time": "2:33:26"}
{"current_steps": 519, "total_steps": 780, "loss": 0.2679, "lr": 5.227207867455648e-06, "epoch": 1.32864, "percentage": 66.54, "elapsed_time": "5:03:58", "remaining_time": "2:32:52"}
{"current_steps": 520, "total_steps": 780, "loss": 0.2732, "lr": 5.191113766822905e-06, "epoch": 1.3312, "percentage": 66.67, "elapsed_time": "5:04:35", "remaining_time": "2:32:17"}
{"current_steps": 521, "total_steps": 780, "loss": 0.3065, "lr": 5.155100978616248e-06, "epoch": 1.33376, "percentage": 66.79, "elapsed_time": "5:05:08", "remaining_time": "2:31:41"}
{"current_steps": 522, "total_steps": 780, "loss": 0.3092, "lr": 5.1191701117681815e-06, "epoch": 1.33632, "percentage": 66.92, "elapsed_time": "5:05:44", "remaining_time": "2:31:06"}
{"current_steps": 523, "total_steps": 780, "loss": 0.2825, "lr": 5.083321773826038e-06, "epoch": 1.33888, "percentage": 67.05, "elapsed_time": "5:06:18", "remaining_time": "2:30:31"}
{"current_steps": 524, "total_steps": 780, "loss": 0.2928, "lr": 5.04755657094167e-06, "epoch": 1.34144, "percentage": 67.18, "elapsed_time": "5:06:53", "remaining_time": "2:29:55"}
{"current_steps": 525, "total_steps": 780, "loss": 0.2725, "lr": 5.011875107861221e-06, "epoch": 1.3439999999999999, "percentage": 67.31, "elapsed_time": "5:07:28", "remaining_time": "2:29:20"}
{"current_steps": 526, "total_steps": 780, "loss": 0.3287, "lr": 4.976277987914905e-06, "epoch": 1.34656, "percentage": 67.44, "elapsed_time": "5:08:05", "remaining_time": "2:28:46"}
{"current_steps": 527, "total_steps": 780, "loss": 0.2839, "lr": 4.940765813006784e-06, "epoch": 1.34912, "percentage": 67.56, "elapsed_time": "5:08:40", "remaining_time": "2:28:11"}
{"current_steps": 528, "total_steps": 780, "loss": 0.3033, "lr": 4.905339183604614e-06, "epoch": 1.35168, "percentage": 67.69, "elapsed_time": "5:09:16", "remaining_time": "2:27:36"}
{"current_steps": 529, "total_steps": 780, "loss": 0.301, "lr": 4.86999869872967e-06, "epoch": 1.3542399999999999, "percentage": 67.82, "elapsed_time": "5:09:48", "remaining_time": "2:26:59"}
{"current_steps": 530, "total_steps": 780, "loss": 0.2911, "lr": 4.834744955946631e-06, "epoch": 1.3568, "percentage": 67.95, "elapsed_time": "5:10:23", "remaining_time": "2:26:24"}
{"current_steps": 531, "total_steps": 780, "loss": 0.3027, "lr": 4.79957855135348e-06, "epoch": 1.3593600000000001, "percentage": 68.08, "elapsed_time": "5:10:57", "remaining_time": "2:25:49"}
{"current_steps": 532, "total_steps": 780, "loss": 0.3231, "lr": 4.764500079571403e-06, "epoch": 1.36192, "percentage": 68.21, "elapsed_time": "5:11:33", "remaining_time": "2:25:14"}
{"current_steps": 533, "total_steps": 780, "loss": 0.2855, "lr": 4.729510133734766e-06, "epoch": 1.36448, "percentage": 68.33, "elapsed_time": "5:12:08", "remaining_time": "2:24:38"}
{"current_steps": 534, "total_steps": 780, "loss": 0.2804, "lr": 4.694609305481055e-06, "epoch": 1.36704, "percentage": 68.46, "elapsed_time": "5:12:43", "remaining_time": "2:24:03"}
{"current_steps": 535, "total_steps": 780, "loss": 0.3093, "lr": 4.659798184940887e-06, "epoch": 1.3696, "percentage": 68.59, "elapsed_time": "5:13:18", "remaining_time": "2:23:28"}
{"current_steps": 536, "total_steps": 780, "loss": 0.2445, "lr": 4.6250773607280375e-06, "epoch": 1.37216, "percentage": 68.72, "elapsed_time": "5:13:53", "remaining_time": "2:22:53"}
{"current_steps": 537, "total_steps": 780, "loss": 0.28, "lr": 4.590447419929481e-06, "epoch": 1.37472, "percentage": 68.85, "elapsed_time": "5:14:27", "remaining_time": "2:22:17"}
{"current_steps": 538, "total_steps": 780, "loss": 0.2487, "lr": 4.555908948095455e-06, "epoch": 1.37728, "percentage": 68.97, "elapsed_time": "5:15:02", "remaining_time": "2:21:42"}
{"current_steps": 539, "total_steps": 780, "loss": 0.2874, "lr": 4.521462529229579e-06, "epoch": 1.37984, "percentage": 69.1, "elapsed_time": "5:15:36", "remaining_time": "2:21:07"}
{"current_steps": 540, "total_steps": 780, "loss": 0.2994, "lr": 4.487108745778958e-06, "epoch": 1.3824, "percentage": 69.23, "elapsed_time": "5:16:12", "remaining_time": "2:20:32"}
{"current_steps": 541, "total_steps": 780, "loss": 0.3276, "lr": 4.452848178624348e-06, "epoch": 1.38496, "percentage": 69.36, "elapsed_time": "5:16:49", "remaining_time": "2:19:57"}
{"current_steps": 542, "total_steps": 780, "loss": 0.2484, "lr": 4.418681407070339e-06, "epoch": 1.3875199999999999, "percentage": 69.49, "elapsed_time": "5:17:24", "remaining_time": "2:19:22"}
{"current_steps": 543, "total_steps": 780, "loss": 0.284, "lr": 4.384609008835535e-06, "epoch": 1.39008, "percentage": 69.62, "elapsed_time": "5:17:59", "remaining_time": "2:18:47"}
{"current_steps": 544, "total_steps": 780, "loss": 0.3073, "lr": 4.350631560042821e-06, "epoch": 1.39264, "percentage": 69.74, "elapsed_time": "5:18:32", "remaining_time": "2:18:11"}
{"current_steps": 545, "total_steps": 780, "loss": 0.3176, "lr": 4.3167496352095876e-06, "epoch": 1.3952, "percentage": 69.87, "elapsed_time": "5:19:07", "remaining_time": "2:17:36"}
{"current_steps": 546, "total_steps": 780, "loss": 0.2941, "lr": 4.282963807238032e-06, "epoch": 1.39776, "percentage": 70.0, "elapsed_time": "5:19:42", "remaining_time": "2:17:01"}
{"current_steps": 547, "total_steps": 780, "loss": 0.3092, "lr": 4.2492746474054825e-06, "epoch": 1.40032, "percentage": 70.13, "elapsed_time": "5:20:15", "remaining_time": "2:16:25"}
{"current_steps": 548, "total_steps": 780, "loss": 0.2854, "lr": 4.2156827253547095e-06, "epoch": 1.4028800000000001, "percentage": 70.26, "elapsed_time": "5:20:50", "remaining_time": "2:15:49"}
{"current_steps": 549, "total_steps": 780, "loss": 0.327, "lr": 4.182188609084328e-06, "epoch": 1.40544, "percentage": 70.38, "elapsed_time": "5:21:28", "remaining_time": "2:15:15"}
{"current_steps": 550, "total_steps": 780, "loss": 0.2519, "lr": 4.148792864939164e-06, "epoch": 1.408, "percentage": 70.51, "elapsed_time": "5:22:03", "remaining_time": "2:14:40"}
{"current_steps": 551, "total_steps": 780, "loss": 0.2978, "lr": 4.115496057600689e-06, "epoch": 1.41056, "percentage": 70.64, "elapsed_time": "5:22:39", "remaining_time": "2:14:05"}
{"current_steps": 552, "total_steps": 780, "loss": 0.3189, "lr": 4.082298750077485e-06, "epoch": 1.41312, "percentage": 70.77, "elapsed_time": "5:23:15", "remaining_time": "2:13:30"}
{"current_steps": 553, "total_steps": 780, "loss": 0.2839, "lr": 4.0492015036957e-06, "epoch": 1.41568, "percentage": 70.9, "elapsed_time": "5:23:50", "remaining_time": "2:12:55"}
{"current_steps": 554, "total_steps": 780, "loss": 0.265, "lr": 4.016204878089579e-06, "epoch": 1.41824, "percentage": 71.03, "elapsed_time": "5:24:25", "remaining_time": "2:12:20"}
{"current_steps": 555, "total_steps": 780, "loss": 0.2566, "lr": 3.983309431191995e-06, "epoch": 1.4208, "percentage": 71.15, "elapsed_time": "5:25:00", "remaining_time": "2:11:45"}
{"current_steps": 556, "total_steps": 780, "loss": 0.3097, "lr": 3.950515719224991e-06, "epoch": 1.42336, "percentage": 71.28, "elapsed_time": "5:25:36", "remaining_time": "2:11:10"}
{"current_steps": 557, "total_steps": 780, "loss": 0.2629, "lr": 3.9178242966904225e-06, "epoch": 1.42592, "percentage": 71.41, "elapsed_time": "5:26:13", "remaining_time": "2:10:36"}
{"current_steps": 558, "total_steps": 780, "loss": 0.3089, "lr": 3.885235716360534e-06, "epoch": 1.42848, "percentage": 71.54, "elapsed_time": "5:26:49", "remaining_time": "2:10:01"}
{"current_steps": 559, "total_steps": 780, "loss": 0.2841, "lr": 3.852750529268645e-06, "epoch": 1.4310399999999999, "percentage": 71.67, "elapsed_time": "5:27:23", "remaining_time": "2:09:26"}
{"current_steps": 560, "total_steps": 780, "loss": 0.3019, "lr": 3.820369284699823e-06, "epoch": 1.4336, "percentage": 71.79, "elapsed_time": "5:27:58", "remaining_time": "2:08:50"}
{"current_steps": 561, "total_steps": 780, "loss": 0.2747, "lr": 3.788092530181583e-06, "epoch": 1.43616, "percentage": 71.92, "elapsed_time": "5:28:34", "remaining_time": "2:08:16"}
{"current_steps": 562, "total_steps": 780, "loss": 0.2652, "lr": 3.755920811474647e-06, "epoch": 1.43872, "percentage": 72.05, "elapsed_time": "5:29:09", "remaining_time": "2:07:40"}
{"current_steps": 563, "total_steps": 780, "loss": 0.2763, "lr": 3.7238546725637046e-06, "epoch": 1.44128, "percentage": 72.18, "elapsed_time": "5:29:44", "remaining_time": "2:07:05"}
{"current_steps": 564, "total_steps": 780, "loss": 0.2877, "lr": 3.691894655648225e-06, "epoch": 1.44384, "percentage": 72.31, "elapsed_time": "5:30:22", "remaining_time": "2:06:31"}
{"current_steps": 565, "total_steps": 780, "loss": 0.2975, "lr": 3.6600413011332835e-06, "epoch": 1.4464000000000001, "percentage": 72.44, "elapsed_time": "5:30:57", "remaining_time": "2:05:56"}
{"current_steps": 566, "total_steps": 780, "loss": 0.3059, "lr": 3.6282951476204177e-06, "epoch": 1.44896, "percentage": 72.56, "elapsed_time": "5:31:34", "remaining_time": "2:05:21"}
{"current_steps": 567, "total_steps": 780, "loss": 0.3158, "lr": 3.5966567318985267e-06, "epoch": 1.45152, "percentage": 72.69, "elapsed_time": "5:32:09", "remaining_time": "2:04:46"}
{"current_steps": 568, "total_steps": 780, "loss": 0.2836, "lr": 3.565126588934803e-06, "epoch": 1.45408, "percentage": 72.82, "elapsed_time": "5:32:46", "remaining_time": "2:04:12"}
{"current_steps": 569, "total_steps": 780, "loss": 0.2957, "lr": 3.533705251865668e-06, "epoch": 1.45664, "percentage": 72.95, "elapsed_time": "5:33:21", "remaining_time": "2:03:37"}
{"current_steps": 570, "total_steps": 780, "loss": 0.3121, "lr": 3.502393251987776e-06, "epoch": 1.4592, "percentage": 73.08, "elapsed_time": "5:33:55", "remaining_time": "2:03:01"}
{"current_steps": 571, "total_steps": 780, "loss": 0.2687, "lr": 3.4711911187490165e-06, "epoch": 1.46176, "percentage": 73.21, "elapsed_time": "5:34:30", "remaining_time": "2:02:26"}
{"current_steps": 572, "total_steps": 780, "loss": 0.3278, "lr": 3.4400993797395664e-06, "epoch": 1.46432, "percentage": 73.33, "elapsed_time": "5:35:07", "remaining_time": "2:01:51"}
{"current_steps": 573, "total_steps": 780, "loss": 0.2655, "lr": 3.4091185606829793e-06, "epoch": 1.46688, "percentage": 73.46, "elapsed_time": "5:35:41", "remaining_time": "2:01:16"}
{"current_steps": 574, "total_steps": 780, "loss": 0.3024, "lr": 3.3782491854272736e-06, "epoch": 1.46944, "percentage": 73.59, "elapsed_time": "5:36:17", "remaining_time": "2:00:41"}
{"current_steps": 575, "total_steps": 780, "loss": 0.2755, "lr": 3.3474917759361036e-06, "epoch": 1.472, "percentage": 73.72, "elapsed_time": "5:36:52", "remaining_time": "2:00:06"}
{"current_steps": 576, "total_steps": 780, "loss": 0.2863, "lr": 3.316846852279907e-06, "epoch": 1.4745599999999999, "percentage": 73.85, "elapsed_time": "5:37:28", "remaining_time": "1:59:31"}
{"current_steps": 577, "total_steps": 780, "loss": 0.281, "lr": 3.2863149326271226e-06, "epoch": 1.47712, "percentage": 73.97, "elapsed_time": "5:38:04", "remaining_time": "1:58:56"}
{"current_steps": 578, "total_steps": 780, "loss": 0.27, "lr": 3.255896533235439e-06, "epoch": 1.47968, "percentage": 74.1, "elapsed_time": "5:38:40", "remaining_time": "1:58:21"}
{"current_steps": 579, "total_steps": 780, "loss": 0.2756, "lr": 3.2255921684430423e-06, "epoch": 1.48224, "percentage": 74.23, "elapsed_time": "5:39:15", "remaining_time": "1:57:46"}
{"current_steps": 580, "total_steps": 780, "loss": 0.321, "lr": 3.195402350659945e-06, "epoch": 1.4848, "percentage": 74.36, "elapsed_time": "5:39:49", "remaining_time": "1:57:11"}
{"current_steps": 581, "total_steps": 780, "loss": 0.2877, "lr": 3.165327590359295e-06, "epoch": 1.48736, "percentage": 74.49, "elapsed_time": "5:40:23", "remaining_time": "1:56:35"}
{"current_steps": 582, "total_steps": 780, "loss": 0.3027, "lr": 3.135368396068771e-06, "epoch": 1.4899200000000001, "percentage": 74.62, "elapsed_time": "5:40:57", "remaining_time": "1:55:59"}
{"current_steps": 583, "total_steps": 780, "loss": 0.2573, "lr": 3.1055252743619623e-06, "epoch": 1.49248, "percentage": 74.74, "elapsed_time": "5:41:32", "remaining_time": "1:55:24"}
{"current_steps": 584, "total_steps": 780, "loss": 0.2703, "lr": 3.0757987298498106e-06, "epoch": 1.49504, "percentage": 74.87, "elapsed_time": "5:42:08", "remaining_time": "1:54:49"}
{"current_steps": 585, "total_steps": 780, "loss": 0.2836, "lr": 3.046189265172085e-06, "epoch": 1.4976, "percentage": 75.0, "elapsed_time": "5:42:44", "remaining_time": "1:54:14"}
{"current_steps": 586, "total_steps": 780, "loss": 0.2958, "lr": 3.0166973809888776e-06, "epoch": 1.5001600000000002, "percentage": 75.13, "elapsed_time": "5:43:19", "remaining_time": "1:53:39"}
{"current_steps": 587, "total_steps": 780, "loss": 0.2819, "lr": 2.987323575972132e-06, "epoch": 1.50272, "percentage": 75.26, "elapsed_time": "5:43:55", "remaining_time": "1:53:04"}
{"current_steps": 588, "total_steps": 780, "loss": 0.2939, "lr": 2.958068346797217e-06, "epoch": 1.50528, "percentage": 75.38, "elapsed_time": "5:44:30", "remaining_time": "1:52:29"}
{"current_steps": 589, "total_steps": 780, "loss": 0.2822, "lr": 2.9289321881345257e-06, "epoch": 1.5078399999999998, "percentage": 75.51, "elapsed_time": "5:45:05", "remaining_time": "1:51:54"}
{"current_steps": 590, "total_steps": 780, "loss": 0.3133, "lr": 2.8999155926411203e-06, "epoch": 1.5104, "percentage": 75.64, "elapsed_time": "5:45:40", "remaining_time": "1:51:18"}
{"current_steps": 591, "total_steps": 780, "loss": 0.2718, "lr": 2.871019050952395e-06, "epoch": 1.51296, "percentage": 75.77, "elapsed_time": "5:46:15", "remaining_time": "1:50:43"}
{"current_steps": 592, "total_steps": 780, "loss": 0.2287, "lr": 2.8422430516737733e-06, "epoch": 1.51552, "percentage": 75.9, "elapsed_time": "5:46:50", "remaining_time": "1:50:08"}
{"current_steps": 593, "total_steps": 780, "loss": 0.2805, "lr": 2.813588081372456e-06, "epoch": 1.5180799999999999, "percentage": 76.03, "elapsed_time": "5:47:26", "remaining_time": "1:49:33"}
{"current_steps": 594, "total_steps": 780, "loss": 0.2783, "lr": 2.7850546245691866e-06, "epoch": 1.52064, "percentage": 76.15, "elapsed_time": "5:48:02", "remaining_time": "1:48:59"}
{"current_steps": 595, "total_steps": 780, "loss": 0.2936, "lr": 2.7566431637300738e-06, "epoch": 1.5232, "percentage": 76.28, "elapsed_time": "5:48:37", "remaining_time": "1:48:23"}
{"current_steps": 596, "total_steps": 780, "loss": 0.2858, "lr": 2.7283541792584165e-06, "epoch": 1.52576, "percentage": 76.41, "elapsed_time": "5:49:12", "remaining_time": "1:47:48"}
{"current_steps": 597, "total_steps": 780, "loss": 0.2717, "lr": 2.7001881494865845e-06, "epoch": 1.52832, "percentage": 76.54, "elapsed_time": "5:49:48", "remaining_time": "1:47:13"}
{"current_steps": 598, "total_steps": 780, "loss": 0.2761, "lr": 2.672145550667933e-06, "epoch": 1.53088, "percentage": 76.67, "elapsed_time": "5:50:22", "remaining_time": "1:46:38"}
{"current_steps": 599, "total_steps": 780, "loss": 0.266, "lr": 2.6442268569687567e-06, "epoch": 1.5334400000000001, "percentage": 76.79, "elapsed_time": "5:50:58", "remaining_time": "1:46:03"}
{"current_steps": 600, "total_steps": 780, "loss": 0.2839, "lr": 2.616432540460255e-06, "epoch": 1.536, "percentage": 76.92, "elapsed_time": "5:51:35", "remaining_time": "1:45:28"}
{"current_steps": 601, "total_steps": 780, "loss": 0.2996, "lr": 2.5887630711105705e-06, "epoch": 1.53856, "percentage": 77.05, "elapsed_time": "5:52:10", "remaining_time": "1:44:53"}
{"current_steps": 602, "total_steps": 780, "loss": 0.2827, "lr": 2.561218916776823e-06, "epoch": 1.54112, "percentage": 77.18, "elapsed_time": "5:52:46", "remaining_time": "1:44:18"}
{"current_steps": 603, "total_steps": 780, "loss": 0.2962, "lr": 2.5338005431972144e-06, "epoch": 1.5436800000000002, "percentage": 77.31, "elapsed_time": "5:53:20", "remaining_time": "1:43:42"}
{"current_steps": 604, "total_steps": 780, "loss": 0.2769, "lr": 2.5065084139831443e-06, "epoch": 1.54624, "percentage": 77.44, "elapsed_time": "5:53:56", "remaining_time": "1:43:08"}
{"current_steps": 605, "total_steps": 780, "loss": 0.2798, "lr": 2.4793429906113676e-06, "epoch": 1.5488, "percentage": 77.56, "elapsed_time": "5:54:32", "remaining_time": "1:42:33"}
{"current_steps": 606, "total_steps": 780, "loss": 0.2837, "lr": 2.4523047324162087e-06, "epoch": 1.5513599999999999, "percentage": 77.69, "elapsed_time": "5:55:07", "remaining_time": "1:41:57"}
{"current_steps": 607, "total_steps": 780, "loss": 0.3107, "lr": 2.4253940965817726e-06, "epoch": 1.55392, "percentage": 77.82, "elapsed_time": "5:55:42", "remaining_time": "1:41:22"}
{"current_steps": 608, "total_steps": 780, "loss": 0.3172, "lr": 2.3986115381342347e-06, "epoch": 1.55648, "percentage": 77.95, "elapsed_time": "5:56:17", "remaining_time": "1:40:47"}
{"current_steps": 609, "total_steps": 780, "loss": 0.2837, "lr": 2.3719575099341298e-06, "epoch": 1.55904, "percentage": 78.08, "elapsed_time": "5:56:51", "remaining_time": "1:40:12"}
{"current_steps": 610, "total_steps": 780, "loss": 0.2551, "lr": 2.345432462668702e-06, "epoch": 1.5615999999999999, "percentage": 78.21, "elapsed_time": "5:57:29", "remaining_time": "1:39:37"}
{"current_steps": 611, "total_steps": 780, "loss": 0.2574, "lr": 2.3190368448442936e-06, "epoch": 1.56416, "percentage": 78.33, "elapsed_time": "5:58:05", "remaining_time": "1:39:02"}
{"current_steps": 612, "total_steps": 780, "loss": 0.3037, "lr": 2.292771102778739e-06, "epoch": 1.5667200000000001, "percentage": 78.46, "elapsed_time": "5:58:38", "remaining_time": "1:38:27"}
{"current_steps": 613, "total_steps": 780, "loss": 0.3067, "lr": 2.266635680593845e-06, "epoch": 1.56928, "percentage": 78.59, "elapsed_time": "5:59:12", "remaining_time": "1:37:51"}
{"current_steps": 614, "total_steps": 780, "loss": 0.2807, "lr": 2.2406310202078586e-06, "epoch": 1.57184, "percentage": 78.72, "elapsed_time": "5:59:48", "remaining_time": "1:37:16"}
{"current_steps": 615, "total_steps": 780, "loss": 0.2997, "lr": 2.2147575613280013e-06, "epoch": 1.5744, "percentage": 78.85, "elapsed_time": "6:00:24", "remaining_time": "1:36:41"}
{"current_steps": 616, "total_steps": 780, "loss": 0.2528, "lr": 2.1890157414430448e-06, "epoch": 1.5769600000000001, "percentage": 78.97, "elapsed_time": "6:00:59", "remaining_time": "1:36:06"}
{"current_steps": 617, "total_steps": 780, "loss": 0.2771, "lr": 2.163405995815904e-06, "epoch": 1.57952, "percentage": 79.1, "elapsed_time": "6:01:33", "remaining_time": "1:35:31"}
{"current_steps": 618, "total_steps": 780, "loss": 0.3045, "lr": 2.1379287574762717e-06, "epoch": 1.58208, "percentage": 79.23, "elapsed_time": "6:02:08", "remaining_time": "1:34:55"}
{"current_steps": 619, "total_steps": 780, "loss": 0.319, "lr": 2.11258445721331e-06, "epoch": 1.58464, "percentage": 79.36, "elapsed_time": "6:02:43", "remaining_time": "1:34:20"}
{"current_steps": 620, "total_steps": 780, "loss": 0.2799, "lr": 2.0873735235683535e-06, "epoch": 1.5872000000000002, "percentage": 79.49, "elapsed_time": "6:03:18", "remaining_time": "1:33:45"}
{"current_steps": 621, "total_steps": 780, "loss": 0.2626, "lr": 2.0622963828276744e-06, "epoch": 1.58976, "percentage": 79.62, "elapsed_time": "6:03:52", "remaining_time": "1:33:10"}
{"current_steps": 622, "total_steps": 780, "loss": 0.2744, "lr": 2.037353459015272e-06, "epoch": 1.59232, "percentage": 79.74, "elapsed_time": "6:04:27", "remaining_time": "1:32:34"}
{"current_steps": 623, "total_steps": 780, "loss": 0.2296, "lr": 2.0125451738856903e-06, "epoch": 1.5948799999999999, "percentage": 79.87, "elapsed_time": "6:05:04", "remaining_time": "1:31:59"}
{"current_steps": 624, "total_steps": 780, "loss": 0.2595, "lr": 1.9878719469169104e-06, "epoch": 1.59744, "percentage": 80.0, "elapsed_time": "6:05:39", "remaining_time": "1:31:24"}
{"current_steps": 625, "total_steps": 780, "loss": 0.2906, "lr": 1.9633341953032246e-06, "epoch": 1.6, "percentage": 80.13, "elapsed_time": "6:06:12", "remaining_time": "1:30:49"}
{"current_steps": 626, "total_steps": 780, "loss": 0.2756, "lr": 1.9389323339482204e-06, "epoch": 1.60256, "percentage": 80.26, "elapsed_time": "6:06:48", "remaining_time": "1:30:14"}
{"current_steps": 627, "total_steps": 780, "loss": 0.3068, "lr": 1.9146667754577408e-06, "epoch": 1.6051199999999999, "percentage": 80.38, "elapsed_time": "6:07:23", "remaining_time": "1:29:39"}
{"current_steps": 628, "total_steps": 780, "loss": 0.2839, "lr": 1.890537930132903e-06, "epoch": 1.60768, "percentage": 80.51, "elapsed_time": "6:07:59", "remaining_time": "1:29:04"}
{"current_steps": 629, "total_steps": 780, "loss": 0.2491, "lr": 1.8665462059631866e-06, "epoch": 1.6102400000000001, "percentage": 80.64, "elapsed_time": "6:08:33", "remaining_time": "1:28:28"}
{"current_steps": 630, "total_steps": 780, "loss": 0.2904, "lr": 1.8426920086195065e-06, "epoch": 1.6128, "percentage": 80.77, "elapsed_time": "6:09:07", "remaining_time": "1:27:53"}
{"current_steps": 631, "total_steps": 780, "loss": 0.2441, "lr": 1.8189757414473686e-06, "epoch": 1.61536, "percentage": 80.9, "elapsed_time": "6:09:42", "remaining_time": "1:27:18"}
{"current_steps": 632, "total_steps": 780, "loss": 0.3003, "lr": 1.795397805460053e-06, "epoch": 1.61792, "percentage": 81.03, "elapsed_time": "6:10:18", "remaining_time": "1:26:43"}
{"current_steps": 633, "total_steps": 780, "loss": 0.2896, "lr": 1.7719585993318177e-06, "epoch": 1.6204800000000001, "percentage": 81.15, "elapsed_time": "6:10:53", "remaining_time": "1:26:07"}
{"current_steps": 634, "total_steps": 780, "loss": 0.2794, "lr": 1.7486585193911787e-06, "epoch": 1.62304, "percentage": 81.28, "elapsed_time": "6:11:28", "remaining_time": "1:25:32"}
{"current_steps": 635, "total_steps": 780, "loss": 0.2616, "lr": 1.7254979596141886e-06, "epoch": 1.6256, "percentage": 81.41, "elapsed_time": "6:12:02", "remaining_time": "1:24:57"}
{"current_steps": 636, "total_steps": 780, "loss": 0.2912, "lr": 1.7024773116177839e-06, "epoch": 1.62816, "percentage": 81.54, "elapsed_time": "6:12:38", "remaining_time": "1:24:22"}
{"current_steps": 637, "total_steps": 780, "loss": 0.2617, "lr": 1.6795969646531685e-06, "epoch": 1.63072, "percentage": 81.67, "elapsed_time": "6:13:14", "remaining_time": "1:23:47"}
{"current_steps": 638, "total_steps": 780, "loss": 0.2784, "lr": 1.6568573055992188e-06, "epoch": 1.63328, "percentage": 81.79, "elapsed_time": "6:13:49", "remaining_time": "1:23:12"}
{"current_steps": 639, "total_steps": 780, "loss": 0.2696, "lr": 1.6342587189559577e-06, "epoch": 1.63584, "percentage": 81.92, "elapsed_time": "6:14:24", "remaining_time": "1:22:37"}
{"current_steps": 640, "total_steps": 780, "loss": 0.2386, "lr": 1.6118015868380387e-06, "epoch": 1.6383999999999999, "percentage": 82.05, "elapsed_time": "6:15:00", "remaining_time": "1:22:02"}
{"current_steps": 641, "total_steps": 780, "loss": 0.2955, "lr": 1.5894862889682906e-06, "epoch": 1.64096, "percentage": 82.18, "elapsed_time": "6:15:36", "remaining_time": "1:21:26"}
{"current_steps": 642, "total_steps": 780, "loss": 0.2843, "lr": 1.5673132026713046e-06, "epoch": 1.64352, "percentage": 82.31, "elapsed_time": "6:16:13", "remaining_time": "1:20:52"}
{"current_steps": 643, "total_steps": 780, "loss": 0.3071, "lr": 1.5452827028670358e-06, "epoch": 1.64608, "percentage": 82.44, "elapsed_time": "6:16:48", "remaining_time": "1:20:17"}
{"current_steps": 644, "total_steps": 780, "loss": 0.251, "lr": 1.523395162064486e-06, "epoch": 1.6486399999999999, "percentage": 82.56, "elapsed_time": "6:17:22", "remaining_time": "1:19:41"}
{"current_steps": 645, "total_steps": 780, "loss": 0.2755, "lr": 1.50165095035539e-06, "epoch": 1.6512, "percentage": 82.69, "elapsed_time": "6:17:58", "remaining_time": "1:19:06"}
{"current_steps": 646, "total_steps": 780, "loss": 0.2614, "lr": 1.480050435407957e-06, "epoch": 1.6537600000000001, "percentage": 82.82, "elapsed_time": "6:18:33", "remaining_time": "1:18:31"}
{"current_steps": 647, "total_steps": 780, "loss": 0.255, "lr": 1.4585939824606621e-06, "epoch": 1.65632, "percentage": 82.95, "elapsed_time": "6:19:08", "remaining_time": "1:17:56"}
{"current_steps": 648, "total_steps": 780, "loss": 0.2807, "lr": 1.437281954316071e-06, "epoch": 1.65888, "percentage": 83.08, "elapsed_time": "6:19:43", "remaining_time": "1:17:21"}
{"current_steps": 649, "total_steps": 780, "loss": 0.2702, "lr": 1.4161147113346917e-06, "epoch": 1.66144, "percentage": 83.21, "elapsed_time": "6:20:19", "remaining_time": "1:16:46"}
{"current_steps": 650, "total_steps": 780, "loss": 0.251, "lr": 1.395092611428902e-06, "epoch": 1.6640000000000001, "percentage": 83.33, "elapsed_time": "6:20:54", "remaining_time": "1:16:10"}
{"current_steps": 651, "total_steps": 780, "loss": 0.2985, "lr": 1.374216010056879e-06, "epoch": 1.66656, "percentage": 83.46, "elapsed_time": "6:21:30", "remaining_time": "1:15:35"}
{"current_steps": 652, "total_steps": 780, "loss": 0.3067, "lr": 1.353485260216596e-06, "epoch": 1.66912, "percentage": 83.59, "elapsed_time": "6:22:05", "remaining_time": "1:15:00"}
{"current_steps": 653, "total_steps": 780, "loss": 0.2331, "lr": 1.3329007124398608e-06, "epoch": 1.67168, "percentage": 83.72, "elapsed_time": "6:22:40", "remaining_time": "1:14:25"}
{"current_steps": 654, "total_steps": 780, "loss": 0.2878, "lr": 1.3124627147863733e-06, "epoch": 1.67424, "percentage": 83.85, "elapsed_time": "6:23:16", "remaining_time": "1:13:50"}
{"current_steps": 655, "total_steps": 780, "loss": 0.2522, "lr": 1.2921716128378581e-06, "epoch": 1.6768, "percentage": 83.97, "elapsed_time": "6:23:51", "remaining_time": "1:13:15"}
{"current_steps": 656, "total_steps": 780, "loss": 0.261, "lr": 1.272027749692203e-06, "epoch": 1.67936, "percentage": 84.1, "elapsed_time": "6:24:25", "remaining_time": "1:12:39"}
{"current_steps": 657, "total_steps": 780, "loss": 0.2708, "lr": 1.2520314659576683e-06, "epoch": 1.6819199999999999, "percentage": 84.23, "elapsed_time": "6:25:00", "remaining_time": "1:12:04"}
{"current_steps": 658, "total_steps": 780, "loss": 0.3082, "lr": 1.2321830997471329e-06, "epoch": 1.68448, "percentage": 84.36, "elapsed_time": "6:25:35", "remaining_time": "1:11:29"}
{"current_steps": 659, "total_steps": 780, "loss": 0.2438, "lr": 1.212482986672361e-06, "epoch": 1.68704, "percentage": 84.49, "elapsed_time": "6:26:11", "remaining_time": "1:10:54"}
{"current_steps": 660, "total_steps": 780, "loss": 0.2664, "lr": 1.1929314598383423e-06, "epoch": 1.6896, "percentage": 84.62, "elapsed_time": "6:26:46", "remaining_time": "1:10:19"}
{"current_steps": 661, "total_steps": 780, "loss": 0.2784, "lr": 1.1735288498376495e-06, "epoch": 1.6921599999999999, "percentage": 84.74, "elapsed_time": "6:27:20", "remaining_time": "1:09:43"}
{"current_steps": 662, "total_steps": 780, "loss": 0.2585, "lr": 1.1542754847448544e-06, "epoch": 1.69472, "percentage": 84.87, "elapsed_time": "6:27:56", "remaining_time": "1:09:09"}
{"current_steps": 663, "total_steps": 780, "loss": 0.2675, "lr": 1.13517169011098e-06, "epoch": 1.6972800000000001, "percentage": 85.0, "elapsed_time": "6:28:31", "remaining_time": "1:08:33"}
{"current_steps": 664, "total_steps": 780, "loss": 0.2456, "lr": 1.1162177889579906e-06, "epoch": 1.69984, "percentage": 85.13, "elapsed_time": "6:29:06", "remaining_time": "1:07:58"}
{"current_steps": 665, "total_steps": 780, "loss": 0.2219, "lr": 1.0974141017733386e-06, "epoch": 1.7024, "percentage": 85.26, "elapsed_time": "6:29:42", "remaining_time": "1:07:23"}
{"current_steps": 666, "total_steps": 780, "loss": 0.2878, "lr": 1.078760946504539e-06, "epoch": 1.70496, "percentage": 85.38, "elapsed_time": "6:30:15", "remaining_time": "1:06:48"}
{"current_steps": 667, "total_steps": 780, "loss": 0.2581, "lr": 1.0602586385537928e-06, "epoch": 1.7075200000000001, "percentage": 85.51, "elapsed_time": "6:30:50", "remaining_time": "1:06:12"}
{"current_steps": 668, "total_steps": 780, "loss": 0.2498, "lr": 1.041907490772658e-06, "epoch": 1.71008, "percentage": 85.64, "elapsed_time": "6:31:26", "remaining_time": "1:05:37"}
{"current_steps": 669, "total_steps": 780, "loss": 0.2505, "lr": 1.0237078134567535e-06, "epoch": 1.71264, "percentage": 85.77, "elapsed_time": "6:32:00", "remaining_time": "1:05:02"}
{"current_steps": 670, "total_steps": 780, "loss": 0.2754, "lr": 1.0056599143405244e-06, "epoch": 1.7151999999999998, "percentage": 85.9, "elapsed_time": "6:32:37", "remaining_time": "1:04:27"}
{"current_steps": 671, "total_steps": 780, "loss": 0.2798, "lr": 9.877640985920268e-07, "epoch": 1.71776, "percentage": 86.03, "elapsed_time": "6:33:11", "remaining_time": "1:03:52"}
{"current_steps": 672, "total_steps": 780, "loss": 0.2298, "lr": 9.700206688077707e-07, "epoch": 1.72032, "percentage": 86.15, "elapsed_time": "6:33:46", "remaining_time": "1:03:17"}
{"current_steps": 673, "total_steps": 780, "loss": 0.2805, "lr": 9.524299250076052e-07, "epoch": 1.72288, "percentage": 86.28, "elapsed_time": "6:34:21", "remaining_time": "1:02:41"}
{"current_steps": 674, "total_steps": 780, "loss": 0.2548, "lr": 9.349921646296423e-07, "epoch": 1.7254399999999999, "percentage": 86.41, "elapsed_time": "6:34:56", "remaining_time": "1:02:06"}
{"current_steps": 675, "total_steps": 780, "loss": 0.2343, "lr": 9.177076825252351e-07, "epoch": 1.728, "percentage": 86.54, "elapsed_time": "6:35:30", "remaining_time": "1:01:31"}
{"current_steps": 676, "total_steps": 780, "loss": 0.2783, "lr": 9.00576770953987e-07, "epoch": 1.73056, "percentage": 86.67, "elapsed_time": "6:36:04", "remaining_time": "1:00:56"}
{"current_steps": 677, "total_steps": 780, "loss": 0.2596, "lr": 8.835997195788071e-07, "epoch": 1.73312, "percentage": 86.79, "elapsed_time": "6:36:40", "remaining_time": "1:00:21"}
{"current_steps": 678, "total_steps": 780, "loss": 0.2754, "lr": 8.667768154610124e-07, "epoch": 1.73568, "percentage": 86.92, "elapsed_time": "6:37:16", "remaining_time": "0:59:45"}
{"current_steps": 679, "total_steps": 780, "loss": 0.2655, "lr": 8.501083430554868e-07, "epoch": 1.73824, "percentage": 87.05, "elapsed_time": "6:37:52", "remaining_time": "0:59:10"}
{"current_steps": 680, "total_steps": 780, "loss": 0.2853, "lr": 8.335945842058524e-07, "epoch": 1.7408000000000001, "percentage": 87.18, "elapsed_time": "6:38:26", "remaining_time": "0:58:35"}
{"current_steps": 681, "total_steps": 780, "loss": 0.2669, "lr": 8.172358181397178e-07, "epoch": 1.74336, "percentage": 87.31, "elapsed_time": "6:39:01", "remaining_time": "0:58:00"}
{"current_steps": 682, "total_steps": 780, "loss": 0.2939, "lr": 8.010323214639492e-07, "epoch": 1.74592, "percentage": 87.44, "elapsed_time": "6:39:36", "remaining_time": "0:57:25"}
{"current_steps": 683, "total_steps": 780, "loss": 0.2919, "lr": 7.849843681599978e-07, "epoch": 1.74848, "percentage": 87.56, "elapsed_time": "6:40:09", "remaining_time": "0:56:49"}
{"current_steps": 684, "total_steps": 780, "loss": 0.2405, "lr": 7.690922295792647e-07, "epoch": 1.7510400000000002, "percentage": 87.69, "elapsed_time": "6:40:44", "remaining_time": "0:56:14"}
{"current_steps": 685, "total_steps": 780, "loss": 0.2692, "lr": 7.53356174438512e-07, "epoch": 1.7536, "percentage": 87.82, "elapsed_time": "6:41:20", "remaining_time": "0:55:39"}
{"current_steps": 686, "total_steps": 780, "loss": 0.2444, "lr": 7.377764688153244e-07, "epoch": 1.75616, "percentage": 87.95, "elapsed_time": "6:41:54", "remaining_time": "0:55:04"}
{"current_steps": 687, "total_steps": 780, "loss": 0.2283, "lr": 7.223533761435986e-07, "epoch": 1.7587199999999998, "percentage": 88.08, "elapsed_time": "6:42:29", "remaining_time": "0:54:29"}
{"current_steps": 688, "total_steps": 780, "loss": 0.2447, "lr": 7.070871572091076e-07, "epoch": 1.76128, "percentage": 88.21, "elapsed_time": "6:43:04", "remaining_time": "0:53:54"}
{"current_steps": 689, "total_steps": 780, "loss": 0.3117, "lr": 6.919780701450684e-07, "epoch": 1.76384, "percentage": 88.33, "elapsed_time": "6:43:40", "remaining_time": "0:53:18"}
{"current_steps": 690, "total_steps": 780, "loss": 0.2489, "lr": 6.770263704277958e-07, "epoch": 1.7664, "percentage": 88.46, "elapsed_time": "6:44:13", "remaining_time": "0:52:43"}
{"current_steps": 691, "total_steps": 780, "loss": 0.2933, "lr": 6.62232310872375e-07, "epoch": 1.7689599999999999, "percentage": 88.59, "elapsed_time": "6:44:47", "remaining_time": "0:52:08"}
{"current_steps": 692, "total_steps": 780, "loss": 0.2976, "lr": 6.475961416283838e-07, "epoch": 1.77152, "percentage": 88.72, "elapsed_time": "6:45:22", "remaining_time": "0:51:32"}
{"current_steps": 693, "total_steps": 780, "loss": 0.2525, "lr": 6.331181101756733e-07, "epoch": 1.77408, "percentage": 88.85, "elapsed_time": "6:45:58", "remaining_time": "0:50:57"}
{"current_steps": 694, "total_steps": 780, "loss": 0.2724, "lr": 6.187984613201703e-07, "epoch": 1.77664, "percentage": 88.97, "elapsed_time": "6:46:33", "remaining_time": "0:50:22"}
{"current_steps": 695, "total_steps": 780, "loss": 0.2676, "lr": 6.046374371897446e-07, "epoch": 1.7792, "percentage": 89.1, "elapsed_time": "6:47:08", "remaining_time": "0:49:47"}
{"current_steps": 696, "total_steps": 780, "loss": 0.2734, "lr": 5.906352772301193e-07, "epoch": 1.78176, "percentage": 89.23, "elapsed_time": "6:47:42", "remaining_time": "0:49:12"}
{"current_steps": 697, "total_steps": 780, "loss": 0.2753, "lr": 5.767922182008145e-07, "epoch": 1.7843200000000001, "percentage": 89.36, "elapsed_time": "6:48:17", "remaining_time": "0:48:37"}
{"current_steps": 698, "total_steps": 780, "loss": 0.2673, "lr": 5.631084941711473e-07, "epoch": 1.78688, "percentage": 89.49, "elapsed_time": "6:48:51", "remaining_time": "0:48:01"}
{"current_steps": 699, "total_steps": 780, "loss": 0.2901, "lr": 5.495843365162701e-07, "epoch": 1.78944, "percentage": 89.62, "elapsed_time": "6:49:26", "remaining_time": "0:47:26"}
{"current_steps": 700, "total_steps": 780, "loss": 0.2747, "lr": 5.362199739132656e-07, "epoch": 1.792, "percentage": 89.74, "elapsed_time": "6:50:00", "remaining_time": "0:46:51"}
{"current_steps": 701, "total_steps": 780, "loss": 0.2524, "lr": 5.230156323372759e-07, "epoch": 1.7945600000000002, "percentage": 89.87, "elapsed_time": "6:50:35", "remaining_time": "0:46:16"}
{"current_steps": 702, "total_steps": 780, "loss": 0.2676, "lr": 5.099715350576817e-07, "epoch": 1.79712, "percentage": 90.0, "elapsed_time": "6:51:11", "remaining_time": "0:45:41"}
{"current_steps": 703, "total_steps": 780, "loss": 0.2747, "lr": 4.970879026343256e-07, "epoch": 1.79968, "percentage": 90.13, "elapsed_time": "6:51:46", "remaining_time": "0:45:06"}
{"current_steps": 704, "total_steps": 780, "loss": 0.2708, "lr": 4.843649529137861e-07, "epoch": 1.8022399999999998, "percentage": 90.26, "elapsed_time": "6:52:21", "remaining_time": "0:44:30"}
{"current_steps": 705, "total_steps": 780, "loss": 0.3164, "lr": 4.7180290102568973e-07, "epoch": 1.8048, "percentage": 90.38, "elapsed_time": "6:52:55", "remaining_time": "0:43:55"}
{"current_steps": 706, "total_steps": 780, "loss": 0.2927, "lr": 4.594019593790799e-07, "epoch": 1.80736, "percentage": 90.51, "elapsed_time": "6:53:30", "remaining_time": "0:43:20"}
{"current_steps": 707, "total_steps": 780, "loss": 0.2628, "lr": 4.471623376588197e-07, "epoch": 1.80992, "percentage": 90.64, "elapsed_time": "6:54:06", "remaining_time": "0:42:45"}
{"current_steps": 708, "total_steps": 780, "loss": 0.2582, "lr": 4.35084242822047e-07, "epoch": 1.8124799999999999, "percentage": 90.77, "elapsed_time": "6:54:41", "remaining_time": "0:42:10"}
{"current_steps": 709, "total_steps": 780, "loss": 0.2753, "lr": 4.2316787909467915e-07, "epoch": 1.81504, "percentage": 90.9, "elapsed_time": "6:55:15", "remaining_time": "0:41:35"}
{"current_steps": 710, "total_steps": 780, "loss": 0.2678, "lr": 4.114134479679543e-07, "epoch": 1.8176, "percentage": 91.03, "elapsed_time": "6:55:49", "remaining_time": "0:40:59"}
{"current_steps": 711, "total_steps": 780, "loss": 0.2892, "lr": 3.998211481950254e-07, "epoch": 1.82016, "percentage": 91.15, "elapsed_time": "6:56:24", "remaining_time": "0:40:24"}
{"current_steps": 712, "total_steps": 780, "loss": 0.2728, "lr": 3.883911757876058e-07, "epoch": 1.82272, "percentage": 91.28, "elapsed_time": "6:56:59", "remaining_time": "0:39:49"}
{"current_steps": 713, "total_steps": 780, "loss": 0.2735, "lr": 3.771237240126469e-07, "epoch": 1.82528, "percentage": 91.41, "elapsed_time": "6:57:35", "remaining_time": "0:39:14"}
{"current_steps": 714, "total_steps": 780, "loss": 0.2597, "lr": 3.66018983389077e-07, "epoch": 1.8278400000000001, "percentage": 91.54, "elapsed_time": "6:58:09", "remaining_time": "0:38:39"}
{"current_steps": 715, "total_steps": 780, "loss": 0.2665, "lr": 3.5507714168457e-07, "epoch": 1.8304, "percentage": 91.67, "elapsed_time": "6:58:45", "remaining_time": "0:38:04"}
{"current_steps": 716, "total_steps": 780, "loss": 0.2805, "lr": 3.442983839123826e-07, "epoch": 1.83296, "percentage": 91.79, "elapsed_time": "6:59:19", "remaining_time": "0:37:28"}
{"current_steps": 717, "total_steps": 780, "loss": 0.246, "lr": 3.3368289232822094e-07, "epoch": 1.83552, "percentage": 91.92, "elapsed_time": "6:59:54", "remaining_time": "0:36:53"}
{"current_steps": 718, "total_steps": 780, "loss": 0.2947, "lr": 3.232308464271505e-07, "epoch": 1.8380800000000002, "percentage": 92.05, "elapsed_time": "7:00:29", "remaining_time": "0:36:18"}
{"current_steps": 719, "total_steps": 780, "loss": 0.3191, "lr": 3.1294242294057974e-07, "epoch": 1.84064, "percentage": 92.18, "elapsed_time": "7:01:06", "remaining_time": "0:35:43"}
{"current_steps": 720, "total_steps": 780, "loss": 0.2548, "lr": 3.028177958332512e-07, "epoch": 1.8432, "percentage": 92.31, "elapsed_time": "7:01:42", "remaining_time": "0:35:08"}
{"current_steps": 721, "total_steps": 780, "loss": 0.3028, "lr": 2.928571363003152e-07, "epoch": 1.8457599999999998, "percentage": 92.44, "elapsed_time": "7:02:17", "remaining_time": "0:34:33"}
{"current_steps": 722, "total_steps": 780, "loss": 0.2631, "lr": 2.8306061276442753e-07, "epoch": 1.84832, "percentage": 92.56, "elapsed_time": "7:02:52", "remaining_time": "0:33:58"}
{"current_steps": 723, "total_steps": 780, "loss": 0.2518, "lr": 2.7342839087290183e-07, "epoch": 1.85088, "percentage": 92.69, "elapsed_time": "7:03:28", "remaining_time": "0:33:23"}
{"current_steps": 724, "total_steps": 780, "loss": 0.2908, "lr": 2.639606334949163e-07, "epoch": 1.85344, "percentage": 92.82, "elapsed_time": "7:04:03", "remaining_time": "0:32:48"}
{"current_steps": 725, "total_steps": 780, "loss": 0.2649, "lr": 2.5465750071874797e-07, "epoch": 1.8559999999999999, "percentage": 92.95, "elapsed_time": "7:04:39", "remaining_time": "0:32:12"}
{"current_steps": 726, "total_steps": 780, "loss": 0.2664, "lr": 2.455191498490739e-07, "epoch": 1.85856, "percentage": 93.08, "elapsed_time": "7:05:15", "remaining_time": "0:31:37"}
{"current_steps": 727, "total_steps": 780, "loss": 0.2172, "lr": 2.365457354043088e-07, "epoch": 1.86112, "percentage": 93.21, "elapsed_time": "7:05:49", "remaining_time": "0:31:02"}
{"current_steps": 728, "total_steps": 780, "loss": 0.2504, "lr": 2.27737409113995e-07, "epoch": 1.86368, "percentage": 93.33, "elapsed_time": "7:06:24", "remaining_time": "0:30:27"}
{"current_steps": 729, "total_steps": 780, "loss": 0.2615, "lr": 2.1909431991623097e-07, "epoch": 1.86624, "percentage": 93.46, "elapsed_time": "7:06:59", "remaining_time": "0:29:52"}
{"current_steps": 730, "total_steps": 780, "loss": 0.2668, "lr": 2.106166139551602e-07, "epoch": 1.8688, "percentage": 93.59, "elapsed_time": "7:07:33", "remaining_time": "0:29:17"}
{"current_steps": 731, "total_steps": 780, "loss": 0.2797, "lr": 2.0230443457849414e-07, "epoch": 1.8713600000000001, "percentage": 93.72, "elapsed_time": "7:08:07", "remaining_time": "0:28:41"}
{"current_steps": 732, "total_steps": 780, "loss": 0.2304, "lr": 1.941579223350898e-07, "epoch": 1.87392, "percentage": 93.85, "elapsed_time": "7:08:41", "remaining_time": "0:28:06"}
{"current_steps": 733, "total_steps": 780, "loss": 0.2505, "lr": 1.8617721497257823e-07, "epoch": 1.87648, "percentage": 93.97, "elapsed_time": "7:09:16", "remaining_time": "0:27:31"}
{"current_steps": 734, "total_steps": 780, "loss": 0.2364, "lr": 1.7836244743502762e-07, "epoch": 1.87904, "percentage": 94.1, "elapsed_time": "7:09:53", "remaining_time": "0:26:56"}
{"current_steps": 735, "total_steps": 780, "loss": 0.2449, "lr": 1.7071375186066607e-07, "epoch": 1.8816000000000002, "percentage": 94.23, "elapsed_time": "7:10:27", "remaining_time": "0:26:21"}
{"current_steps": 736, "total_steps": 780, "loss": 0.2692, "lr": 1.6323125757964799e-07, "epoch": 1.88416, "percentage": 94.36, "elapsed_time": "7:11:04", "remaining_time": "0:25:46"}
{"current_steps": 737, "total_steps": 780, "loss": 0.2652, "lr": 1.5591509111186342e-07, "epoch": 1.88672, "percentage": 94.49, "elapsed_time": "7:11:39", "remaining_time": "0:25:11"}
{"current_steps": 738, "total_steps": 780, "loss": 0.2881, "lr": 1.4876537616480335e-07, "epoch": 1.8892799999999998, "percentage": 94.62, "elapsed_time": "7:12:15", "remaining_time": "0:24:35"}
{"current_steps": 739, "total_steps": 780, "loss": 0.2622, "lr": 1.4178223363146226e-07, "epoch": 1.89184, "percentage": 94.74, "elapsed_time": "7:12:48", "remaining_time": "0:24:00"}
{"current_steps": 740, "total_steps": 780, "loss": 0.2961, "lr": 1.349657815883032e-07, "epoch": 1.8944, "percentage": 94.87, "elapsed_time": "7:13:23", "remaining_time": "0:23:25"}
{"current_steps": 741, "total_steps": 780, "loss": 0.2736, "lr": 1.283161352932505e-07, "epoch": 1.89696, "percentage": 95.0, "elapsed_time": "7:13:59", "remaining_time": "0:22:50"}
{"current_steps": 742, "total_steps": 780, "loss": 0.2583, "lr": 1.218334071837468e-07, "epoch": 1.8995199999999999, "percentage": 95.13, "elapsed_time": "7:14:34", "remaining_time": "0:22:15"}
{"current_steps": 743, "total_steps": 780, "loss": 0.2758, "lr": 1.1551770687485142e-07, "epoch": 1.90208, "percentage": 95.26, "elapsed_time": "7:15:07", "remaining_time": "0:21:40"}
{"current_steps": 744, "total_steps": 780, "loss": 0.2657, "lr": 1.0936914115738717e-07, "epoch": 1.90464, "percentage": 95.38, "elapsed_time": "7:15:41", "remaining_time": "0:21:04"}
{"current_steps": 745, "total_steps": 780, "loss": 0.2642, "lr": 1.0338781399613307e-07, "epoch": 1.9072, "percentage": 95.51, "elapsed_time": "7:16:15", "remaining_time": "0:20:29"}
{"current_steps": 746, "total_steps": 780, "loss": 0.2545, "lr": 9.757382652806791e-08, "epoch": 1.90976, "percentage": 95.64, "elapsed_time": "7:16:53", "remaining_time": "0:19:54"}
{"current_steps": 747, "total_steps": 780, "loss": 0.2583, "lr": 9.192727706065829e-08, "epoch": 1.91232, "percentage": 95.77, "elapsed_time": "7:17:27", "remaining_time": "0:19:19"}
{"current_steps": 748, "total_steps": 780, "loss": 0.2814, "lr": 8.644826107019888e-08, "epoch": 1.9148800000000001, "percentage": 95.9, "elapsed_time": "7:18:02", "remaining_time": "0:18:44"}
{"current_steps": 749, "total_steps": 780, "loss": 0.2601, "lr": 8.113687120019587e-08, "epoch": 1.91744, "percentage": 96.03, "elapsed_time": "7:18:37", "remaining_time": "0:18:09"}
{"current_steps": 750, "total_steps": 780, "loss": 0.2621, "lr": 7.599319725980047e-08, "epoch": 1.92, "percentage": 96.15, "elapsed_time": "7:19:11", "remaining_time": "0:17:34"}
{"current_steps": 751, "total_steps": 780, "loss": 0.2881, "lr": 7.101732622229462e-08, "epoch": 1.92256, "percentage": 96.28, "elapsed_time": "7:19:47", "remaining_time": "0:16:58"}
{"current_steps": 752, "total_steps": 780, "loss": 0.3086, "lr": 6.62093422236132e-08, "epoch": 1.9251200000000002, "percentage": 96.41, "elapsed_time": "7:20:24", "remaining_time": "0:16:23"}
{"current_steps": 753, "total_steps": 780, "loss": 0.2647, "lr": 6.15693265609274e-08, "epoch": 1.92768, "percentage": 96.54, "elapsed_time": "7:20:58", "remaining_time": "0:15:48"}
{"current_steps": 754, "total_steps": 780, "loss": 0.2815, "lr": 5.709735769126479e-08, "epoch": 1.93024, "percentage": 96.67, "elapsed_time": "7:21:32", "remaining_time": "0:15:13"}
{"current_steps": 755, "total_steps": 780, "loss": 0.2307, "lr": 5.279351123019028e-08, "epoch": 1.9327999999999999, "percentage": 96.79, "elapsed_time": "7:22:04", "remaining_time": "0:14:38"}
{"current_steps": 756, "total_steps": 780, "loss": 0.2741, "lr": 4.8657859950520524e-08, "epoch": 1.93536, "percentage": 96.92, "elapsed_time": "7:22:41", "remaining_time": "0:14:03"}
{"current_steps": 757, "total_steps": 780, "loss": 0.2949, "lr": 4.469047378109603e-08, "epoch": 1.93792, "percentage": 97.05, "elapsed_time": "7:23:16", "remaining_time": "0:13:28"}
{"current_steps": 758, "total_steps": 780, "loss": 0.2564, "lr": 4.0891419805597634e-08, "epoch": 1.94048, "percentage": 97.18, "elapsed_time": "7:23:52", "remaining_time": "0:12:52"}
{"current_steps": 759, "total_steps": 780, "loss": 0.2654, "lr": 3.7260762261416287e-08, "epoch": 1.9430399999999999, "percentage": 97.31, "elapsed_time": "7:24:28", "remaining_time": "0:12:17"}
{"current_steps": 760, "total_steps": 780, "loss": 0.2441, "lr": 3.379856253855951e-08, "epoch": 1.9456, "percentage": 97.44, "elapsed_time": "7:25:01", "remaining_time": "0:11:42"}
{"current_steps": 761, "total_steps": 780, "loss": 0.2748, "lr": 3.0504879178622214e-08, "epoch": 1.9481600000000001, "percentage": 97.56, "elapsed_time": "7:25:35", "remaining_time": "0:11:07"}
{"current_steps": 762, "total_steps": 780, "loss": 0.2456, "lr": 2.73797678737886e-08, "epoch": 1.95072, "percentage": 97.69, "elapsed_time": "7:26:10", "remaining_time": "0:10:32"}
{"current_steps": 763, "total_steps": 780, "loss": 0.2799, "lr": 2.442328146589512e-08, "epoch": 1.95328, "percentage": 97.82, "elapsed_time": "7:26:47", "remaining_time": "0:09:57"}
{"current_steps": 764, "total_steps": 780, "loss": 0.2402, "lr": 2.163546994553789e-08, "epoch": 1.95584, "percentage": 97.95, "elapsed_time": "7:27:22", "remaining_time": "0:09:22"}
{"current_steps": 765, "total_steps": 780, "loss": 0.2944, "lr": 1.9016380451223337e-08, "epoch": 1.9584000000000001, "percentage": 98.08, "elapsed_time": "7:27:58", "remaining_time": "0:08:47"}
{"current_steps": 766, "total_steps": 780, "loss": 0.2704, "lr": 1.656605726857441e-08, "epoch": 1.96096, "percentage": 98.21, "elapsed_time": "7:28:35", "remaining_time": "0:08:11"}
{"current_steps": 767, "total_steps": 780, "loss": 0.3189, "lr": 1.4284541829580056e-08, "epoch": 1.96352, "percentage": 98.33, "elapsed_time": "7:29:09", "remaining_time": "0:07:36"}
{"current_steps": 768, "total_steps": 780, "loss": 0.2729, "lr": 1.2171872711895794e-08, "epoch": 1.96608, "percentage": 98.46, "elapsed_time": "7:29:43", "remaining_time": "0:07:01"}
{"current_steps": 769, "total_steps": 780, "loss": 0.2613, "lr": 1.0228085638190887e-08, "epoch": 1.96864, "percentage": 98.59, "elapsed_time": "7:30:19", "remaining_time": "0:06:26"}
{"current_steps": 770, "total_steps": 780, "loss": 0.2625, "lr": 8.453213475543287e-09, "epoch": 1.9712, "percentage": 98.72, "elapsed_time": "7:30:54", "remaining_time": "0:05:51"}
{"current_steps": 771, "total_steps": 780, "loss": 0.2557, "lr": 6.84728623488562e-09, "epoch": 1.97376, "percentage": 98.85, "elapsed_time": "7:31:28", "remaining_time": "0:05:16"}
{"current_steps": 772, "total_steps": 780, "loss": 0.2712, "lr": 5.410331070498931e-09, "epoch": 1.9763199999999999, "percentage": 98.97, "elapsed_time": "7:32:04", "remaining_time": "0:04:41"}
{"current_steps": 773, "total_steps": 780, "loss": 0.2593, "lr": 4.142372279548612e-09, "epoch": 1.97888, "percentage": 99.1, "elapsed_time": "7:32:38", "remaining_time": "0:04:05"}
{"current_steps": 774, "total_steps": 780, "loss": 0.2226, "lr": 3.043431301678057e-09, "epoch": 1.98144, "percentage": 99.23, "elapsed_time": "7:33:15", "remaining_time": "0:03:30"}
{"current_steps": 775, "total_steps": 780, "loss": 0.2807, "lr": 2.11352671864562e-09, "epoch": 1.984, "percentage": 99.36, "elapsed_time": "7:33:50", "remaining_time": "0:02:55"}
{"current_steps": 776, "total_steps": 780, "loss": 0.2718, "lr": 1.3526742540070913e-09, "epoch": 1.9865599999999999, "percentage": 99.49, "elapsed_time": "7:34:26", "remaining_time": "0:02:20"}
{"current_steps": 777, "total_steps": 780, "loss": 0.2749, "lr": 7.608867728536862e-10, "epoch": 1.98912, "percentage": 99.62, "elapsed_time": "7:35:01", "remaining_time": "0:01:45"}
{"current_steps": 778, "total_steps": 780, "loss": 0.2902, "lr": 3.381742815944389e-10, "epoch": 1.9916800000000001, "percentage": 99.74, "elapsed_time": "7:35:36", "remaining_time": "0:01:10"}
{"current_steps": 779, "total_steps": 780, "loss": 0.2478, "lr": 8.454392778189935e-11, "epoch": 1.99424, "percentage": 99.87, "elapsed_time": "7:36:11", "remaining_time": "0:00:35"}
{"current_steps": 780, "total_steps": 780, "loss": 0.2642, "lr": 0.0, "epoch": 1.9968, "percentage": 100.0, "elapsed_time": "7:36:47", "remaining_time": "0:00:00"}
{"current_steps": 780, "total_steps": 780, "epoch": 1.9968, "percentage": 100.0, "elapsed_time": "7:37:33", "remaining_time": "0:00:00"}