hf-reset
Reset repository without checkpoints directories
c544b93
{"current_steps": 5, "total_steps": 3750, "loss": 0.8749, "lr": 4.266666666666667e-07, "epoch": 0.008, "percentage": 0.13, "elapsed_time": "0:00:28", "remaining_time": "5:59:38"}
{"current_steps": 10, "total_steps": 3750, "loss": 0.8863, "lr": 9.600000000000001e-07, "epoch": 0.016, "percentage": 0.27, "elapsed_time": "0:00:46", "remaining_time": "4:49:04"}
{"current_steps": 15, "total_steps": 3750, "loss": 0.8563, "lr": 1.4933333333333336e-06, "epoch": 0.024, "percentage": 0.4, "elapsed_time": "0:01:07", "remaining_time": "4:40:47"}
{"current_steps": 20, "total_steps": 3750, "loss": 0.7908, "lr": 2.0266666666666666e-06, "epoch": 0.032, "percentage": 0.53, "elapsed_time": "0:01:27", "remaining_time": "4:33:28"}
{"current_steps": 25, "total_steps": 3750, "loss": 0.8504, "lr": 2.56e-06, "epoch": 0.04, "percentage": 0.67, "elapsed_time": "0:01:46", "remaining_time": "4:23:59"}
{"current_steps": 30, "total_steps": 3750, "loss": 0.7851, "lr": 3.093333333333334e-06, "epoch": 0.048, "percentage": 0.8, "elapsed_time": "0:02:04", "remaining_time": "4:17:50"}
{"current_steps": 35, "total_steps": 3750, "loss": 0.7479, "lr": 3.6266666666666674e-06, "epoch": 0.056, "percentage": 0.93, "elapsed_time": "0:02:25", "remaining_time": "4:17:43"}
{"current_steps": 40, "total_steps": 3750, "loss": 0.745, "lr": 4.16e-06, "epoch": 0.064, "percentage": 1.07, "elapsed_time": "0:02:43", "remaining_time": "4:12:53"}
{"current_steps": 45, "total_steps": 3750, "loss": 0.6973, "lr": 4.693333333333334e-06, "epoch": 0.072, "percentage": 1.2, "elapsed_time": "0:03:04", "remaining_time": "4:13:07"}
{"current_steps": 50, "total_steps": 3750, "loss": 0.6999, "lr": 5.226666666666667e-06, "epoch": 0.08, "percentage": 1.33, "elapsed_time": "0:03:23", "remaining_time": "4:10:32"}
{"current_steps": 55, "total_steps": 3750, "loss": 0.6424, "lr": 5.76e-06, "epoch": 0.088, "percentage": 1.47, "elapsed_time": "0:03:40", "remaining_time": "4:06:53"}
{"current_steps": 60, "total_steps": 3750, "loss": 0.6522, "lr": 6.293333333333334e-06, "epoch": 0.096, "percentage": 1.6, "elapsed_time": "0:03:57", "remaining_time": "4:03:42"}
{"current_steps": 65, "total_steps": 3750, "loss": 0.642, "lr": 6.826666666666667e-06, "epoch": 0.104, "percentage": 1.73, "elapsed_time": "0:04:17", "remaining_time": "4:03:40"}
{"current_steps": 70, "total_steps": 3750, "loss": 0.6009, "lr": 7.360000000000001e-06, "epoch": 0.112, "percentage": 1.87, "elapsed_time": "0:04:36", "remaining_time": "4:02:18"}
{"current_steps": 75, "total_steps": 3750, "loss": 0.648, "lr": 7.893333333333335e-06, "epoch": 0.12, "percentage": 2.0, "elapsed_time": "0:04:54", "remaining_time": "4:00:33"}
{"current_steps": 80, "total_steps": 3750, "loss": 0.597, "lr": 8.426666666666667e-06, "epoch": 0.128, "percentage": 2.13, "elapsed_time": "0:05:11", "remaining_time": "3:58:13"}
{"current_steps": 85, "total_steps": 3750, "loss": 0.5859, "lr": 8.96e-06, "epoch": 0.136, "percentage": 2.27, "elapsed_time": "0:05:32", "remaining_time": "3:58:48"}
{"current_steps": 90, "total_steps": 3750, "loss": 0.5884, "lr": 9.493333333333334e-06, "epoch": 0.144, "percentage": 2.4, "elapsed_time": "0:05:50", "remaining_time": "3:57:19"}
{"current_steps": 95, "total_steps": 3750, "loss": 0.5942, "lr": 1.0026666666666667e-05, "epoch": 0.152, "percentage": 2.53, "elapsed_time": "0:06:10", "remaining_time": "3:57:36"}
{"current_steps": 100, "total_steps": 3750, "loss": 0.5709, "lr": 1.056e-05, "epoch": 0.16, "percentage": 2.67, "elapsed_time": "0:06:28", "remaining_time": "3:56:06"}
{"current_steps": 105, "total_steps": 3750, "loss": 0.5734, "lr": 1.1093333333333334e-05, "epoch": 0.168, "percentage": 2.8, "elapsed_time": "0:07:49", "remaining_time": "4:31:35"}
{"current_steps": 110, "total_steps": 3750, "loss": 0.5718, "lr": 1.1626666666666668e-05, "epoch": 0.176, "percentage": 2.93, "elapsed_time": "0:08:07", "remaining_time": "4:29:02"}
{"current_steps": 115, "total_steps": 3750, "loss": 0.5585, "lr": 1.216e-05, "epoch": 0.184, "percentage": 3.07, "elapsed_time": "0:08:27", "remaining_time": "4:27:17"}
{"current_steps": 120, "total_steps": 3750, "loss": 0.5403, "lr": 1.2693333333333336e-05, "epoch": 0.192, "percentage": 3.2, "elapsed_time": "0:08:46", "remaining_time": "4:25:22"}
{"current_steps": 125, "total_steps": 3750, "loss": 0.5595, "lr": 1.3226666666666668e-05, "epoch": 0.2, "percentage": 3.33, "elapsed_time": "0:09:04", "remaining_time": "4:23:22"}
{"current_steps": 130, "total_steps": 3750, "loss": 0.5393, "lr": 1.376e-05, "epoch": 0.208, "percentage": 3.47, "elapsed_time": "0:09:26", "remaining_time": "4:22:46"}
{"current_steps": 135, "total_steps": 3750, "loss": 0.558, "lr": 1.4293333333333334e-05, "epoch": 0.216, "percentage": 3.6, "elapsed_time": "0:09:46", "remaining_time": "4:21:57"}
{"current_steps": 140, "total_steps": 3750, "loss": 0.5627, "lr": 1.4826666666666666e-05, "epoch": 0.224, "percentage": 3.73, "elapsed_time": "0:10:06", "remaining_time": "4:20:31"}
{"current_steps": 145, "total_steps": 3750, "loss": 0.5543, "lr": 1.5360000000000002e-05, "epoch": 0.232, "percentage": 3.87, "elapsed_time": "0:10:25", "remaining_time": "4:19:05"}
{"current_steps": 150, "total_steps": 3750, "loss": 0.5127, "lr": 1.5893333333333333e-05, "epoch": 0.24, "percentage": 4.0, "elapsed_time": "0:10:43", "remaining_time": "4:17:20"}
{"current_steps": 155, "total_steps": 3750, "loss": 0.525, "lr": 1.642666666666667e-05, "epoch": 0.248, "percentage": 4.13, "elapsed_time": "0:11:03", "remaining_time": "4:16:30"}
{"current_steps": 160, "total_steps": 3750, "loss": 0.4991, "lr": 1.696e-05, "epoch": 0.256, "percentage": 4.27, "elapsed_time": "0:11:23", "remaining_time": "4:15:46"}
{"current_steps": 165, "total_steps": 3750, "loss": 0.5455, "lr": 1.7493333333333334e-05, "epoch": 0.264, "percentage": 4.4, "elapsed_time": "0:11:41", "remaining_time": "4:14:11"}
{"current_steps": 170, "total_steps": 3750, "loss": 0.5186, "lr": 1.8026666666666668e-05, "epoch": 0.272, "percentage": 4.53, "elapsed_time": "0:12:02", "remaining_time": "4:13:36"}
{"current_steps": 175, "total_steps": 3750, "loss": 0.5339, "lr": 1.8560000000000002e-05, "epoch": 0.28, "percentage": 4.67, "elapsed_time": "0:12:22", "remaining_time": "4:12:43"}
{"current_steps": 180, "total_steps": 3750, "loss": 0.5157, "lr": 1.9093333333333336e-05, "epoch": 0.288, "percentage": 4.8, "elapsed_time": "0:12:39", "remaining_time": "4:10:58"}
{"current_steps": 185, "total_steps": 3750, "loss": 0.493, "lr": 1.9626666666666666e-05, "epoch": 0.296, "percentage": 4.93, "elapsed_time": "0:12:57", "remaining_time": "4:09:47"}
{"current_steps": 190, "total_steps": 3750, "loss": 0.5295, "lr": 2.016e-05, "epoch": 0.304, "percentage": 5.07, "elapsed_time": "0:13:19", "remaining_time": "4:09:46"}
{"current_steps": 195, "total_steps": 3750, "loss": 0.4888, "lr": 2.0693333333333334e-05, "epoch": 0.312, "percentage": 5.2, "elapsed_time": "0:13:36", "remaining_time": "4:08:14"}
{"current_steps": 200, "total_steps": 3750, "loss": 0.5145, "lr": 2.1226666666666668e-05, "epoch": 0.32, "percentage": 5.33, "elapsed_time": "0:13:57", "remaining_time": "4:07:39"}
{"current_steps": 205, "total_steps": 3750, "loss": 0.513, "lr": 2.1760000000000002e-05, "epoch": 0.328, "percentage": 5.47, "elapsed_time": "0:15:15", "remaining_time": "4:23:58"}
{"current_steps": 210, "total_steps": 3750, "loss": 0.4933, "lr": 2.2293333333333336e-05, "epoch": 0.336, "percentage": 5.6, "elapsed_time": "0:15:32", "remaining_time": "4:21:58"}
{"current_steps": 215, "total_steps": 3750, "loss": 0.5184, "lr": 2.282666666666667e-05, "epoch": 0.344, "percentage": 5.73, "elapsed_time": "0:15:53", "remaining_time": "4:21:11"}
{"current_steps": 220, "total_steps": 3750, "loss": 0.5346, "lr": 2.336e-05, "epoch": 0.352, "percentage": 5.87, "elapsed_time": "0:16:10", "remaining_time": "4:19:31"}
{"current_steps": 225, "total_steps": 3750, "loss": 0.4984, "lr": 2.3893333333333337e-05, "epoch": 0.36, "percentage": 6.0, "elapsed_time": "0:16:31", "remaining_time": "4:18:48"}
{"current_steps": 230, "total_steps": 3750, "loss": 0.5142, "lr": 2.442666666666667e-05, "epoch": 0.368, "percentage": 6.13, "elapsed_time": "0:16:49", "remaining_time": "4:17:30"}
{"current_steps": 235, "total_steps": 3750, "loss": 0.4951, "lr": 2.496e-05, "epoch": 0.376, "percentage": 6.27, "elapsed_time": "0:17:09", "remaining_time": "4:16:34"}
{"current_steps": 240, "total_steps": 3750, "loss": 0.507, "lr": 2.5493333333333335e-05, "epoch": 0.384, "percentage": 6.4, "elapsed_time": "0:17:26", "remaining_time": "4:14:59"}
{"current_steps": 245, "total_steps": 3750, "loss": 0.5027, "lr": 2.6026666666666666e-05, "epoch": 0.392, "percentage": 6.53, "elapsed_time": "0:17:43", "remaining_time": "4:13:28"}
{"current_steps": 250, "total_steps": 3750, "loss": 0.5073, "lr": 2.6560000000000003e-05, "epoch": 0.4, "percentage": 6.67, "elapsed_time": "0:18:06", "remaining_time": "4:13:30"}
{"current_steps": 255, "total_steps": 3750, "loss": 0.5003, "lr": 2.7093333333333337e-05, "epoch": 0.408, "percentage": 6.8, "elapsed_time": "0:18:25", "remaining_time": "4:12:32"}
{"current_steps": 260, "total_steps": 3750, "loss": 0.5009, "lr": 2.7626666666666668e-05, "epoch": 0.416, "percentage": 6.93, "elapsed_time": "0:18:44", "remaining_time": "4:11:40"}
{"current_steps": 265, "total_steps": 3750, "loss": 0.4787, "lr": 2.816e-05, "epoch": 0.424, "percentage": 7.07, "elapsed_time": "0:19:02", "remaining_time": "4:10:30"}
{"current_steps": 270, "total_steps": 3750, "loss": 0.4723, "lr": 2.869333333333334e-05, "epoch": 0.432, "percentage": 7.2, "elapsed_time": "0:19:24", "remaining_time": "4:10:07"}
{"current_steps": 275, "total_steps": 3750, "loss": 0.4884, "lr": 2.922666666666667e-05, "epoch": 0.44, "percentage": 7.33, "elapsed_time": "0:19:43", "remaining_time": "4:09:17"}
{"current_steps": 280, "total_steps": 3750, "loss": 0.4814, "lr": 2.9760000000000003e-05, "epoch": 0.448, "percentage": 7.47, "elapsed_time": "0:20:03", "remaining_time": "4:08:37"}
{"current_steps": 285, "total_steps": 3750, "loss": 0.4783, "lr": 3.0293333333333334e-05, "epoch": 0.456, "percentage": 7.6, "elapsed_time": "0:20:21", "remaining_time": "4:07:29"}
{"current_steps": 290, "total_steps": 3750, "loss": 0.4755, "lr": 3.0826666666666674e-05, "epoch": 0.464, "percentage": 7.73, "elapsed_time": "0:20:40", "remaining_time": "4:06:36"}
{"current_steps": 295, "total_steps": 3750, "loss": 0.4556, "lr": 3.1360000000000005e-05, "epoch": 0.472, "percentage": 7.87, "elapsed_time": "0:21:00", "remaining_time": "4:06:05"}
{"current_steps": 300, "total_steps": 3750, "loss": 0.4587, "lr": 3.1893333333333335e-05, "epoch": 0.48, "percentage": 8.0, "elapsed_time": "0:21:18", "remaining_time": "4:04:58"}
{"current_steps": 305, "total_steps": 3750, "loss": 0.4923, "lr": 3.2426666666666666e-05, "epoch": 0.488, "percentage": 8.13, "elapsed_time": "0:22:36", "remaining_time": "4:15:23"}
{"current_steps": 310, "total_steps": 3750, "loss": 0.4641, "lr": 3.296e-05, "epoch": 0.496, "percentage": 8.27, "elapsed_time": "0:22:59", "remaining_time": "4:15:10"}
{"current_steps": 315, "total_steps": 3750, "loss": 0.5024, "lr": 3.349333333333334e-05, "epoch": 0.504, "percentage": 8.4, "elapsed_time": "0:23:18", "remaining_time": "4:14:06"}
{"current_steps": 320, "total_steps": 3750, "loss": 0.478, "lr": 3.402666666666667e-05, "epoch": 0.512, "percentage": 8.53, "elapsed_time": "0:23:34", "remaining_time": "4:12:46"}
{"current_steps": 325, "total_steps": 3750, "loss": 0.4812, "lr": 3.456e-05, "epoch": 0.52, "percentage": 8.67, "elapsed_time": "0:23:54", "remaining_time": "4:11:54"}
{"current_steps": 330, "total_steps": 3750, "loss": 0.4896, "lr": 3.509333333333333e-05, "epoch": 0.528, "percentage": 8.8, "elapsed_time": "0:24:12", "remaining_time": "4:10:55"}
{"current_steps": 335, "total_steps": 3750, "loss": 0.4803, "lr": 3.562666666666667e-05, "epoch": 0.536, "percentage": 8.93, "elapsed_time": "0:24:29", "remaining_time": "4:09:36"}
{"current_steps": 340, "total_steps": 3750, "loss": 0.4832, "lr": 3.6160000000000006e-05, "epoch": 0.544, "percentage": 9.07, "elapsed_time": "0:24:48", "remaining_time": "4:08:44"}
{"current_steps": 345, "total_steps": 3750, "loss": 0.4781, "lr": 3.669333333333334e-05, "epoch": 0.552, "percentage": 9.2, "elapsed_time": "0:25:08", "remaining_time": "4:08:06"}
{"current_steps": 350, "total_steps": 3750, "loss": 0.4677, "lr": 3.722666666666667e-05, "epoch": 0.56, "percentage": 9.33, "elapsed_time": "0:25:25", "remaining_time": "4:06:58"}
{"current_steps": 355, "total_steps": 3750, "loss": 0.5033, "lr": 3.7760000000000004e-05, "epoch": 0.568, "percentage": 9.47, "elapsed_time": "0:25:45", "remaining_time": "4:06:21"}
{"current_steps": 360, "total_steps": 3750, "loss": 0.456, "lr": 3.8293333333333335e-05, "epoch": 0.576, "percentage": 9.6, "elapsed_time": "0:26:04", "remaining_time": "4:05:34"}
{"current_steps": 365, "total_steps": 3750, "loss": 0.4611, "lr": 3.882666666666667e-05, "epoch": 0.584, "percentage": 9.73, "elapsed_time": "0:26:22", "remaining_time": "4:04:34"}
{"current_steps": 370, "total_steps": 3750, "loss": 0.4931, "lr": 3.936e-05, "epoch": 0.592, "percentage": 9.87, "elapsed_time": "0:26:39", "remaining_time": "4:03:31"}
{"current_steps": 375, "total_steps": 3750, "loss": 0.4682, "lr": 3.989333333333333e-05, "epoch": 0.6, "percentage": 10.0, "elapsed_time": "0:26:59", "remaining_time": "4:02:55"}
{"current_steps": 380, "total_steps": 3750, "loss": 0.4802, "lr": 3.9999861365387784e-05, "epoch": 0.608, "percentage": 10.13, "elapsed_time": "0:27:17", "remaining_time": "4:02:01"}
{"current_steps": 385, "total_steps": 3750, "loss": 0.4611, "lr": 3.9999298165569614e-05, "epoch": 0.616, "percentage": 10.27, "elapsed_time": "0:27:36", "remaining_time": "4:01:17"}
{"current_steps": 390, "total_steps": 3750, "loss": 0.453, "lr": 3.999830174807269e-05, "epoch": 0.624, "percentage": 10.4, "elapsed_time": "0:27:53", "remaining_time": "4:00:21"}
{"current_steps": 395, "total_steps": 3750, "loss": 0.4651, "lr": 3.9996872134481036e-05, "epoch": 0.632, "percentage": 10.53, "elapsed_time": "0:28:13", "remaining_time": "3:59:47"}
{"current_steps": 400, "total_steps": 3750, "loss": 0.4813, "lr": 3.999500935576245e-05, "epoch": 0.64, "percentage": 10.67, "elapsed_time": "0:28:33", "remaining_time": "3:59:08"}
{"current_steps": 405, "total_steps": 3750, "loss": 0.447, "lr": 3.999271345226776e-05, "epoch": 0.648, "percentage": 10.8, "elapsed_time": "0:30:22", "remaining_time": "4:10:54"}
{"current_steps": 410, "total_steps": 3750, "loss": 0.465, "lr": 3.9989984473730035e-05, "epoch": 0.656, "percentage": 10.93, "elapsed_time": "0:30:40", "remaining_time": "4:09:52"}
{"current_steps": 415, "total_steps": 3750, "loss": 0.4608, "lr": 3.998682247926343e-05, "epoch": 0.664, "percentage": 11.07, "elapsed_time": "0:30:59", "remaining_time": "4:09:05"}
{"current_steps": 420, "total_steps": 3750, "loss": 0.4713, "lr": 3.998322753736193e-05, "epoch": 0.672, "percentage": 11.2, "elapsed_time": "0:31:18", "remaining_time": "4:08:10"}
{"current_steps": 425, "total_steps": 3750, "loss": 0.4667, "lr": 3.99791997258979e-05, "epoch": 0.68, "percentage": 11.33, "elapsed_time": "0:31:35", "remaining_time": "4:07:10"}
{"current_steps": 430, "total_steps": 3750, "loss": 0.4629, "lr": 3.997473913212036e-05, "epoch": 0.688, "percentage": 11.47, "elapsed_time": "0:31:52", "remaining_time": "4:06:02"}
{"current_steps": 435, "total_steps": 3750, "loss": 0.438, "lr": 3.9969845852653087e-05, "epoch": 0.696, "percentage": 11.6, "elapsed_time": "0:32:10", "remaining_time": "4:05:08"}
{"current_steps": 440, "total_steps": 3750, "loss": 0.4649, "lr": 3.996451999349258e-05, "epoch": 0.704, "percentage": 11.73, "elapsed_time": "0:32:29", "remaining_time": "4:04:26"}
{"current_steps": 445, "total_steps": 3750, "loss": 0.4647, "lr": 3.995876167000569e-05, "epoch": 0.712, "percentage": 11.87, "elapsed_time": "0:32:46", "remaining_time": "4:03:26"}
{"current_steps": 450, "total_steps": 3750, "loss": 0.4622, "lr": 3.9952571006927186e-05, "epoch": 0.72, "percentage": 12.0, "elapsed_time": "0:33:07", "remaining_time": "4:02:55"}
{"current_steps": 455, "total_steps": 3750, "loss": 0.4376, "lr": 3.9945948138356995e-05, "epoch": 0.728, "percentage": 12.13, "elapsed_time": "0:33:27", "remaining_time": "4:02:17"}
{"current_steps": 460, "total_steps": 3750, "loss": 0.4465, "lr": 3.993889320775735e-05, "epoch": 0.736, "percentage": 12.27, "elapsed_time": "0:33:46", "remaining_time": "4:01:31"}
{"current_steps": 465, "total_steps": 3750, "loss": 0.4671, "lr": 3.9931406367949627e-05, "epoch": 0.744, "percentage": 12.4, "elapsed_time": "0:34:03", "remaining_time": "4:00:37"}
{"current_steps": 470, "total_steps": 3750, "loss": 0.4427, "lr": 3.9923487781111106e-05, "epoch": 0.752, "percentage": 12.53, "elapsed_time": "0:34:21", "remaining_time": "3:59:45"}
{"current_steps": 475, "total_steps": 3750, "loss": 0.4447, "lr": 3.9915137618771386e-05, "epoch": 0.76, "percentage": 12.67, "elapsed_time": "0:34:40", "remaining_time": "3:59:01"}
{"current_steps": 480, "total_steps": 3750, "loss": 0.4576, "lr": 3.9906356061808713e-05, "epoch": 0.768, "percentage": 12.8, "elapsed_time": "0:35:00", "remaining_time": "3:58:28"}
{"current_steps": 485, "total_steps": 3750, "loss": 0.4296, "lr": 3.9897143300446055e-05, "epoch": 0.776, "percentage": 12.93, "elapsed_time": "0:35:16", "remaining_time": "3:57:30"}
{"current_steps": 490, "total_steps": 3750, "loss": 0.4855, "lr": 3.988749953424696e-05, "epoch": 0.784, "percentage": 13.07, "elapsed_time": "0:35:34", "remaining_time": "3:56:39"}
{"current_steps": 495, "total_steps": 3750, "loss": 0.4606, "lr": 3.9877424972111264e-05, "epoch": 0.792, "percentage": 13.2, "elapsed_time": "0:35:51", "remaining_time": "3:55:50"}
{"current_steps": 500, "total_steps": 3750, "loss": 0.4389, "lr": 3.9866919832270554e-05, "epoch": 0.8, "percentage": 13.33, "elapsed_time": "0:36:12", "remaining_time": "3:55:18"}
{"current_steps": 505, "total_steps": 3750, "loss": 0.4553, "lr": 3.9855984342283414e-05, "epoch": 0.808, "percentage": 13.47, "elapsed_time": "0:37:37", "remaining_time": "4:01:46"}
{"current_steps": 510, "total_steps": 3750, "loss": 0.4498, "lr": 3.9844618739030545e-05, "epoch": 0.816, "percentage": 13.6, "elapsed_time": "0:37:55", "remaining_time": "4:00:58"}
{"current_steps": 515, "total_steps": 3750, "loss": 0.4407, "lr": 3.98328232687096e-05, "epoch": 0.824, "percentage": 13.73, "elapsed_time": "0:38:15", "remaining_time": "4:00:19"}
{"current_steps": 520, "total_steps": 3750, "loss": 0.4672, "lr": 3.982059818682986e-05, "epoch": 0.832, "percentage": 13.87, "elapsed_time": "0:38:33", "remaining_time": "3:59:27"}
{"current_steps": 525, "total_steps": 3750, "loss": 0.4906, "lr": 3.980794375820669e-05, "epoch": 0.84, "percentage": 14.0, "elapsed_time": "0:38:53", "remaining_time": "3:58:52"}
{"current_steps": 530, "total_steps": 3750, "loss": 0.4589, "lr": 3.9794860256955825e-05, "epoch": 0.848, "percentage": 14.13, "elapsed_time": "0:39:11", "remaining_time": "3:58:08"}
{"current_steps": 535, "total_steps": 3750, "loss": 0.4511, "lr": 3.9781347966487415e-05, "epoch": 0.856, "percentage": 14.27, "elapsed_time": "0:39:30", "remaining_time": "3:57:27"}
{"current_steps": 540, "total_steps": 3750, "loss": 0.4564, "lr": 3.9767407179499875e-05, "epoch": 0.864, "percentage": 14.4, "elapsed_time": "0:39:52", "remaining_time": "3:57:01"}
{"current_steps": 545, "total_steps": 3750, "loss": 0.4817, "lr": 3.975303819797358e-05, "epoch": 0.872, "percentage": 14.53, "elapsed_time": "0:40:08", "remaining_time": "3:56:04"}
{"current_steps": 550, "total_steps": 3750, "loss": 0.4573, "lr": 3.973824133316431e-05, "epoch": 0.88, "percentage": 14.67, "elapsed_time": "0:40:28", "remaining_time": "3:55:27"}
{"current_steps": 555, "total_steps": 3750, "loss": 0.4233, "lr": 3.972301690559645e-05, "epoch": 0.888, "percentage": 14.8, "elapsed_time": "0:40:47", "remaining_time": "3:54:50"}
{"current_steps": 560, "total_steps": 3750, "loss": 0.469, "lr": 3.970736524505615e-05, "epoch": 0.896, "percentage": 14.93, "elapsed_time": "0:41:04", "remaining_time": "3:53:56"}
{"current_steps": 565, "total_steps": 3750, "loss": 0.4386, "lr": 3.969128669058411e-05, "epoch": 0.904, "percentage": 15.07, "elapsed_time": "0:41:21", "remaining_time": "3:53:10"}
{"current_steps": 570, "total_steps": 3750, "loss": 0.4482, "lr": 3.9674781590468256e-05, "epoch": 0.912, "percentage": 15.2, "elapsed_time": "0:41:38", "remaining_time": "3:52:21"}
{"current_steps": 575, "total_steps": 3750, "loss": 0.4669, "lr": 3.9657850302236184e-05, "epoch": 0.92, "percentage": 15.33, "elapsed_time": "0:41:58", "remaining_time": "3:51:44"}
{"current_steps": 580, "total_steps": 3750, "loss": 0.4478, "lr": 3.964049319264744e-05, "epoch": 0.928, "percentage": 15.47, "elapsed_time": "0:42:17", "remaining_time": "3:51:06"}
{"current_steps": 585, "total_steps": 3750, "loss": 0.4738, "lr": 3.962271063768555e-05, "epoch": 0.936, "percentage": 15.6, "elapsed_time": "0:42:34", "remaining_time": "3:50:19"}
{"current_steps": 590, "total_steps": 3750, "loss": 0.4728, "lr": 3.960450302254989e-05, "epoch": 0.944, "percentage": 15.73, "elapsed_time": "0:42:53", "remaining_time": "3:49:45"}
{"current_steps": 595, "total_steps": 3750, "loss": 0.4272, "lr": 3.958587074164735e-05, "epoch": 0.952, "percentage": 15.87, "elapsed_time": "0:43:15", "remaining_time": "3:49:22"}
{"current_steps": 600, "total_steps": 3750, "loss": 0.4518, "lr": 3.956681419858376e-05, "epoch": 0.96, "percentage": 16.0, "elapsed_time": "0:43:34", "remaining_time": "3:48:45"}
{"current_steps": 605, "total_steps": 3750, "loss": 0.4495, "lr": 3.954733380615516e-05, "epoch": 0.968, "percentage": 16.13, "elapsed_time": "0:44:56", "remaining_time": "3:53:35"}
{"current_steps": 610, "total_steps": 3750, "loss": 0.4462, "lr": 3.95274299863389e-05, "epoch": 0.976, "percentage": 16.27, "elapsed_time": "0:45:13", "remaining_time": "3:52:48"}
{"current_steps": 615, "total_steps": 3750, "loss": 0.4395, "lr": 3.950710317028443e-05, "epoch": 0.984, "percentage": 16.4, "elapsed_time": "0:45:32", "remaining_time": "3:52:08"}
{"current_steps": 620, "total_steps": 3750, "loss": 0.4426, "lr": 3.9486353798303996e-05, "epoch": 0.992, "percentage": 16.53, "elapsed_time": "0:45:49", "remaining_time": "3:51:20"}
{"current_steps": 625, "total_steps": 3750, "loss": 0.4313, "lr": 3.946518231986313e-05, "epoch": 1.0, "percentage": 16.67, "elapsed_time": "0:46:06", "remaining_time": "3:50:33"}
{"current_steps": 630, "total_steps": 3750, "loss": 0.4267, "lr": 3.9443589193570847e-05, "epoch": 1.008, "percentage": 16.8, "elapsed_time": "0:46:26", "remaining_time": "3:49:58"}
{"current_steps": 635, "total_steps": 3750, "loss": 0.4356, "lr": 3.942157488716976e-05, "epoch": 1.016, "percentage": 16.93, "elapsed_time": "0:46:43", "remaining_time": "3:49:10"}
{"current_steps": 640, "total_steps": 3750, "loss": 0.4312, "lr": 3.939913987752595e-05, "epoch": 1.024, "percentage": 17.07, "elapsed_time": "0:47:02", "remaining_time": "3:48:37"}
{"current_steps": 645, "total_steps": 3750, "loss": 0.4078, "lr": 3.9376284650618605e-05, "epoch": 1.032, "percentage": 17.2, "elapsed_time": "0:47:24", "remaining_time": "3:48:11"}
{"current_steps": 650, "total_steps": 3750, "loss": 0.4466, "lr": 3.935300970152952e-05, "epoch": 1.04, "percentage": 17.33, "elapsed_time": "0:47:43", "remaining_time": "3:47:34"}
{"current_steps": 655, "total_steps": 3750, "loss": 0.4039, "lr": 3.932931553443235e-05, "epoch": 1.048, "percentage": 17.47, "elapsed_time": "0:48:03", "remaining_time": "3:47:06"}
{"current_steps": 660, "total_steps": 3750, "loss": 0.4354, "lr": 3.930520266258173e-05, "epoch": 1.056, "percentage": 17.6, "elapsed_time": "0:48:20", "remaining_time": "3:46:18"}
{"current_steps": 665, "total_steps": 3750, "loss": 0.4201, "lr": 3.928067160830208e-05, "epoch": 1.064, "percentage": 17.73, "elapsed_time": "0:48:38", "remaining_time": "3:45:39"}
{"current_steps": 670, "total_steps": 3750, "loss": 0.4307, "lr": 3.925572290297638e-05, "epoch": 1.072, "percentage": 17.87, "elapsed_time": "0:48:54", "remaining_time": "3:44:52"}
{"current_steps": 675, "total_steps": 3750, "loss": 0.4386, "lr": 3.9230357087034606e-05, "epoch": 1.08, "percentage": 18.0, "elapsed_time": "0:49:13", "remaining_time": "3:44:13"}
{"current_steps": 680, "total_steps": 3750, "loss": 0.4459, "lr": 3.9204574709942036e-05, "epoch": 1.088, "percentage": 18.13, "elapsed_time": "0:49:31", "remaining_time": "3:43:33"}
{"current_steps": 685, "total_steps": 3750, "loss": 0.4074, "lr": 3.917837633018734e-05, "epoch": 1.096, "percentage": 18.27, "elapsed_time": "0:49:48", "remaining_time": "3:42:52"}
{"current_steps": 690, "total_steps": 3750, "loss": 0.4103, "lr": 3.915176251527051e-05, "epoch": 1.104, "percentage": 18.4, "elapsed_time": "0:50:05", "remaining_time": "3:42:07"}
{"current_steps": 695, "total_steps": 3750, "loss": 0.437, "lr": 3.912473384169051e-05, "epoch": 1.112, "percentage": 18.53, "elapsed_time": "0:50:26", "remaining_time": "3:41:42"}
{"current_steps": 700, "total_steps": 3750, "loss": 0.4364, "lr": 3.9097290894932866e-05, "epoch": 1.12, "percentage": 18.67, "elapsed_time": "0:50:45", "remaining_time": "3:41:07"}
{"current_steps": 705, "total_steps": 3750, "loss": 0.4298, "lr": 3.906943426945691e-05, "epoch": 1.1280000000000001, "percentage": 18.8, "elapsed_time": "0:52:05", "remaining_time": "3:44:59"}
{"current_steps": 710, "total_steps": 3750, "loss": 0.4132, "lr": 3.9041164568682955e-05, "epoch": 1.1360000000000001, "percentage": 18.93, "elapsed_time": "0:52:23", "remaining_time": "3:44:19"}
{"current_steps": 715, "total_steps": 3750, "loss": 0.4238, "lr": 3.90124824049792e-05, "epoch": 1.144, "percentage": 19.07, "elapsed_time": "0:52:44", "remaining_time": "3:43:50"}
{"current_steps": 720, "total_steps": 3750, "loss": 0.4144, "lr": 3.8983388399648465e-05, "epoch": 1.152, "percentage": 19.2, "elapsed_time": "0:53:04", "remaining_time": "3:43:22"}
{"current_steps": 725, "total_steps": 3750, "loss": 0.4284, "lr": 3.895388318291474e-05, "epoch": 1.16, "percentage": 19.33, "elapsed_time": "0:53:25", "remaining_time": "3:42:52"}
{"current_steps": 730, "total_steps": 3750, "loss": 0.4444, "lr": 3.892396739390952e-05, "epoch": 1.168, "percentage": 19.47, "elapsed_time": "0:53:42", "remaining_time": "3:42:13"}
{"current_steps": 735, "total_steps": 3750, "loss": 0.4488, "lr": 3.8893641680657986e-05, "epoch": 1.176, "percentage": 19.6, "elapsed_time": "0:54:00", "remaining_time": "3:41:32"}
{"current_steps": 740, "total_steps": 3750, "loss": 0.4557, "lr": 3.886290670006495e-05, "epoch": 1.184, "percentage": 19.73, "elapsed_time": "0:54:18", "remaining_time": "3:40:52"}
{"current_steps": 745, "total_steps": 3750, "loss": 0.4129, "lr": 3.8831763117900605e-05, "epoch": 1.192, "percentage": 19.87, "elapsed_time": "0:54:38", "remaining_time": "3:40:22"}
{"current_steps": 750, "total_steps": 3750, "loss": 0.4323, "lr": 3.8800211608786166e-05, "epoch": 1.2, "percentage": 20.0, "elapsed_time": "0:54:58", "remaining_time": "3:39:54"}
{"current_steps": 755, "total_steps": 3750, "loss": 0.4264, "lr": 3.876825285617918e-05, "epoch": 1.208, "percentage": 20.13, "elapsed_time": "0:55:14", "remaining_time": "3:39:07"}
{"current_steps": 760, "total_steps": 3750, "loss": 0.4226, "lr": 3.873588755235876e-05, "epoch": 1.216, "percentage": 20.27, "elapsed_time": "0:55:32", "remaining_time": "3:38:31"}
{"current_steps": 765, "total_steps": 3750, "loss": 0.425, "lr": 3.870311639841062e-05, "epoch": 1.224, "percentage": 20.4, "elapsed_time": "0:55:50", "remaining_time": "3:37:52"}
{"current_steps": 770, "total_steps": 3750, "loss": 0.3936, "lr": 3.866994010421182e-05, "epoch": 1.232, "percentage": 20.53, "elapsed_time": "0:56:08", "remaining_time": "3:37:15"}
{"current_steps": 775, "total_steps": 3750, "loss": 0.4329, "lr": 3.863635938841545e-05, "epoch": 1.24, "percentage": 20.67, "elapsed_time": "0:56:23", "remaining_time": "3:36:28"}
{"current_steps": 780, "total_steps": 3750, "loss": 0.4064, "lr": 3.8602374978435015e-05, "epoch": 1.248, "percentage": 20.8, "elapsed_time": "0:56:42", "remaining_time": "3:35:56"}
{"current_steps": 785, "total_steps": 3750, "loss": 0.4317, "lr": 3.8567987610428705e-05, "epoch": 1.256, "percentage": 20.93, "elapsed_time": "0:57:01", "remaining_time": "3:35:24"}
{"current_steps": 790, "total_steps": 3750, "loss": 0.4159, "lr": 3.853319802928345e-05, "epoch": 1.264, "percentage": 21.07, "elapsed_time": "0:57:19", "remaining_time": "3:34:48"}
{"current_steps": 795, "total_steps": 3750, "loss": 0.4236, "lr": 3.849800698859877e-05, "epoch": 1.272, "percentage": 21.2, "elapsed_time": "0:57:37", "remaining_time": "3:34:11"}
{"current_steps": 800, "total_steps": 3750, "loss": 0.4472, "lr": 3.846241525067047e-05, "epoch": 1.28, "percentage": 21.33, "elapsed_time": "0:57:59", "remaining_time": "3:33:49"}
{"current_steps": 805, "total_steps": 3750, "loss": 0.4305, "lr": 3.842642358647411e-05, "epoch": 1.288, "percentage": 21.47, "elapsed_time": "0:59:39", "remaining_time": "3:38:14"}
{"current_steps": 810, "total_steps": 3750, "loss": 0.4223, "lr": 3.839003277564831e-05, "epoch": 1.296, "percentage": 21.6, "elapsed_time": "0:59:58", "remaining_time": "3:37:41"}
{"current_steps": 815, "total_steps": 3750, "loss": 0.4367, "lr": 3.835324360647785e-05, "epoch": 1.304, "percentage": 21.73, "elapsed_time": "1:00:19", "remaining_time": "3:37:14"}
{"current_steps": 820, "total_steps": 3750, "loss": 0.4178, "lr": 3.831605687587663e-05, "epoch": 1.312, "percentage": 21.87, "elapsed_time": "1:00:39", "remaining_time": "3:36:43"}
{"current_steps": 825, "total_steps": 3750, "loss": 0.4089, "lr": 3.827847338937037e-05, "epoch": 1.32, "percentage": 22.0, "elapsed_time": "1:00:58", "remaining_time": "3:36:11"}
{"current_steps": 830, "total_steps": 3750, "loss": 0.4286, "lr": 3.824049396107918e-05, "epoch": 1.328, "percentage": 22.13, "elapsed_time": "1:01:16", "remaining_time": "3:35:33"}
{"current_steps": 835, "total_steps": 3750, "loss": 0.4402, "lr": 3.8202119413699914e-05, "epoch": 1.336, "percentage": 22.27, "elapsed_time": "1:01:34", "remaining_time": "3:34:56"}
{"current_steps": 840, "total_steps": 3750, "loss": 0.4249, "lr": 3.8163350578488366e-05, "epoch": 1.3439999999999999, "percentage": 22.4, "elapsed_time": "1:01:53", "remaining_time": "3:34:25"}
{"current_steps": 845, "total_steps": 3750, "loss": 0.4233, "lr": 3.812418829524124e-05, "epoch": 1.3519999999999999, "percentage": 22.53, "elapsed_time": "1:02:10", "remaining_time": "3:33:45"}
{"current_steps": 850, "total_steps": 3750, "loss": 0.4138, "lr": 3.8084633412277974e-05, "epoch": 1.3599999999999999, "percentage": 22.67, "elapsed_time": "1:02:31", "remaining_time": "3:33:17"}
{"current_steps": 855, "total_steps": 3750, "loss": 0.4314, "lr": 3.804468678642238e-05, "epoch": 1.3679999999999999, "percentage": 22.8, "elapsed_time": "1:02:50", "remaining_time": "3:32:47"}
{"current_steps": 860, "total_steps": 3750, "loss": 0.4396, "lr": 3.800434928298403e-05, "epoch": 1.376, "percentage": 22.93, "elapsed_time": "1:03:08", "remaining_time": "3:32:09"}
{"current_steps": 865, "total_steps": 3750, "loss": 0.4144, "lr": 3.796362177573957e-05, "epoch": 1.384, "percentage": 23.07, "elapsed_time": "1:03:26", "remaining_time": "3:31:36"}
{"current_steps": 870, "total_steps": 3750, "loss": 0.4343, "lr": 3.792250514691378e-05, "epoch": 1.392, "percentage": 23.2, "elapsed_time": "1:03:44", "remaining_time": "3:30:58"}
{"current_steps": 875, "total_steps": 3750, "loss": 0.4197, "lr": 3.788100028716043e-05, "epoch": 1.4, "percentage": 23.33, "elapsed_time": "1:03:59", "remaining_time": "3:30:16"}
{"current_steps": 880, "total_steps": 3750, "loss": 0.4042, "lr": 3.7839108095543016e-05, "epoch": 1.408, "percentage": 23.47, "elapsed_time": "1:04:21", "remaining_time": "3:29:55"}
{"current_steps": 885, "total_steps": 3750, "loss": 0.4249, "lr": 3.7796829479515295e-05, "epoch": 1.416, "percentage": 23.6, "elapsed_time": "1:04:39", "remaining_time": "3:29:20"}
{"current_steps": 890, "total_steps": 3750, "loss": 0.4176, "lr": 3.775416535490159e-05, "epoch": 1.424, "percentage": 23.73, "elapsed_time": "1:04:57", "remaining_time": "3:28:44"}
{"current_steps": 895, "total_steps": 3750, "loss": 0.4324, "lr": 3.7711116645876984e-05, "epoch": 1.432, "percentage": 23.87, "elapsed_time": "1:05:14", "remaining_time": "3:28:06"}
{"current_steps": 900, "total_steps": 3750, "loss": 0.442, "lr": 3.7667684284947286e-05, "epoch": 1.44, "percentage": 24.0, "elapsed_time": "1:05:32", "remaining_time": "3:27:32"}
{"current_steps": 905, "total_steps": 3750, "loss": 0.4223, "lr": 3.762386921292885e-05, "epoch": 1.448, "percentage": 24.13, "elapsed_time": "1:06:54", "remaining_time": "3:30:20"}
{"current_steps": 910, "total_steps": 3750, "loss": 0.4432, "lr": 3.757967237892818e-05, "epoch": 1.456, "percentage": 24.27, "elapsed_time": "1:07:11", "remaining_time": "3:29:42"}
{"current_steps": 915, "total_steps": 3750, "loss": 0.413, "lr": 3.7535094740321334e-05, "epoch": 1.464, "percentage": 24.4, "elapsed_time": "1:07:31", "remaining_time": "3:29:13"}
{"current_steps": 920, "total_steps": 3750, "loss": 0.4072, "lr": 3.749013726273328e-05, "epoch": 1.472, "percentage": 24.53, "elapsed_time": "1:07:50", "remaining_time": "3:28:41"}
{"current_steps": 925, "total_steps": 3750, "loss": 0.4291, "lr": 3.7444800920016875e-05, "epoch": 1.48, "percentage": 24.67, "elapsed_time": "1:08:08", "remaining_time": "3:28:05"}
{"current_steps": 930, "total_steps": 3750, "loss": 0.4443, "lr": 3.7399086694231864e-05, "epoch": 1.488, "percentage": 24.8, "elapsed_time": "1:08:24", "remaining_time": "3:27:24"}
{"current_steps": 935, "total_steps": 3750, "loss": 0.4347, "lr": 3.735299557562352e-05, "epoch": 1.496, "percentage": 24.93, "elapsed_time": "1:08:41", "remaining_time": "3:26:47"}
{"current_steps": 940, "total_steps": 3750, "loss": 0.431, "lr": 3.7306528562601245e-05, "epoch": 1.504, "percentage": 25.07, "elapsed_time": "1:09:00", "remaining_time": "3:26:18"}
{"current_steps": 945, "total_steps": 3750, "loss": 0.418, "lr": 3.7259686661716945e-05, "epoch": 1.512, "percentage": 25.2, "elapsed_time": "1:09:21", "remaining_time": "3:25:52"}
{"current_steps": 950, "total_steps": 3750, "loss": 0.4183, "lr": 3.7212470887643204e-05, "epoch": 1.52, "percentage": 25.33, "elapsed_time": "1:09:39", "remaining_time": "3:25:19"}
{"current_steps": 955, "total_steps": 3750, "loss": 0.4253, "lr": 3.7164882263151315e-05, "epoch": 1.528, "percentage": 25.47, "elapsed_time": "1:09:59", "remaining_time": "3:24:50"}
{"current_steps": 960, "total_steps": 3750, "loss": 0.4123, "lr": 3.711692181908913e-05, "epoch": 1.536, "percentage": 25.6, "elapsed_time": "1:10:19", "remaining_time": "3:24:23"}
{"current_steps": 965, "total_steps": 3750, "loss": 0.4208, "lr": 3.706859059435871e-05, "epoch": 1.544, "percentage": 25.73, "elapsed_time": "1:10:36", "remaining_time": "3:23:46"}
{"current_steps": 970, "total_steps": 3750, "loss": 0.4212, "lr": 3.701988963589384e-05, "epoch": 1.552, "percentage": 25.87, "elapsed_time": "1:10:58", "remaining_time": "3:23:24"}
{"current_steps": 975, "total_steps": 3750, "loss": 0.417, "lr": 3.697081999863736e-05, "epoch": 1.56, "percentage": 26.0, "elapsed_time": "1:11:16", "remaining_time": "3:22:52"}
{"current_steps": 980, "total_steps": 3750, "loss": 0.4363, "lr": 3.692138274551828e-05, "epoch": 1.568, "percentage": 26.13, "elapsed_time": "1:11:32", "remaining_time": "3:22:12"}
{"current_steps": 985, "total_steps": 3750, "loss": 0.4273, "lr": 3.687157894742878e-05, "epoch": 1.576, "percentage": 26.27, "elapsed_time": "1:11:49", "remaining_time": "3:21:37"}
{"current_steps": 990, "total_steps": 3750, "loss": 0.4393, "lr": 3.682140968320101e-05, "epoch": 1.584, "percentage": 26.4, "elapsed_time": "1:12:07", "remaining_time": "3:21:04"}
{"current_steps": 995, "total_steps": 3750, "loss": 0.4057, "lr": 3.6770876039583725e-05, "epoch": 1.592, "percentage": 26.53, "elapsed_time": "1:12:24", "remaining_time": "3:20:29"}
{"current_steps": 1000, "total_steps": 3750, "loss": 0.4331, "lr": 3.671997911121871e-05, "epoch": 1.6, "percentage": 26.67, "elapsed_time": "1:12:42", "remaining_time": "3:19:56"}
{"current_steps": 1005, "total_steps": 3750, "loss": 0.4163, "lr": 3.6668720000617126e-05, "epoch": 1.608, "percentage": 26.8, "elapsed_time": "1:14:04", "remaining_time": "3:22:19"}
{"current_steps": 1010, "total_steps": 3750, "loss": 0.4091, "lr": 3.661709981813558e-05, "epoch": 1.616, "percentage": 26.93, "elapsed_time": "1:14:22", "remaining_time": "3:21:45"}
{"current_steps": 1015, "total_steps": 3750, "loss": 0.4115, "lr": 3.6565119681952086e-05, "epoch": 1.624, "percentage": 27.07, "elapsed_time": "1:14:40", "remaining_time": "3:21:14"}
{"current_steps": 1020, "total_steps": 3750, "loss": 0.426, "lr": 3.651278071804186e-05, "epoch": 1.6320000000000001, "percentage": 27.2, "elapsed_time": "1:14:59", "remaining_time": "3:20:41"}
{"current_steps": 1025, "total_steps": 3750, "loss": 0.4076, "lr": 3.646008406015291e-05, "epoch": 1.6400000000000001, "percentage": 27.33, "elapsed_time": "1:15:16", "remaining_time": "3:20:07"}
{"current_steps": 1030, "total_steps": 3750, "loss": 0.4079, "lr": 3.6407030849781475e-05, "epoch": 1.6480000000000001, "percentage": 27.47, "elapsed_time": "1:15:36", "remaining_time": "3:19:39"}
{"current_steps": 1035, "total_steps": 3750, "loss": 0.4277, "lr": 3.635362223614733e-05, "epoch": 1.6560000000000001, "percentage": 27.6, "elapsed_time": "1:15:54", "remaining_time": "3:19:06"}
{"current_steps": 1040, "total_steps": 3750, "loss": 0.4062, "lr": 3.629985937616884e-05, "epoch": 1.6640000000000001, "percentage": 27.73, "elapsed_time": "1:16:14", "remaining_time": "3:18:39"}
{"current_steps": 1045, "total_steps": 3750, "loss": 0.4154, "lr": 3.624574343443794e-05, "epoch": 1.6720000000000002, "percentage": 27.87, "elapsed_time": "1:16:34", "remaining_time": "3:18:13"}
{"current_steps": 1050, "total_steps": 3750, "loss": 0.4129, "lr": 3.619127558319492e-05, "epoch": 1.6800000000000002, "percentage": 28.0, "elapsed_time": "1:16:54", "remaining_time": "3:17:46"}
{"current_steps": 1055, "total_steps": 3750, "loss": 0.4175, "lr": 3.613645700230298e-05, "epoch": 1.688, "percentage": 28.13, "elapsed_time": "1:17:14", "remaining_time": "3:17:20"}
{"current_steps": 1060, "total_steps": 3750, "loss": 0.4075, "lr": 3.6081288879222696e-05, "epoch": 1.696, "percentage": 28.27, "elapsed_time": "1:17:35", "remaining_time": "3:16:55"}
{"current_steps": 1065, "total_steps": 3750, "loss": 0.4266, "lr": 3.602577240898633e-05, "epoch": 1.704, "percentage": 28.4, "elapsed_time": "1:17:53", "remaining_time": "3:16:21"}
{"current_steps": 1070, "total_steps": 3750, "loss": 0.4275, "lr": 3.596990879417188e-05, "epoch": 1.712, "percentage": 28.53, "elapsed_time": "1:18:10", "remaining_time": "3:15:49"}
{"current_steps": 1075, "total_steps": 3750, "loss": 0.4191, "lr": 3.591369924487711e-05, "epoch": 1.72, "percentage": 28.67, "elapsed_time": "1:18:29", "remaining_time": "3:15:20"}
{"current_steps": 1080, "total_steps": 3750, "loss": 0.4186, "lr": 3.585714497869326e-05, "epoch": 1.728, "percentage": 28.8, "elapsed_time": "1:18:46", "remaining_time": "3:14:46"}
{"current_steps": 1085, "total_steps": 3750, "loss": 0.4016, "lr": 3.580024722067872e-05, "epoch": 1.736, "percentage": 28.93, "elapsed_time": "1:19:08", "remaining_time": "3:14:22"}
{"current_steps": 1090, "total_steps": 3750, "loss": 0.4287, "lr": 3.574300720333247e-05, "epoch": 1.744, "percentage": 29.07, "elapsed_time": "1:19:23", "remaining_time": "3:13:44"}
{"current_steps": 1095, "total_steps": 3750, "loss": 0.4114, "lr": 3.568542616656739e-05, "epoch": 1.752, "percentage": 29.2, "elapsed_time": "1:19:41", "remaining_time": "3:13:14"}
{"current_steps": 1100, "total_steps": 3750, "loss": 0.4288, "lr": 3.5627505357683404e-05, "epoch": 1.76, "percentage": 29.33, "elapsed_time": "1:20:01", "remaining_time": "3:12:47"}
{"current_steps": 1105, "total_steps": 3750, "loss": 0.4194, "lr": 3.5569246031340474e-05, "epoch": 1.768, "percentage": 29.47, "elapsed_time": "1:21:23", "remaining_time": "3:14:49"}
{"current_steps": 1110, "total_steps": 3750, "loss": 0.4129, "lr": 3.5510649449531375e-05, "epoch": 1.776, "percentage": 29.6, "elapsed_time": "1:21:43", "remaining_time": "3:14:21"}
{"current_steps": 1115, "total_steps": 3750, "loss": 0.4055, "lr": 3.545171688155441e-05, "epoch": 1.784, "percentage": 29.73, "elapsed_time": "1:22:04", "remaining_time": "3:13:57"}
{"current_steps": 1120, "total_steps": 3750, "loss": 0.3998, "lr": 3.5392449603985894e-05, "epoch": 1.792, "percentage": 29.87, "elapsed_time": "1:22:21", "remaining_time": "3:13:24"}
{"current_steps": 1125, "total_steps": 3750, "loss": 0.4377, "lr": 3.53328489006525e-05, "epoch": 1.8, "percentage": 30.0, "elapsed_time": "1:22:39", "remaining_time": "3:12:52"}
{"current_steps": 1130, "total_steps": 3750, "loss": 0.4319, "lr": 3.527291606260345e-05, "epoch": 1.808, "percentage": 30.13, "elapsed_time": "1:22:56", "remaining_time": "3:12:18"}
{"current_steps": 1135, "total_steps": 3750, "loss": 0.4243, "lr": 3.521265238808255e-05, "epoch": 1.8159999999999998, "percentage": 30.27, "elapsed_time": "1:23:15", "remaining_time": "3:11:49"}
{"current_steps": 1140, "total_steps": 3750, "loss": 0.4265, "lr": 3.515205918250007e-05, "epoch": 1.8239999999999998, "percentage": 30.4, "elapsed_time": "1:23:35", "remaining_time": "3:11:21"}
{"current_steps": 1145, "total_steps": 3750, "loss": 0.4249, "lr": 3.5091137758404456e-05, "epoch": 1.8319999999999999, "percentage": 30.53, "elapsed_time": "1:23:52", "remaining_time": "3:10:50"}
{"current_steps": 1150, "total_steps": 3750, "loss": 0.4252, "lr": 3.5029889435453924e-05, "epoch": 1.8399999999999999, "percentage": 30.67, "elapsed_time": "1:24:09", "remaining_time": "3:10:15"}
{"current_steps": 1155, "total_steps": 3750, "loss": 0.3987, "lr": 3.496831554038784e-05, "epoch": 1.8479999999999999, "percentage": 30.8, "elapsed_time": "1:24:28", "remaining_time": "3:09:47"}
{"current_steps": 1160, "total_steps": 3750, "loss": 0.4305, "lr": 3.490641740699801e-05, "epoch": 1.8559999999999999, "percentage": 30.93, "elapsed_time": "1:24:45", "remaining_time": "3:09:14"}
{"current_steps": 1165, "total_steps": 3750, "loss": 0.3991, "lr": 3.484419637609977e-05, "epoch": 1.8639999999999999, "percentage": 31.07, "elapsed_time": "1:25:05", "remaining_time": "3:08:47"}
{"current_steps": 1170, "total_steps": 3750, "loss": 0.3962, "lr": 3.478165379550292e-05, "epoch": 1.8719999999999999, "percentage": 31.2, "elapsed_time": "1:25:23", "remaining_time": "3:08:17"}
{"current_steps": 1175, "total_steps": 3750, "loss": 0.4263, "lr": 3.471879101998262e-05, "epoch": 1.88, "percentage": 31.33, "elapsed_time": "1:25:41", "remaining_time": "3:07:47"}
{"current_steps": 1180, "total_steps": 3750, "loss": 0.4112, "lr": 3.465560941124992e-05, "epoch": 1.888, "percentage": 31.47, "elapsed_time": "1:25:59", "remaining_time": "3:07:17"}
{"current_steps": 1185, "total_steps": 3750, "loss": 0.4112, "lr": 3.459211033792233e-05, "epoch": 1.896, "percentage": 31.6, "elapsed_time": "1:26:19", "remaining_time": "3:06:50"}
{"current_steps": 1190, "total_steps": 3750, "loss": 0.4076, "lr": 3.4528295175494194e-05, "epoch": 1.904, "percentage": 31.73, "elapsed_time": "1:26:35", "remaining_time": "3:06:16"}
{"current_steps": 1195, "total_steps": 3750, "loss": 0.4187, "lr": 3.4464165306306845e-05, "epoch": 1.912, "percentage": 31.87, "elapsed_time": "1:26:53", "remaining_time": "3:05:47"}
{"current_steps": 1200, "total_steps": 3750, "loss": 0.4146, "lr": 3.4399722119518675e-05, "epoch": 1.92, "percentage": 32.0, "elapsed_time": "1:27:08", "remaining_time": "3:05:11"}
{"current_steps": 1205, "total_steps": 3750, "loss": 0.3901, "lr": 3.433496701107506e-05, "epoch": 1.928, "percentage": 32.13, "elapsed_time": "1:29:06", "remaining_time": "3:08:12"}
{"current_steps": 1210, "total_steps": 3750, "loss": 0.4359, "lr": 3.426990138367813e-05, "epoch": 1.936, "percentage": 32.27, "elapsed_time": "1:29:29", "remaining_time": "3:07:50"}
{"current_steps": 1215, "total_steps": 3750, "loss": 0.4173, "lr": 3.420452664675633e-05, "epoch": 1.944, "percentage": 32.4, "elapsed_time": "1:29:47", "remaining_time": "3:07:19"}
{"current_steps": 1220, "total_steps": 3750, "loss": 0.4111, "lr": 3.4138844216433946e-05, "epoch": 1.952, "percentage": 32.53, "elapsed_time": "1:30:04", "remaining_time": "3:06:48"}
{"current_steps": 1225, "total_steps": 3750, "loss": 0.4103, "lr": 3.407285551550041e-05, "epoch": 1.96, "percentage": 32.67, "elapsed_time": "1:30:24", "remaining_time": "3:06:21"}
{"current_steps": 1230, "total_steps": 3750, "loss": 0.4077, "lr": 3.4006561973379466e-05, "epoch": 1.968, "percentage": 32.8, "elapsed_time": "1:30:45", "remaining_time": "3:05:56"}
{"current_steps": 1235, "total_steps": 3750, "loss": 0.4123, "lr": 3.3939965026098245e-05, "epoch": 1.976, "percentage": 32.93, "elapsed_time": "1:31:04", "remaining_time": "3:05:27"}
{"current_steps": 1240, "total_steps": 3750, "loss": 0.3997, "lr": 3.38730661162561e-05, "epoch": 1.984, "percentage": 33.07, "elapsed_time": "1:31:20", "remaining_time": "3:04:54"}
{"current_steps": 1245, "total_steps": 3750, "loss": 0.4067, "lr": 3.3805866692993414e-05, "epoch": 1.992, "percentage": 33.2, "elapsed_time": "1:31:40", "remaining_time": "3:04:26"}
{"current_steps": 1250, "total_steps": 3750, "loss": 0.418, "lr": 3.373836821196018e-05, "epoch": 2.0, "percentage": 33.33, "elapsed_time": "1:31:57", "remaining_time": "3:03:55"}
{"current_steps": 1255, "total_steps": 3750, "loss": 0.3902, "lr": 3.3670572135284456e-05, "epoch": 2.008, "percentage": 33.47, "elapsed_time": "1:32:15", "remaining_time": "3:03:24"}
{"current_steps": 1260, "total_steps": 3750, "loss": 0.397, "lr": 3.360247993154073e-05, "epoch": 2.016, "percentage": 33.6, "elapsed_time": "1:32:35", "remaining_time": "3:02:59"}
{"current_steps": 1265, "total_steps": 3750, "loss": 0.3864, "lr": 3.35340930757181e-05, "epoch": 2.024, "percentage": 33.73, "elapsed_time": "1:32:54", "remaining_time": "3:02:30"}
{"current_steps": 1270, "total_steps": 3750, "loss": 0.3792, "lr": 3.3465413049188276e-05, "epoch": 2.032, "percentage": 33.87, "elapsed_time": "1:33:13", "remaining_time": "3:02:02"}
{"current_steps": 1275, "total_steps": 3750, "loss": 0.3766, "lr": 3.3396441339673564e-05, "epoch": 2.04, "percentage": 34.0, "elapsed_time": "1:33:33", "remaining_time": "3:01:36"}
{"current_steps": 1280, "total_steps": 3750, "loss": 0.3949, "lr": 3.3327179441214574e-05, "epoch": 2.048, "percentage": 34.13, "elapsed_time": "1:33:50", "remaining_time": "3:01:05"}
{"current_steps": 1285, "total_steps": 3750, "loss": 0.3988, "lr": 3.325762885413791e-05, "epoch": 2.056, "percentage": 34.27, "elapsed_time": "1:34:09", "remaining_time": "3:00:37"}
{"current_steps": 1290, "total_steps": 3750, "loss": 0.3733, "lr": 3.318779108502362e-05, "epoch": 2.064, "percentage": 34.4, "elapsed_time": "1:34:27", "remaining_time": "3:00:08"}
{"current_steps": 1295, "total_steps": 3750, "loss": 0.3754, "lr": 3.3117667646672616e-05, "epoch": 2.072, "percentage": 34.53, "elapsed_time": "1:34:45", "remaining_time": "2:59:37"}
{"current_steps": 1300, "total_steps": 3750, "loss": 0.3775, "lr": 3.304726005807386e-05, "epoch": 2.08, "percentage": 34.67, "elapsed_time": "1:35:01", "remaining_time": "2:59:05"}
{"current_steps": 1305, "total_steps": 3750, "loss": 0.388, "lr": 3.297656984437148e-05, "epoch": 2.088, "percentage": 34.8, "elapsed_time": "1:36:44", "remaining_time": "3:01:14"}
{"current_steps": 1310, "total_steps": 3750, "loss": 0.4185, "lr": 3.2905598536831715e-05, "epoch": 2.096, "percentage": 34.93, "elapsed_time": "1:37:04", "remaining_time": "3:00:49"}
{"current_steps": 1315, "total_steps": 3750, "loss": 0.3794, "lr": 3.2834347672809776e-05, "epoch": 2.104, "percentage": 35.07, "elapsed_time": "1:37:22", "remaining_time": "3:00:18"}
{"current_steps": 1320, "total_steps": 3750, "loss": 0.3675, "lr": 3.276281879571651e-05, "epoch": 2.112, "percentage": 35.2, "elapsed_time": "1:37:39", "remaining_time": "2:59:47"}
{"current_steps": 1325, "total_steps": 3750, "loss": 0.3883, "lr": 3.2691013454985006e-05, "epoch": 2.12, "percentage": 35.33, "elapsed_time": "1:37:57", "remaining_time": "2:59:16"}
{"current_steps": 1330, "total_steps": 3750, "loss": 0.394, "lr": 3.2618933206036994e-05, "epoch": 2.128, "percentage": 35.47, "elapsed_time": "1:38:15", "remaining_time": "2:58:47"}
{"current_steps": 1335, "total_steps": 3750, "loss": 0.381, "lr": 3.2546579610249177e-05, "epoch": 2.136, "percentage": 35.6, "elapsed_time": "1:38:34", "remaining_time": "2:58:19"}
{"current_steps": 1340, "total_steps": 3750, "loss": 0.3831, "lr": 3.2473954234919386e-05, "epoch": 2.144, "percentage": 35.73, "elapsed_time": "1:38:55", "remaining_time": "2:57:54"}
{"current_steps": 1345, "total_steps": 3750, "loss": 0.3837, "lr": 3.240105865323266e-05, "epoch": 2.152, "percentage": 35.87, "elapsed_time": "1:39:12", "remaining_time": "2:57:23"}
{"current_steps": 1350, "total_steps": 3750, "loss": 0.3803, "lr": 3.232789444422714e-05, "epoch": 2.16, "percentage": 36.0, "elapsed_time": "1:39:28", "remaining_time": "2:56:51"}
{"current_steps": 1355, "total_steps": 3750, "loss": 0.407, "lr": 3.225446319275988e-05, "epoch": 2.168, "percentage": 36.13, "elapsed_time": "1:39:44", "remaining_time": "2:56:18"}
{"current_steps": 1360, "total_steps": 3750, "loss": 0.3962, "lr": 3.218076648947251e-05, "epoch": 2.176, "percentage": 36.27, "elapsed_time": "1:40:02", "remaining_time": "2:55:48"}
{"current_steps": 1365, "total_steps": 3750, "loss": 0.383, "lr": 3.2106805930756804e-05, "epoch": 2.184, "percentage": 36.4, "elapsed_time": "1:40:19", "remaining_time": "2:55:18"}
{"current_steps": 1370, "total_steps": 3750, "loss": 0.4085, "lr": 3.2032583118720045e-05, "epoch": 2.192, "percentage": 36.53, "elapsed_time": "1:40:38", "remaining_time": "2:54:50"}
{"current_steps": 1375, "total_steps": 3750, "loss": 0.3659, "lr": 3.195809966115038e-05, "epoch": 2.2, "percentage": 36.67, "elapsed_time": "1:40:57", "remaining_time": "2:54:22"}
{"current_steps": 1380, "total_steps": 3750, "loss": 0.3928, "lr": 3.188335717148195e-05, "epoch": 2.208, "percentage": 36.8, "elapsed_time": "1:41:14", "remaining_time": "2:53:52"}
{"current_steps": 1385, "total_steps": 3750, "loss": 0.3745, "lr": 3.1808357268759964e-05, "epoch": 2.216, "percentage": 36.93, "elapsed_time": "1:41:33", "remaining_time": "2:53:25"}
{"current_steps": 1390, "total_steps": 3750, "loss": 0.3747, "lr": 3.173310157760563e-05, "epoch": 2.224, "percentage": 37.07, "elapsed_time": "1:41:50", "remaining_time": "2:52:55"}
{"current_steps": 1395, "total_steps": 3750, "loss": 0.3792, "lr": 3.165759172818093e-05, "epoch": 2.232, "percentage": 37.2, "elapsed_time": "1:42:10", "remaining_time": "2:52:29"}
{"current_steps": 1400, "total_steps": 3750, "loss": 0.3977, "lr": 3.158182935615336e-05, "epoch": 2.24, "percentage": 37.33, "elapsed_time": "1:42:29", "remaining_time": "2:52:02"}
{"current_steps": 1405, "total_steps": 3750, "loss": 0.3984, "lr": 3.150581610266046e-05, "epoch": 2.248, "percentage": 37.47, "elapsed_time": "1:44:27", "remaining_time": "2:54:21"}
{"current_steps": 1410, "total_steps": 3750, "loss": 0.381, "lr": 3.1429553614274256e-05, "epoch": 2.2560000000000002, "percentage": 37.6, "elapsed_time": "1:44:43", "remaining_time": "2:53:48"}
{"current_steps": 1415, "total_steps": 3750, "loss": 0.3761, "lr": 3.1353043542965636e-05, "epoch": 2.2640000000000002, "percentage": 37.73, "elapsed_time": "1:45:00", "remaining_time": "2:53:17"}
{"current_steps": 1420, "total_steps": 3750, "loss": 0.3754, "lr": 3.1276287546068536e-05, "epoch": 2.2720000000000002, "percentage": 37.87, "elapsed_time": "1:45:18", "remaining_time": "2:52:47"}
{"current_steps": 1425, "total_steps": 3750, "loss": 0.3924, "lr": 3.1199287286244047e-05, "epoch": 2.2800000000000002, "percentage": 38.0, "elapsed_time": "1:45:35", "remaining_time": "2:52:17"}
{"current_steps": 1430, "total_steps": 3750, "loss": 0.4048, "lr": 3.112204443144438e-05, "epoch": 2.288, "percentage": 38.13, "elapsed_time": "1:45:52", "remaining_time": "2:51:46"}
{"current_steps": 1435, "total_steps": 3750, "loss": 0.4009, "lr": 3.1044560654876775e-05, "epoch": 2.296, "percentage": 38.27, "elapsed_time": "1:46:12", "remaining_time": "2:51:20"}
{"current_steps": 1440, "total_steps": 3750, "loss": 0.3894, "lr": 3.0966837634967215e-05, "epoch": 2.304, "percentage": 38.4, "elapsed_time": "1:46:30", "remaining_time": "2:50:52"}
{"current_steps": 1445, "total_steps": 3750, "loss": 0.3724, "lr": 3.088887705532409e-05, "epoch": 2.312, "percentage": 38.53, "elapsed_time": "1:46:48", "remaining_time": "2:50:22"}
{"current_steps": 1450, "total_steps": 3750, "loss": 0.3722, "lr": 3.081068060470174e-05, "epoch": 2.32, "percentage": 38.67, "elapsed_time": "1:47:07", "remaining_time": "2:49:55"}
{"current_steps": 1455, "total_steps": 3750, "loss": 0.3892, "lr": 3.073224997696385e-05, "epoch": 2.328, "percentage": 38.8, "elapsed_time": "1:47:25", "remaining_time": "2:49:26"}
{"current_steps": 1460, "total_steps": 3750, "loss": 0.3904, "lr": 3.065358687104675e-05, "epoch": 2.336, "percentage": 38.93, "elapsed_time": "1:47:43", "remaining_time": "2:48:57"}
{"current_steps": 1465, "total_steps": 3750, "loss": 0.3697, "lr": 3.057469299092264e-05, "epoch": 2.344, "percentage": 39.07, "elapsed_time": "1:47:59", "remaining_time": "2:48:26"}
{"current_steps": 1470, "total_steps": 3750, "loss": 0.3702, "lr": 3.0495570045562686e-05, "epoch": 2.352, "percentage": 39.2, "elapsed_time": "1:48:18", "remaining_time": "2:47:58"}
{"current_steps": 1475, "total_steps": 3750, "loss": 0.3708, "lr": 3.041621974889996e-05, "epoch": 2.36, "percentage": 39.33, "elapsed_time": "1:48:35", "remaining_time": "2:47:29"}
{"current_steps": 1480, "total_steps": 3750, "loss": 0.4063, "lr": 3.0336643819792342e-05, "epoch": 2.368, "percentage": 39.47, "elapsed_time": "1:48:53", "remaining_time": "2:47:01"}
{"current_steps": 1485, "total_steps": 3750, "loss": 0.3957, "lr": 3.0256843981985295e-05, "epoch": 2.376, "percentage": 39.6, "elapsed_time": "1:49:11", "remaining_time": "2:46:32"}
{"current_steps": 1490, "total_steps": 3750, "loss": 0.3766, "lr": 3.0176821964074503e-05, "epoch": 2.384, "percentage": 39.73, "elapsed_time": "1:49:30", "remaining_time": "2:46:06"}
{"current_steps": 1495, "total_steps": 3750, "loss": 0.3711, "lr": 3.009657949946844e-05, "epoch": 2.392, "percentage": 39.87, "elapsed_time": "1:49:48", "remaining_time": "2:45:37"}
{"current_steps": 1500, "total_steps": 3750, "loss": 0.3863, "lr": 3.00161183263508e-05, "epoch": 2.4, "percentage": 40.0, "elapsed_time": "1:50:06", "remaining_time": "2:45:09"}
{"current_steps": 1505, "total_steps": 3750, "loss": 0.4124, "lr": 2.993544018764289e-05, "epoch": 2.408, "percentage": 40.13, "elapsed_time": "1:51:59", "remaining_time": "2:47:03"}
{"current_steps": 1510, "total_steps": 3750, "loss": 0.4003, "lr": 2.9854546830965833e-05, "epoch": 2.416, "percentage": 40.27, "elapsed_time": "1:52:19", "remaining_time": "2:46:38"}
{"current_steps": 1515, "total_steps": 3750, "loss": 0.3808, "lr": 2.9773440008602736e-05, "epoch": 2.424, "percentage": 40.4, "elapsed_time": "1:52:35", "remaining_time": "2:46:05"}
{"current_steps": 1520, "total_steps": 3750, "loss": 0.4028, "lr": 2.96921214774607e-05, "epoch": 2.432, "percentage": 40.53, "elapsed_time": "1:52:50", "remaining_time": "2:45:32"}
{"current_steps": 1525, "total_steps": 3750, "loss": 0.3873, "lr": 2.9610592999032815e-05, "epoch": 2.44, "percentage": 40.67, "elapsed_time": "1:53:07", "remaining_time": "2:45:03"}
{"current_steps": 1530, "total_steps": 3750, "loss": 0.365, "lr": 2.9528856339359973e-05, "epoch": 2.448, "percentage": 40.8, "elapsed_time": "1:53:22", "remaining_time": "2:44:30"}
{"current_steps": 1535, "total_steps": 3750, "loss": 0.3956, "lr": 2.9446913268992588e-05, "epoch": 2.456, "percentage": 40.93, "elapsed_time": "1:53:41", "remaining_time": "2:44:03"}
{"current_steps": 1540, "total_steps": 3750, "loss": 0.4069, "lr": 2.936476556295229e-05, "epoch": 2.464, "percentage": 41.07, "elapsed_time": "1:54:00", "remaining_time": "2:43:36"}
{"current_steps": 1545, "total_steps": 3750, "loss": 0.3936, "lr": 2.928241500069346e-05, "epoch": 2.472, "percentage": 41.2, "elapsed_time": "1:54:15", "remaining_time": "2:43:04"}
{"current_steps": 1550, "total_steps": 3750, "loss": 0.3799, "lr": 2.9199863366064655e-05, "epoch": 2.48, "percentage": 41.33, "elapsed_time": "1:54:34", "remaining_time": "2:42:37"}
{"current_steps": 1555, "total_steps": 3750, "loss": 0.369, "lr": 2.9117112447270007e-05, "epoch": 2.488, "percentage": 41.47, "elapsed_time": "1:54:52", "remaining_time": "2:42:09"}
{"current_steps": 1560, "total_steps": 3750, "loss": 0.3928, "lr": 2.9034164036830462e-05, "epoch": 2.496, "percentage": 41.6, "elapsed_time": "1:55:10", "remaining_time": "2:41:41"}
{"current_steps": 1565, "total_steps": 3750, "loss": 0.3754, "lr": 2.8951019931544975e-05, "epoch": 2.504, "percentage": 41.73, "elapsed_time": "1:55:34", "remaining_time": "2:41:21"}
{"current_steps": 1570, "total_steps": 3750, "loss": 0.3882, "lr": 2.8867681932451544e-05, "epoch": 2.512, "percentage": 41.87, "elapsed_time": "1:55:52", "remaining_time": "2:40:53"}
{"current_steps": 1575, "total_steps": 3750, "loss": 0.4039, "lr": 2.8784151844788267e-05, "epoch": 2.52, "percentage": 42.0, "elapsed_time": "1:56:09", "remaining_time": "2:40:24"}
{"current_steps": 1580, "total_steps": 3750, "loss": 0.3807, "lr": 2.8700431477954155e-05, "epoch": 2.528, "percentage": 42.13, "elapsed_time": "1:56:29", "remaining_time": "2:39:59"}
{"current_steps": 1585, "total_steps": 3750, "loss": 0.3926, "lr": 2.8616522645470012e-05, "epoch": 2.536, "percentage": 42.27, "elapsed_time": "1:56:44", "remaining_time": "2:39:27"}
{"current_steps": 1590, "total_steps": 3750, "loss": 0.3744, "lr": 2.8532427164939086e-05, "epoch": 2.544, "percentage": 42.4, "elapsed_time": "1:57:05", "remaining_time": "2:39:03"}
{"current_steps": 1595, "total_steps": 3750, "loss": 0.3992, "lr": 2.844814685800776e-05, "epoch": 2.552, "percentage": 42.53, "elapsed_time": "1:57:23", "remaining_time": "2:38:35"}
{"current_steps": 1600, "total_steps": 3750, "loss": 0.3992, "lr": 2.8363683550326028e-05, "epoch": 2.56, "percentage": 42.67, "elapsed_time": "1:57:42", "remaining_time": "2:38:10"}
{"current_steps": 1605, "total_steps": 3750, "loss": 0.3745, "lr": 2.8279039071508024e-05, "epoch": 2.568, "percentage": 42.8, "elapsed_time": "1:59:30", "remaining_time": "2:39:43"}
{"current_steps": 1610, "total_steps": 3750, "loss": 0.3814, "lr": 2.81942152550923e-05, "epoch": 2.576, "percentage": 42.93, "elapsed_time": "1:59:49", "remaining_time": "2:39:16"}
{"current_steps": 1615, "total_steps": 3750, "loss": 0.3743, "lr": 2.810921393850219e-05, "epoch": 2.584, "percentage": 43.07, "elapsed_time": "2:00:09", "remaining_time": "2:38:50"}
{"current_steps": 1620, "total_steps": 3750, "loss": 0.3977, "lr": 2.802403696300595e-05, "epoch": 2.592, "percentage": 43.2, "elapsed_time": "2:00:25", "remaining_time": "2:38:19"}
{"current_steps": 1625, "total_steps": 3750, "loss": 0.3734, "lr": 2.7938686173676915e-05, "epoch": 2.6, "percentage": 43.33, "elapsed_time": "2:00:41", "remaining_time": "2:37:49"}
{"current_steps": 1630, "total_steps": 3750, "loss": 0.3914, "lr": 2.7853163419353505e-05, "epoch": 2.608, "percentage": 43.47, "elapsed_time": "2:01:00", "remaining_time": "2:37:22"}
{"current_steps": 1635, "total_steps": 3750, "loss": 0.3846, "lr": 2.776747055259918e-05, "epoch": 2.616, "percentage": 43.6, "elapsed_time": "2:01:19", "remaining_time": "2:36:56"}
{"current_steps": 1640, "total_steps": 3750, "loss": 0.3801, "lr": 2.768160942966233e-05, "epoch": 2.624, "percentage": 43.73, "elapsed_time": "2:01:39", "remaining_time": "2:36:30"}
{"current_steps": 1645, "total_steps": 3750, "loss": 0.3866, "lr": 2.759558191043603e-05, "epoch": 2.632, "percentage": 43.87, "elapsed_time": "2:01:57", "remaining_time": "2:36:04"}
{"current_steps": 1650, "total_steps": 3750, "loss": 0.383, "lr": 2.7509389858417783e-05, "epoch": 2.64, "percentage": 44.0, "elapsed_time": "2:02:16", "remaining_time": "2:35:37"}
{"current_steps": 1655, "total_steps": 3750, "loss": 0.3977, "lr": 2.7423035140669147e-05, "epoch": 2.648, "percentage": 44.13, "elapsed_time": "2:02:34", "remaining_time": "2:35:10"}
{"current_steps": 1660, "total_steps": 3750, "loss": 0.3695, "lr": 2.7336519627775288e-05, "epoch": 2.656, "percentage": 44.27, "elapsed_time": "2:02:51", "remaining_time": "2:34:40"}
{"current_steps": 1665, "total_steps": 3750, "loss": 0.4005, "lr": 2.724984519380444e-05, "epoch": 2.664, "percentage": 44.4, "elapsed_time": "2:03:11", "remaining_time": "2:34:15"}
{"current_steps": 1670, "total_steps": 3750, "loss": 0.4008, "lr": 2.7163013716267353e-05, "epoch": 2.672, "percentage": 44.53, "elapsed_time": "2:03:29", "remaining_time": "2:33:48"}
{"current_steps": 1675, "total_steps": 3750, "loss": 0.3943, "lr": 2.707602707607659e-05, "epoch": 2.68, "percentage": 44.67, "elapsed_time": "2:03:45", "remaining_time": "2:33:18"}
{"current_steps": 1680, "total_steps": 3750, "loss": 0.3853, "lr": 2.6988887157505786e-05, "epoch": 2.6879999999999997, "percentage": 44.8, "elapsed_time": "2:04:07", "remaining_time": "2:32:56"}
{"current_steps": 1685, "total_steps": 3750, "loss": 0.3943, "lr": 2.6901595848148842e-05, "epoch": 2.6959999999999997, "percentage": 44.93, "elapsed_time": "2:04:26", "remaining_time": "2:32:30"}
{"current_steps": 1690, "total_steps": 3750, "loss": 0.3868, "lr": 2.681415503887904e-05, "epoch": 2.7039999999999997, "percentage": 45.07, "elapsed_time": "2:04:42", "remaining_time": "2:32:00"}
{"current_steps": 1695, "total_steps": 3750, "loss": 0.3882, "lr": 2.672656662380805e-05, "epoch": 2.7119999999999997, "percentage": 45.2, "elapsed_time": "2:04:59", "remaining_time": "2:31:32"}
{"current_steps": 1700, "total_steps": 3750, "loss": 0.3809, "lr": 2.6638832500244967e-05, "epoch": 2.7199999999999998, "percentage": 45.33, "elapsed_time": "2:05:16", "remaining_time": "2:31:04"}
{"current_steps": 1705, "total_steps": 3750, "loss": 0.3938, "lr": 2.655095456865514e-05, "epoch": 2.7279999999999998, "percentage": 45.47, "elapsed_time": "2:07:02", "remaining_time": "2:32:22"}
{"current_steps": 1710, "total_steps": 3750, "loss": 0.3824, "lr": 2.6462934732619047e-05, "epoch": 2.7359999999999998, "percentage": 45.6, "elapsed_time": "2:07:20", "remaining_time": "2:31:54"}
{"current_steps": 1715, "total_steps": 3750, "loss": 0.3786, "lr": 2.6374774898791047e-05, "epoch": 2.7439999999999998, "percentage": 45.73, "elapsed_time": "2:07:39", "remaining_time": "2:31:28"}
{"current_steps": 1720, "total_steps": 3750, "loss": 0.3726, "lr": 2.6286476976858084e-05, "epoch": 2.752, "percentage": 45.87, "elapsed_time": "2:07:58", "remaining_time": "2:31:01"}
{"current_steps": 1725, "total_steps": 3750, "loss": 0.4018, "lr": 2.619804287949831e-05, "epoch": 2.76, "percentage": 46.0, "elapsed_time": "2:08:14", "remaining_time": "2:30:33"}
{"current_steps": 1730, "total_steps": 3750, "loss": 0.3947, "lr": 2.6109474522339676e-05, "epoch": 2.768, "percentage": 46.13, "elapsed_time": "2:08:33", "remaining_time": "2:30:06"}
{"current_steps": 1735, "total_steps": 3750, "loss": 0.3908, "lr": 2.6020773823918414e-05, "epoch": 2.776, "percentage": 46.27, "elapsed_time": "2:08:49", "remaining_time": "2:29:37"}
{"current_steps": 1740, "total_steps": 3750, "loss": 0.3821, "lr": 2.5931942705637473e-05, "epoch": 2.784, "percentage": 46.4, "elapsed_time": "2:09:11", "remaining_time": "2:29:14"}
{"current_steps": 1745, "total_steps": 3750, "loss": 0.3935, "lr": 2.5842983091724923e-05, "epoch": 2.792, "percentage": 46.53, "elapsed_time": "2:09:29", "remaining_time": "2:28:47"}
{"current_steps": 1750, "total_steps": 3750, "loss": 0.3748, "lr": 2.575389690919226e-05, "epoch": 2.8, "percentage": 46.67, "elapsed_time": "2:09:45", "remaining_time": "2:28:17"}
{"current_steps": 1755, "total_steps": 3750, "loss": 0.3966, "lr": 2.5664686087792658e-05, "epoch": 2.808, "percentage": 46.8, "elapsed_time": "2:10:01", "remaining_time": "2:27:47"}
{"current_steps": 1760, "total_steps": 3750, "loss": 0.3774, "lr": 2.5575352559979188e-05, "epoch": 2.816, "percentage": 46.93, "elapsed_time": "2:10:22", "remaining_time": "2:27:25"}
{"current_steps": 1765, "total_steps": 3750, "loss": 0.3917, "lr": 2.5485898260862936e-05, "epoch": 2.824, "percentage": 47.07, "elapsed_time": "2:10:42", "remaining_time": "2:27:00"}
{"current_steps": 1770, "total_steps": 3750, "loss": 0.3875, "lr": 2.5396325128171072e-05, "epoch": 2.832, "percentage": 47.2, "elapsed_time": "2:11:03", "remaining_time": "2:26:36"}
{"current_steps": 1775, "total_steps": 3750, "loss": 0.4214, "lr": 2.5306635102204942e-05, "epoch": 2.84, "percentage": 47.33, "elapsed_time": "2:11:25", "remaining_time": "2:26:13"}
{"current_steps": 1780, "total_steps": 3750, "loss": 0.3941, "lr": 2.5216830125797943e-05, "epoch": 2.848, "percentage": 47.47, "elapsed_time": "2:11:44", "remaining_time": "2:25:47"}
{"current_steps": 1785, "total_steps": 3750, "loss": 0.4111, "lr": 2.5126912144273517e-05, "epoch": 2.856, "percentage": 47.6, "elapsed_time": "2:11:59", "remaining_time": "2:25:17"}
{"current_steps": 1790, "total_steps": 3750, "loss": 0.398, "lr": 2.5036883105402985e-05, "epoch": 2.864, "percentage": 47.73, "elapsed_time": "2:12:16", "remaining_time": "2:24:50"}
{"current_steps": 1795, "total_steps": 3750, "loss": 0.378, "lr": 2.4946744959363343e-05, "epoch": 2.872, "percentage": 47.87, "elapsed_time": "2:12:34", "remaining_time": "2:24:23"}
{"current_steps": 1800, "total_steps": 3750, "loss": 0.3726, "lr": 2.4856499658695018e-05, "epoch": 2.88, "percentage": 48.0, "elapsed_time": "2:12:52", "remaining_time": "2:23:56"}
{"current_steps": 1805, "total_steps": 3750, "loss": 0.3892, "lr": 2.4766149158259603e-05, "epoch": 2.888, "percentage": 48.13, "elapsed_time": "2:14:41", "remaining_time": "2:25:08"}
{"current_steps": 1810, "total_steps": 3750, "loss": 0.3644, "lr": 2.4675695415197476e-05, "epoch": 2.896, "percentage": 48.27, "elapsed_time": "2:15:04", "remaining_time": "2:24:46"}
{"current_steps": 1815, "total_steps": 3750, "loss": 0.3825, "lr": 2.458514038888543e-05, "epoch": 2.904, "percentage": 48.4, "elapsed_time": "2:15:22", "remaining_time": "2:24:19"}
{"current_steps": 1820, "total_steps": 3750, "loss": 0.3637, "lr": 2.4494486040894208e-05, "epoch": 2.912, "percentage": 48.53, "elapsed_time": "2:15:40", "remaining_time": "2:23:52"}
{"current_steps": 1825, "total_steps": 3750, "loss": 0.3955, "lr": 2.440373433494603e-05, "epoch": 2.92, "percentage": 48.67, "elapsed_time": "2:16:00", "remaining_time": "2:23:27"}
{"current_steps": 1830, "total_steps": 3750, "loss": 0.3909, "lr": 2.4312887236872066e-05, "epoch": 2.928, "percentage": 48.8, "elapsed_time": "2:16:14", "remaining_time": "2:22:56"}
{"current_steps": 1835, "total_steps": 3750, "loss": 0.3911, "lr": 2.4221946714569803e-05, "epoch": 2.936, "percentage": 48.93, "elapsed_time": "2:16:32", "remaining_time": "2:22:29"}
{"current_steps": 1840, "total_steps": 3750, "loss": 0.4035, "lr": 2.4130914737960472e-05, "epoch": 2.944, "percentage": 49.07, "elapsed_time": "2:16:47", "remaining_time": "2:21:59"}
{"current_steps": 1845, "total_steps": 3750, "loss": 0.3734, "lr": 2.4039793278946358e-05, "epoch": 2.952, "percentage": 49.2, "elapsed_time": "2:17:06", "remaining_time": "2:21:34"}
{"current_steps": 1850, "total_steps": 3750, "loss": 0.3971, "lr": 2.394858431136806e-05, "epoch": 2.96, "percentage": 49.33, "elapsed_time": "2:17:25", "remaining_time": "2:21:08"}
{"current_steps": 1855, "total_steps": 3750, "loss": 0.3865, "lr": 2.385728981096178e-05, "epoch": 2.968, "percentage": 49.47, "elapsed_time": "2:17:43", "remaining_time": "2:20:41"}
{"current_steps": 1860, "total_steps": 3750, "loss": 0.3596, "lr": 2.3765911755316503e-05, "epoch": 2.976, "percentage": 49.6, "elapsed_time": "2:18:02", "remaining_time": "2:20:15"}
{"current_steps": 1865, "total_steps": 3750, "loss": 0.3703, "lr": 2.3674452123831125e-05, "epoch": 2.984, "percentage": 49.73, "elapsed_time": "2:18:19", "remaining_time": "2:19:48"}
{"current_steps": 1870, "total_steps": 3750, "loss": 0.4017, "lr": 2.358291289767165e-05, "epoch": 2.992, "percentage": 49.87, "elapsed_time": "2:18:35", "remaining_time": "2:19:19"}
{"current_steps": 1875, "total_steps": 3750, "loss": 0.3866, "lr": 2.3491296059728202e-05, "epoch": 3.0, "percentage": 50.0, "elapsed_time": "2:18:54", "remaining_time": "2:18:54"}
{"current_steps": 1880, "total_steps": 3750, "loss": 0.362, "lr": 2.339960359457212e-05, "epoch": 3.008, "percentage": 50.13, "elapsed_time": "2:19:11", "remaining_time": "2:18:26"}
{"current_steps": 1885, "total_steps": 3750, "loss": 0.3414, "lr": 2.3307837488412955e-05, "epoch": 3.016, "percentage": 50.27, "elapsed_time": "2:19:32", "remaining_time": "2:18:04"}
{"current_steps": 1890, "total_steps": 3750, "loss": 0.3518, "lr": 2.3215999729055437e-05, "epoch": 3.024, "percentage": 50.4, "elapsed_time": "2:19:55", "remaining_time": "2:17:41"}
{"current_steps": 1895, "total_steps": 3750, "loss": 0.354, "lr": 2.312409230585641e-05, "epoch": 3.032, "percentage": 50.53, "elapsed_time": "2:20:10", "remaining_time": "2:17:13"}
{"current_steps": 1900, "total_steps": 3750, "loss": 0.3694, "lr": 2.3032117209681782e-05, "epoch": 3.04, "percentage": 50.67, "elapsed_time": "2:20:29", "remaining_time": "2:16:47"}
{"current_steps": 1905, "total_steps": 3750, "loss": 0.3576, "lr": 2.2940076432863335e-05, "epoch": 3.048, "percentage": 50.8, "elapsed_time": "2:21:58", "remaining_time": "2:17:30"}
{"current_steps": 1910, "total_steps": 3750, "loss": 0.3807, "lr": 2.2847971969155626e-05, "epoch": 3.056, "percentage": 50.93, "elapsed_time": "2:22:14", "remaining_time": "2:17:01"}
{"current_steps": 1915, "total_steps": 3750, "loss": 0.3534, "lr": 2.275580581369276e-05, "epoch": 3.064, "percentage": 51.07, "elapsed_time": "2:22:33", "remaining_time": "2:16:36"}
{"current_steps": 1920, "total_steps": 3750, "loss": 0.3557, "lr": 2.2663579962945205e-05, "epoch": 3.072, "percentage": 51.2, "elapsed_time": "2:22:52", "remaining_time": "2:16:10"}
{"current_steps": 1925, "total_steps": 3750, "loss": 0.344, "lr": 2.2571296414676503e-05, "epoch": 3.08, "percentage": 51.33, "elapsed_time": "2:23:09", "remaining_time": "2:15:43"}
{"current_steps": 1930, "total_steps": 3750, "loss": 0.3738, "lr": 2.2478957167900038e-05, "epoch": 3.088, "percentage": 51.47, "elapsed_time": "2:23:27", "remaining_time": "2:15:16"}
{"current_steps": 1935, "total_steps": 3750, "loss": 0.3558, "lr": 2.23865642228357e-05, "epoch": 3.096, "percentage": 51.6, "elapsed_time": "2:23:47", "remaining_time": "2:14:52"}
{"current_steps": 1940, "total_steps": 3750, "loss": 0.3705, "lr": 2.2294119580866592e-05, "epoch": 3.104, "percentage": 51.73, "elapsed_time": "2:24:05", "remaining_time": "2:14:26"}
{"current_steps": 1945, "total_steps": 3750, "loss": 0.3582, "lr": 2.2201625244495646e-05, "epoch": 3.112, "percentage": 51.87, "elapsed_time": "2:24:26", "remaining_time": "2:14:02"}
{"current_steps": 1950, "total_steps": 3750, "loss": 0.3732, "lr": 2.2109083217302242e-05, "epoch": 3.12, "percentage": 52.0, "elapsed_time": "2:24:41", "remaining_time": "2:13:34"}
{"current_steps": 1955, "total_steps": 3750, "loss": 0.348, "lr": 2.201649550389885e-05, "epoch": 3.128, "percentage": 52.13, "elapsed_time": "2:25:01", "remaining_time": "2:13:09"}
{"current_steps": 1960, "total_steps": 3750, "loss": 0.355, "lr": 2.1923864109887556e-05, "epoch": 3.136, "percentage": 52.27, "elapsed_time": "2:25:21", "remaining_time": "2:12:44"}
{"current_steps": 1965, "total_steps": 3750, "loss": 0.3692, "lr": 2.1831191041816652e-05, "epoch": 3.144, "percentage": 52.4, "elapsed_time": "2:25:40", "remaining_time": "2:12:19"}
{"current_steps": 1970, "total_steps": 3750, "loss": 0.3676, "lr": 2.173847830713715e-05, "epoch": 3.152, "percentage": 52.53, "elapsed_time": "2:25:59", "remaining_time": "2:11:54"}
{"current_steps": 1975, "total_steps": 3750, "loss": 0.3507, "lr": 2.1645727914159315e-05, "epoch": 3.16, "percentage": 52.67, "elapsed_time": "2:26:21", "remaining_time": "2:11:32"}
{"current_steps": 1980, "total_steps": 3750, "loss": 0.3617, "lr": 2.1552941872009144e-05, "epoch": 3.168, "percentage": 52.8, "elapsed_time": "2:26:39", "remaining_time": "2:11:06"}
{"current_steps": 1985, "total_steps": 3750, "loss": 0.3827, "lr": 2.1460122190584868e-05, "epoch": 3.176, "percentage": 52.93, "elapsed_time": "2:26:57", "remaining_time": "2:10:40"}
{"current_steps": 1990, "total_steps": 3750, "loss": 0.3801, "lr": 2.1367270880513377e-05, "epoch": 3.184, "percentage": 53.07, "elapsed_time": "2:27:13", "remaining_time": "2:10:12"}
{"current_steps": 1995, "total_steps": 3750, "loss": 0.3558, "lr": 2.127438995310671e-05, "epoch": 3.192, "percentage": 53.2, "elapsed_time": "2:27:33", "remaining_time": "2:09:48"}
{"current_steps": 2000, "total_steps": 3750, "loss": 0.3575, "lr": 2.118148142031846e-05, "epoch": 3.2, "percentage": 53.33, "elapsed_time": "2:27:51", "remaining_time": "2:09:22"}
{"current_steps": 2005, "total_steps": 3750, "loss": 0.3556, "lr": 2.1088547294700182e-05, "epoch": 3.208, "percentage": 53.47, "elapsed_time": "2:29:13", "remaining_time": "2:09:52"}
{"current_steps": 2010, "total_steps": 3750, "loss": 0.3722, "lr": 2.0995589589357846e-05, "epoch": 3.216, "percentage": 53.6, "elapsed_time": "2:29:34", "remaining_time": "2:09:28"}
{"current_steps": 2015, "total_steps": 3750, "loss": 0.3702, "lr": 2.0902610317908175e-05, "epoch": 3.224, "percentage": 53.73, "elapsed_time": "2:29:54", "remaining_time": "2:09:04"}
{"current_steps": 2020, "total_steps": 3750, "loss": 0.343, "lr": 2.080961149443505e-05, "epoch": 3.232, "percentage": 53.87, "elapsed_time": "2:30:12", "remaining_time": "2:08:38"}
{"current_steps": 2025, "total_steps": 3750, "loss": 0.3616, "lr": 2.071659513344589e-05, "epoch": 3.24, "percentage": 54.0, "elapsed_time": "2:30:29", "remaining_time": "2:08:11"}
{"current_steps": 2030, "total_steps": 3750, "loss": 0.33, "lr": 2.0623563249828e-05, "epoch": 3.248, "percentage": 54.13, "elapsed_time": "2:30:52", "remaining_time": "2:07:49"}
{"current_steps": 2035, "total_steps": 3750, "loss": 0.3669, "lr": 2.053051785880492e-05, "epoch": 3.2560000000000002, "percentage": 54.27, "elapsed_time": "2:31:08", "remaining_time": "2:07:22"}
{"current_steps": 2040, "total_steps": 3750, "loss": 0.3519, "lr": 2.0437460975892814e-05, "epoch": 3.2640000000000002, "percentage": 54.4, "elapsed_time": "2:31:24", "remaining_time": "2:06:55"}
{"current_steps": 2045, "total_steps": 3750, "loss": 0.3643, "lr": 2.0344394616856736e-05, "epoch": 3.2720000000000002, "percentage": 54.53, "elapsed_time": "2:31:42", "remaining_time": "2:06:28"}
{"current_steps": 2050, "total_steps": 3750, "loss": 0.3751, "lr": 2.0251320797667056e-05, "epoch": 3.2800000000000002, "percentage": 54.67, "elapsed_time": "2:32:00", "remaining_time": "2:06:03"}
{"current_steps": 2055, "total_steps": 3750, "loss": 0.3478, "lr": 2.01582415344557e-05, "epoch": 3.288, "percentage": 54.8, "elapsed_time": "2:32:16", "remaining_time": "2:05:36"}
{"current_steps": 2060, "total_steps": 3750, "loss": 0.3677, "lr": 2.006515884347255e-05, "epoch": 3.296, "percentage": 54.93, "elapsed_time": "2:32:36", "remaining_time": "2:05:12"}
{"current_steps": 2065, "total_steps": 3750, "loss": 0.3544, "lr": 1.9972074741041712e-05, "epoch": 3.304, "percentage": 55.07, "elapsed_time": "2:32:53", "remaining_time": "2:04:45"}
{"current_steps": 2070, "total_steps": 3750, "loss": 0.382, "lr": 1.9878991243517913e-05, "epoch": 3.312, "percentage": 55.2, "elapsed_time": "2:33:13", "remaining_time": "2:04:21"}
{"current_steps": 2075, "total_steps": 3750, "loss": 0.357, "lr": 1.9785910367242712e-05, "epoch": 3.32, "percentage": 55.33, "elapsed_time": "2:33:28", "remaining_time": "2:03:53"}
{"current_steps": 2080, "total_steps": 3750, "loss": 0.3666, "lr": 1.969283412850094e-05, "epoch": 3.328, "percentage": 55.47, "elapsed_time": "2:33:47", "remaining_time": "2:03:28"}
{"current_steps": 2085, "total_steps": 3750, "loss": 0.3394, "lr": 1.959976454347696e-05, "epoch": 3.336, "percentage": 55.6, "elapsed_time": "2:34:07", "remaining_time": "2:03:04"}
{"current_steps": 2090, "total_steps": 3750, "loss": 0.3453, "lr": 1.950670362821098e-05, "epoch": 3.344, "percentage": 55.73, "elapsed_time": "2:34:25", "remaining_time": "2:02:39"}
{"current_steps": 2095, "total_steps": 3750, "loss": 0.3756, "lr": 1.9413653398555437e-05, "epoch": 3.352, "percentage": 55.87, "elapsed_time": "2:34:40", "remaining_time": "2:02:11"}
{"current_steps": 2100, "total_steps": 3750, "loss": 0.3602, "lr": 1.9320615870131282e-05, "epoch": 3.36, "percentage": 56.0, "elapsed_time": "2:34:58", "remaining_time": "2:01:46"}
{"current_steps": 2105, "total_steps": 3750, "loss": 0.3674, "lr": 1.9227593058284343e-05, "epoch": 3.368, "percentage": 56.13, "elapsed_time": "2:36:22", "remaining_time": "2:02:12"}
{"current_steps": 2110, "total_steps": 3750, "loss": 0.3718, "lr": 1.9134586978041663e-05, "epoch": 3.376, "percentage": 56.27, "elapsed_time": "2:36:41", "remaining_time": "2:01:47"}
{"current_steps": 2115, "total_steps": 3750, "loss": 0.382, "lr": 1.9041599644067846e-05, "epoch": 3.384, "percentage": 56.4, "elapsed_time": "2:37:00", "remaining_time": "2:01:22"}
{"current_steps": 2120, "total_steps": 3750, "loss": 0.3467, "lr": 1.8948633070621433e-05, "epoch": 3.392, "percentage": 56.53, "elapsed_time": "2:37:17", "remaining_time": "2:00:56"}
{"current_steps": 2125, "total_steps": 3750, "loss": 0.3701, "lr": 1.885568927151124e-05, "epoch": 3.4, "percentage": 56.67, "elapsed_time": "2:37:32", "remaining_time": "2:00:28"}
{"current_steps": 2130, "total_steps": 3750, "loss": 0.3533, "lr": 1.8762770260052773e-05, "epoch": 3.408, "percentage": 56.8, "elapsed_time": "2:37:52", "remaining_time": "2:00:04"}
{"current_steps": 2135, "total_steps": 3750, "loss": 0.3461, "lr": 1.8669878049024575e-05, "epoch": 3.416, "percentage": 56.93, "elapsed_time": "2:38:13", "remaining_time": "1:59:41"}
{"current_steps": 2140, "total_steps": 3750, "loss": 0.3671, "lr": 1.857701465062467e-05, "epoch": 3.424, "percentage": 57.07, "elapsed_time": "2:38:32", "remaining_time": "1:59:16"}
{"current_steps": 2145, "total_steps": 3750, "loss": 0.3641, "lr": 1.848418207642693e-05, "epoch": 3.432, "percentage": 57.2, "elapsed_time": "2:38:51", "remaining_time": "1:58:51"}
{"current_steps": 2150, "total_steps": 3750, "loss": 0.3691, "lr": 1.8391382337337548e-05, "epoch": 3.44, "percentage": 57.33, "elapsed_time": "2:39:10", "remaining_time": "1:58:27"}
{"current_steps": 2155, "total_steps": 3750, "loss": 0.3604, "lr": 1.829861744355144e-05, "epoch": 3.448, "percentage": 57.47, "elapsed_time": "2:39:32", "remaining_time": "1:58:04"}
{"current_steps": 2160, "total_steps": 3750, "loss": 0.3527, "lr": 1.820588940450872e-05, "epoch": 3.456, "percentage": 57.6, "elapsed_time": "2:39:48", "remaining_time": "1:57:38"}
{"current_steps": 2165, "total_steps": 3750, "loss": 0.3391, "lr": 1.8113200228851163e-05, "epoch": 3.464, "percentage": 57.73, "elapsed_time": "2:40:07", "remaining_time": "1:57:13"}
{"current_steps": 2170, "total_steps": 3750, "loss": 0.3349, "lr": 1.80205519243787e-05, "epoch": 3.472, "percentage": 57.87, "elapsed_time": "2:40:24", "remaining_time": "1:56:47"}
{"current_steps": 2175, "total_steps": 3750, "loss": 0.3465, "lr": 1.7927946498005934e-05, "epoch": 3.48, "percentage": 58.0, "elapsed_time": "2:40:39", "remaining_time": "1:56:20"}
{"current_steps": 2180, "total_steps": 3750, "loss": 0.3525, "lr": 1.7835385955718653e-05, "epoch": 3.488, "percentage": 58.13, "elapsed_time": "2:40:57", "remaining_time": "1:55:55"}
{"current_steps": 2185, "total_steps": 3750, "loss": 0.3783, "lr": 1.7742872302530366e-05, "epoch": 3.496, "percentage": 58.27, "elapsed_time": "2:41:14", "remaining_time": "1:55:29"}
{"current_steps": 2190, "total_steps": 3750, "loss": 0.3676, "lr": 1.765040754243892e-05, "epoch": 3.504, "percentage": 58.4, "elapsed_time": "2:41:30", "remaining_time": "1:55:02"}
{"current_steps": 2195, "total_steps": 3750, "loss": 0.3617, "lr": 1.755799367838302e-05, "epoch": 3.512, "percentage": 58.53, "elapsed_time": "2:41:48", "remaining_time": "1:54:37"}
{"current_steps": 2200, "total_steps": 3750, "loss": 0.3659, "lr": 1.746563271219891e-05, "epoch": 3.52, "percentage": 58.67, "elapsed_time": "2:42:06", "remaining_time": "1:54:12"}
{"current_steps": 2205, "total_steps": 3750, "loss": 0.3708, "lr": 1.7373326644576965e-05, "epoch": 3.528, "percentage": 58.8, "elapsed_time": "2:43:31", "remaining_time": "1:54:34"}
{"current_steps": 2210, "total_steps": 3750, "loss": 0.358, "lr": 1.728107747501836e-05, "epoch": 3.536, "percentage": 58.93, "elapsed_time": "2:43:48", "remaining_time": "1:54:09"}
{"current_steps": 2215, "total_steps": 3750, "loss": 0.3413, "lr": 1.7188887201791785e-05, "epoch": 3.544, "percentage": 59.07, "elapsed_time": "2:44:04", "remaining_time": "1:53:42"}
{"current_steps": 2220, "total_steps": 3750, "loss": 0.354, "lr": 1.7096757821890117e-05, "epoch": 3.552, "percentage": 59.2, "elapsed_time": "2:44:23", "remaining_time": "1:53:17"}
{"current_steps": 2225, "total_steps": 3750, "loss": 0.3785, "lr": 1.7004691330987196e-05, "epoch": 3.56, "percentage": 59.33, "elapsed_time": "2:44:42", "remaining_time": "1:52:53"}
{"current_steps": 2230, "total_steps": 3750, "loss": 0.3714, "lr": 1.691268972339458e-05, "epoch": 3.568, "percentage": 59.47, "elapsed_time": "2:45:01", "remaining_time": "1:52:28"}
{"current_steps": 2235, "total_steps": 3750, "loss": 0.3672, "lr": 1.6820754992018344e-05, "epoch": 3.576, "percentage": 59.6, "elapsed_time": "2:45:18", "remaining_time": "1:52:03"}
{"current_steps": 2240, "total_steps": 3750, "loss": 0.3579, "lr": 1.6728889128315932e-05, "epoch": 3.584, "percentage": 59.73, "elapsed_time": "2:45:35", "remaining_time": "1:51:37"}
{"current_steps": 2245, "total_steps": 3750, "loss": 0.3826, "lr": 1.663709412225297e-05, "epoch": 3.592, "percentage": 59.87, "elapsed_time": "2:45:52", "remaining_time": "1:51:11"}
{"current_steps": 2250, "total_steps": 3750, "loss": 0.3678, "lr": 1.654537196226022e-05, "epoch": 3.6, "percentage": 60.0, "elapsed_time": "2:46:07", "remaining_time": "1:50:45"}
{"current_steps": 2255, "total_steps": 3750, "loss": 0.3615, "lr": 1.6453724635190455e-05, "epoch": 3.608, "percentage": 60.13, "elapsed_time": "2:46:24", "remaining_time": "1:50:19"}
{"current_steps": 2260, "total_steps": 3750, "loss": 0.361, "lr": 1.6362154126275467e-05, "epoch": 3.616, "percentage": 60.27, "elapsed_time": "2:46:43", "remaining_time": "1:49:55"}
{"current_steps": 2265, "total_steps": 3750, "loss": 0.3654, "lr": 1.6270662419083018e-05, "epoch": 3.624, "percentage": 60.4, "elapsed_time": "2:47:01", "remaining_time": "1:49:30"}
{"current_steps": 2270, "total_steps": 3750, "loss": 0.3745, "lr": 1.617925149547391e-05, "epoch": 3.632, "percentage": 60.53, "elapsed_time": "2:47:18", "remaining_time": "1:49:04"}
{"current_steps": 2275, "total_steps": 3750, "loss": 0.3449, "lr": 1.608792333555904e-05, "epoch": 3.64, "percentage": 60.67, "elapsed_time": "2:47:36", "remaining_time": "1:48:40"}
{"current_steps": 2280, "total_steps": 3750, "loss": 0.3584, "lr": 1.5996679917656492e-05, "epoch": 3.648, "percentage": 60.8, "elapsed_time": "2:47:53", "remaining_time": "1:48:15"}
{"current_steps": 2285, "total_steps": 3750, "loss": 0.3349, "lr": 1.5905523218248723e-05, "epoch": 3.656, "percentage": 60.93, "elapsed_time": "2:48:11", "remaining_time": "1:47:50"}
{"current_steps": 2290, "total_steps": 3750, "loss": 0.3565, "lr": 1.5814455211939698e-05, "epoch": 3.664, "percentage": 61.07, "elapsed_time": "2:48:29", "remaining_time": "1:47:25"}
{"current_steps": 2295, "total_steps": 3750, "loss": 0.3453, "lr": 1.5723477871412168e-05, "epoch": 3.672, "percentage": 61.2, "elapsed_time": "2:48:44", "remaining_time": "1:46:58"}
{"current_steps": 2300, "total_steps": 3750, "loss": 0.3514, "lr": 1.56325931673849e-05, "epoch": 3.68, "percentage": 61.33, "elapsed_time": "2:49:03", "remaining_time": "1:46:34"}
{"current_steps": 2305, "total_steps": 3750, "loss": 0.3696, "lr": 1.5541803068569993e-05, "epoch": 3.6879999999999997, "percentage": 61.47, "elapsed_time": "2:50:21", "remaining_time": "1:46:47"}
{"current_steps": 2310, "total_steps": 3750, "loss": 0.352, "lr": 1.5451109541630275e-05, "epoch": 3.6959999999999997, "percentage": 61.6, "elapsed_time": "2:50:36", "remaining_time": "1:46:21"}
{"current_steps": 2315, "total_steps": 3750, "loss": 0.3394, "lr": 1.536051455113663e-05, "epoch": 3.7039999999999997, "percentage": 61.73, "elapsed_time": "2:50:53", "remaining_time": "1:45:56"}
{"current_steps": 2320, "total_steps": 3750, "loss": 0.3523, "lr": 1.527002005952551e-05, "epoch": 3.7119999999999997, "percentage": 61.87, "elapsed_time": "2:51:14", "remaining_time": "1:45:33"}
{"current_steps": 2325, "total_steps": 3750, "loss": 0.3576, "lr": 1.5179628027056373e-05, "epoch": 3.7199999999999998, "percentage": 62.0, "elapsed_time": "2:51:33", "remaining_time": "1:45:09"}
{"current_steps": 2330, "total_steps": 3750, "loss": 0.3683, "lr": 1.5089340411769257e-05, "epoch": 3.7279999999999998, "percentage": 62.13, "elapsed_time": "2:51:50", "remaining_time": "1:44:43"}
{"current_steps": 2335, "total_steps": 3750, "loss": 0.3493, "lr": 1.499915916944236e-05, "epoch": 3.7359999999999998, "percentage": 62.27, "elapsed_time": "2:52:09", "remaining_time": "1:44:19"}
{"current_steps": 2340, "total_steps": 3750, "loss": 0.3509, "lr": 1.490908625354964e-05, "epoch": 3.7439999999999998, "percentage": 62.4, "elapsed_time": "2:52:26", "remaining_time": "1:43:54"}
{"current_steps": 2345, "total_steps": 3750, "loss": 0.3514, "lr": 1.4819123615218556e-05, "epoch": 3.752, "percentage": 62.53, "elapsed_time": "2:52:44", "remaining_time": "1:43:29"}
{"current_steps": 2350, "total_steps": 3750, "loss": 0.3545, "lr": 1.472927320318775e-05, "epoch": 3.76, "percentage": 62.67, "elapsed_time": "2:53:03", "remaining_time": "1:43:06"}
{"current_steps": 2355, "total_steps": 3750, "loss": 0.3457, "lr": 1.4639536963764878e-05, "epoch": 3.768, "percentage": 62.8, "elapsed_time": "2:53:24", "remaining_time": "1:42:43"}
{"current_steps": 2360, "total_steps": 3750, "loss": 0.3731, "lr": 1.4549916840784409e-05, "epoch": 3.776, "percentage": 62.93, "elapsed_time": "2:53:41", "remaining_time": "1:42:18"}
{"current_steps": 2365, "total_steps": 3750, "loss": 0.3627, "lr": 1.4460414775565555e-05, "epoch": 3.784, "percentage": 63.07, "elapsed_time": "2:54:00", "remaining_time": "1:41:54"}
{"current_steps": 2370, "total_steps": 3750, "loss": 0.3576, "lr": 1.43710327068702e-05, "epoch": 3.792, "percentage": 63.2, "elapsed_time": "2:54:19", "remaining_time": "1:41:30"}
{"current_steps": 2375, "total_steps": 3750, "loss": 0.3645, "lr": 1.4281772570860897e-05, "epoch": 3.8, "percentage": 63.33, "elapsed_time": "2:54:35", "remaining_time": "1:41:04"}
{"current_steps": 2380, "total_steps": 3750, "loss": 0.3473, "lr": 1.4192636301058952e-05, "epoch": 3.808, "percentage": 63.47, "elapsed_time": "2:54:52", "remaining_time": "1:40:39"}
{"current_steps": 2385, "total_steps": 3750, "loss": 0.3528, "lr": 1.4103625828302508e-05, "epoch": 3.816, "percentage": 63.6, "elapsed_time": "2:55:10", "remaining_time": "1:40:15"}
{"current_steps": 2390, "total_steps": 3750, "loss": 0.3608, "lr": 1.4014743080704743e-05, "epoch": 3.824, "percentage": 63.73, "elapsed_time": "2:55:28", "remaining_time": "1:39:50"}
{"current_steps": 2395, "total_steps": 3750, "loss": 0.3845, "lr": 1.3925989983612118e-05, "epoch": 3.832, "percentage": 63.87, "elapsed_time": "2:55:45", "remaining_time": "1:39:26"}
{"current_steps": 2400, "total_steps": 3750, "loss": 0.3555, "lr": 1.383736845956261e-05, "epoch": 3.84, "percentage": 64.0, "elapsed_time": "2:56:02", "remaining_time": "1:39:01"}
{"current_steps": 2405, "total_steps": 3750, "loss": 0.3465, "lr": 1.3748880428244154e-05, "epoch": 3.848, "percentage": 64.13, "elapsed_time": "2:57:22", "remaining_time": "1:39:11"}
{"current_steps": 2410, "total_steps": 3750, "loss": 0.3575, "lr": 1.3660527806452965e-05, "epoch": 3.856, "percentage": 64.27, "elapsed_time": "2:57:40", "remaining_time": "1:38:47"}
{"current_steps": 2415, "total_steps": 3750, "loss": 0.3702, "lr": 1.3572312508052118e-05, "epoch": 3.864, "percentage": 64.4, "elapsed_time": "2:57:58", "remaining_time": "1:38:22"}
{"current_steps": 2420, "total_steps": 3750, "loss": 0.3702, "lr": 1.3484236443929982e-05, "epoch": 3.872, "percentage": 64.53, "elapsed_time": "2:58:16", "remaining_time": "1:37:58"}
{"current_steps": 2425, "total_steps": 3750, "loss": 0.3605, "lr": 1.3396301521958926e-05, "epoch": 3.88, "percentage": 64.67, "elapsed_time": "2:58:36", "remaining_time": "1:37:35"}
{"current_steps": 2430, "total_steps": 3750, "loss": 0.3582, "lr": 1.3308509646953934e-05, "epoch": 3.888, "percentage": 64.8, "elapsed_time": "2:58:55", "remaining_time": "1:37:11"}
{"current_steps": 2435, "total_steps": 3750, "loss": 0.3359, "lr": 1.3220862720631349e-05, "epoch": 3.896, "percentage": 64.93, "elapsed_time": "2:59:13", "remaining_time": "1:36:47"}
{"current_steps": 2440, "total_steps": 3750, "loss": 0.3514, "lr": 1.3133362641567697e-05, "epoch": 3.904, "percentage": 65.07, "elapsed_time": "2:59:30", "remaining_time": "1:36:22"}
{"current_steps": 2445, "total_steps": 3750, "loss": 0.3665, "lr": 1.3046011305158546e-05, "epoch": 3.912, "percentage": 65.2, "elapsed_time": "2:59:48", "remaining_time": "1:35:58"}
{"current_steps": 2450, "total_steps": 3750, "loss": 0.3493, "lr": 1.2958810603577456e-05, "epoch": 3.92, "percentage": 65.33, "elapsed_time": "3:00:06", "remaining_time": "1:35:34"}
{"current_steps": 2455, "total_steps": 3750, "loss": 0.3501, "lr": 1.2871762425734989e-05, "epoch": 3.928, "percentage": 65.47, "elapsed_time": "3:00:23", "remaining_time": "1:35:09"}
{"current_steps": 2460, "total_steps": 3750, "loss": 0.3446, "lr": 1.278486865723779e-05, "epoch": 3.936, "percentage": 65.6, "elapsed_time": "3:00:39", "remaining_time": "1:34:44"}
{"current_steps": 2465, "total_steps": 3750, "loss": 0.3609, "lr": 1.269813118034775e-05, "epoch": 3.944, "percentage": 65.73, "elapsed_time": "3:00:56", "remaining_time": "1:34:19"}
{"current_steps": 2470, "total_steps": 3750, "loss": 0.3819, "lr": 1.2611551873941213e-05, "epoch": 3.952, "percentage": 65.87, "elapsed_time": "3:01:14", "remaining_time": "1:33:55"}
{"current_steps": 2475, "total_steps": 3750, "loss": 0.3662, "lr": 1.2525132613468309e-05, "epoch": 3.96, "percentage": 66.0, "elapsed_time": "3:01:33", "remaining_time": "1:33:31"}
{"current_steps": 2480, "total_steps": 3750, "loss": 0.367, "lr": 1.2438875270912294e-05, "epoch": 3.968, "percentage": 66.13, "elapsed_time": "3:01:50", "remaining_time": "1:33:07"}
{"current_steps": 2485, "total_steps": 3750, "loss": 0.3733, "lr": 1.2352781714749016e-05, "epoch": 3.976, "percentage": 66.27, "elapsed_time": "3:02:08", "remaining_time": "1:32:43"}
{"current_steps": 2490, "total_steps": 3750, "loss": 0.3761, "lr": 1.2266853809906469e-05, "epoch": 3.984, "percentage": 66.4, "elapsed_time": "3:02:26", "remaining_time": "1:32:18"}
{"current_steps": 2495, "total_steps": 3750, "loss": 0.3614, "lr": 1.2181093417724317e-05, "epoch": 3.992, "percentage": 66.53, "elapsed_time": "3:02:45", "remaining_time": "1:31:55"}
{"current_steps": 2500, "total_steps": 3750, "loss": 0.3682, "lr": 1.2095502395913676e-05, "epoch": 4.0, "percentage": 66.67, "elapsed_time": "3:03:02", "remaining_time": "1:31:31"}
{"current_steps": 2505, "total_steps": 3750, "loss": 0.3443, "lr": 1.2010082598516775e-05, "epoch": 4.008, "percentage": 66.8, "elapsed_time": "3:04:20", "remaining_time": "1:31:37"}
{"current_steps": 2510, "total_steps": 3750, "loss": 0.3492, "lr": 1.1924835875866884e-05, "epoch": 4.016, "percentage": 66.93, "elapsed_time": "3:04:35", "remaining_time": "1:31:11"}
{"current_steps": 2515, "total_steps": 3750, "loss": 0.3354, "lr": 1.1839764074548145e-05, "epoch": 4.024, "percentage": 67.07, "elapsed_time": "3:04:58", "remaining_time": "1:30:49"}
{"current_steps": 2520, "total_steps": 3750, "loss": 0.3504, "lr": 1.1754869037355659e-05, "epoch": 4.032, "percentage": 67.2, "elapsed_time": "3:05:16", "remaining_time": "1:30:25"}
{"current_steps": 2525, "total_steps": 3750, "loss": 0.3354, "lr": 1.1670152603255504e-05, "epoch": 4.04, "percentage": 67.33, "elapsed_time": "3:05:36", "remaining_time": "1:30:02"}
{"current_steps": 2530, "total_steps": 3750, "loss": 0.3515, "lr": 1.1585616607344909e-05, "epoch": 4.048, "percentage": 67.47, "elapsed_time": "3:05:57", "remaining_time": "1:29:40"}
{"current_steps": 2535, "total_steps": 3750, "loss": 0.3456, "lr": 1.1501262880812547e-05, "epoch": 4.056, "percentage": 67.6, "elapsed_time": "3:06:12", "remaining_time": "1:29:14"}
{"current_steps": 2540, "total_steps": 3750, "loss": 0.3441, "lr": 1.141709325089881e-05, "epoch": 4.064, "percentage": 67.73, "elapsed_time": "3:06:34", "remaining_time": "1:28:52"}
{"current_steps": 2545, "total_steps": 3750, "loss": 0.3431, "lr": 1.1333109540856257e-05, "epoch": 4.072, "percentage": 67.87, "elapsed_time": "3:06:49", "remaining_time": "1:28:27"}
{"current_steps": 2550, "total_steps": 3750, "loss": 0.3556, "lr": 1.1249313569910143e-05, "epoch": 4.08, "percentage": 68.0, "elapsed_time": "3:07:08", "remaining_time": "1:28:04"}
{"current_steps": 2555, "total_steps": 3750, "loss": 0.3354, "lr": 1.1165707153218942e-05, "epoch": 4.088, "percentage": 68.13, "elapsed_time": "3:07:28", "remaining_time": "1:27:40"}
{"current_steps": 2560, "total_steps": 3750, "loss": 0.3345, "lr": 1.1082292101835121e-05, "epoch": 4.096, "percentage": 68.27, "elapsed_time": "3:07:46", "remaining_time": "1:27:16"}
{"current_steps": 2565, "total_steps": 3750, "loss": 0.341, "lr": 1.099907022266582e-05, "epoch": 4.104, "percentage": 68.4, "elapsed_time": "3:08:01", "remaining_time": "1:26:52"}
{"current_steps": 2570, "total_steps": 3750, "loss": 0.3408, "lr": 1.0916043318433767e-05, "epoch": 4.112, "percentage": 68.53, "elapsed_time": "3:08:19", "remaining_time": "1:26:27"}
{"current_steps": 2575, "total_steps": 3750, "loss": 0.3453, "lr": 1.0833213187638203e-05, "epoch": 4.12, "percentage": 68.67, "elapsed_time": "3:08:36", "remaining_time": "1:26:03"}
{"current_steps": 2580, "total_steps": 3750, "loss": 0.3487, "lr": 1.0750581624515957e-05, "epoch": 4.128, "percentage": 68.8, "elapsed_time": "3:08:53", "remaining_time": "1:25:39"}
{"current_steps": 2585, "total_steps": 3750, "loss": 0.3458, "lr": 1.0668150419002527e-05, "epoch": 4.136, "percentage": 68.93, "elapsed_time": "3:09:10", "remaining_time": "1:25:15"}
{"current_steps": 2590, "total_steps": 3750, "loss": 0.3389, "lr": 1.0585921356693349e-05, "epoch": 4.144, "percentage": 69.07, "elapsed_time": "3:09:30", "remaining_time": "1:24:52"}
{"current_steps": 2595, "total_steps": 3750, "loss": 0.332, "lr": 1.0503896218805112e-05, "epoch": 4.152, "percentage": 69.2, "elapsed_time": "3:09:50", "remaining_time": "1:24:29"}
{"current_steps": 2600, "total_steps": 3750, "loss": 0.3368, "lr": 1.0422076782137155e-05, "epoch": 4.16, "percentage": 69.33, "elapsed_time": "3:10:11", "remaining_time": "1:24:07"}
{"current_steps": 2605, "total_steps": 3750, "loss": 0.335, "lr": 1.0340464819032991e-05, "epoch": 4.168, "percentage": 69.47, "elapsed_time": "3:11:26", "remaining_time": "1:24:08"}
{"current_steps": 2610, "total_steps": 3750, "loss": 0.323, "lr": 1.0259062097341911e-05, "epoch": 4.176, "percentage": 69.6, "elapsed_time": "3:11:45", "remaining_time": "1:23:45"}
{"current_steps": 2615, "total_steps": 3750, "loss": 0.3483, "lr": 1.017787038038071e-05, "epoch": 4.184, "percentage": 69.73, "elapsed_time": "3:12:06", "remaining_time": "1:23:22"}
{"current_steps": 2620, "total_steps": 3750, "loss": 0.3371, "lr": 1.0096891426895476e-05, "epoch": 4.192, "percentage": 69.87, "elapsed_time": "3:12:22", "remaining_time": "1:22:58"}
{"current_steps": 2625, "total_steps": 3750, "loss": 0.34, "lr": 1.0016126991023447e-05, "epoch": 4.2, "percentage": 70.0, "elapsed_time": "3:12:40", "remaining_time": "1:22:34"}
{"current_steps": 2630, "total_steps": 3750, "loss": 0.3559, "lr": 9.935578822255113e-06, "epoch": 4.208, "percentage": 70.13, "elapsed_time": "3:13:00", "remaining_time": "1:22:11"}
{"current_steps": 2635, "total_steps": 3750, "loss": 0.3335, "lr": 9.855248665396218e-06, "epoch": 4.216, "percentage": 70.27, "elapsed_time": "3:13:18", "remaining_time": "1:21:47"}
{"current_steps": 2640, "total_steps": 3750, "loss": 0.3349, "lr": 9.775138260530046e-06, "epoch": 4.224, "percentage": 70.4, "elapsed_time": "3:13:35", "remaining_time": "1:21:23"}
{"current_steps": 2645, "total_steps": 3750, "loss": 0.3415, "lr": 9.695249342979667e-06, "epoch": 4.232, "percentage": 70.53, "elapsed_time": "3:13:54", "remaining_time": "1:21:00"}
{"current_steps": 2650, "total_steps": 3750, "loss": 0.3476, "lr": 9.615583643270371e-06, "epoch": 4.24, "percentage": 70.67, "elapsed_time": "3:14:12", "remaining_time": "1:20:36"}
{"current_steps": 2655, "total_steps": 3750, "loss": 0.329, "lr": 9.536142887092208e-06, "epoch": 4.248, "percentage": 70.8, "elapsed_time": "3:14:32", "remaining_time": "1:20:14"}
{"current_steps": 2660, "total_steps": 3750, "loss": 0.3385, "lr": 9.456928795262552e-06, "epoch": 4.256, "percentage": 70.93, "elapsed_time": "3:14:49", "remaining_time": "1:19:49"}
{"current_steps": 2665, "total_steps": 3750, "loss": 0.3261, "lr": 9.377943083688873e-06, "epoch": 4.264, "percentage": 71.07, "elapsed_time": "3:15:06", "remaining_time": "1:19:25"}
{"current_steps": 2670, "total_steps": 3750, "loss": 0.3337, "lr": 9.29918746333153e-06, "epoch": 4.272, "percentage": 71.2, "elapsed_time": "3:15:22", "remaining_time": "1:19:01"}
{"current_steps": 2675, "total_steps": 3750, "loss": 0.3504, "lr": 9.220663640166756e-06, "epoch": 4.28, "percentage": 71.33, "elapsed_time": "3:15:40", "remaining_time": "1:18:38"}
{"current_steps": 2680, "total_steps": 3750, "loss": 0.35, "lr": 9.142373315149655e-06, "epoch": 4.288, "percentage": 71.47, "elapsed_time": "3:15:59", "remaining_time": "1:18:15"}
{"current_steps": 2685, "total_steps": 3750, "loss": 0.3506, "lr": 9.064318184177373e-06, "epoch": 4.296, "percentage": 71.6, "elapsed_time": "3:16:17", "remaining_time": "1:17:51"}
{"current_steps": 2690, "total_steps": 3750, "loss": 0.3316, "lr": 8.986499938052396e-06, "epoch": 4.304, "percentage": 71.73, "elapsed_time": "3:16:34", "remaining_time": "1:17:27"}
{"current_steps": 2695, "total_steps": 3750, "loss": 0.3351, "lr": 8.908920262445859e-06, "epoch": 4.312, "percentage": 71.87, "elapsed_time": "3:16:50", "remaining_time": "1:17:03"}
{"current_steps": 2700, "total_steps": 3750, "loss": 0.3321, "lr": 8.831580837861082e-06, "epoch": 4.32, "percentage": 72.0, "elapsed_time": "3:17:06", "remaining_time": "1:16:39"}
{"current_steps": 2705, "total_steps": 3750, "loss": 0.3447, "lr": 8.754483339597166e-06, "epoch": 4.328, "percentage": 72.13, "elapsed_time": "3:18:24", "remaining_time": "1:16:39"}
{"current_steps": 2710, "total_steps": 3750, "loss": 0.3519, "lr": 8.677629437712665e-06, "epoch": 4.336, "percentage": 72.27, "elapsed_time": "3:18:38", "remaining_time": "1:16:14"}
{"current_steps": 2715, "total_steps": 3750, "loss": 0.329, "lr": 8.601020796989467e-06, "epoch": 4.344, "percentage": 72.4, "elapsed_time": "3:18:54", "remaining_time": "1:15:49"}
{"current_steps": 2720, "total_steps": 3750, "loss": 0.3383, "lr": 8.524659076896656e-06, "epoch": 4.352, "percentage": 72.53, "elapsed_time": "3:19:14", "remaining_time": "1:15:26"}
{"current_steps": 2725, "total_steps": 3750, "loss": 0.3359, "lr": 8.448545931554652e-06, "epoch": 4.36, "percentage": 72.67, "elapsed_time": "3:19:30", "remaining_time": "1:15:02"}
{"current_steps": 2730, "total_steps": 3750, "loss": 0.3335, "lr": 8.372683009699307e-06, "epoch": 4.368, "percentage": 72.8, "elapsed_time": "3:19:47", "remaining_time": "1:14:38"}
{"current_steps": 2735, "total_steps": 3750, "loss": 0.3535, "lr": 8.297071954646248e-06, "epoch": 4.376, "percentage": 72.93, "elapsed_time": "3:20:06", "remaining_time": "1:14:15"}
{"current_steps": 2740, "total_steps": 3750, "loss": 0.3327, "lr": 8.22171440425523e-06, "epoch": 4.384, "percentage": 73.07, "elapsed_time": "3:20:23", "remaining_time": "1:13:52"}
{"current_steps": 2745, "total_steps": 3750, "loss": 0.337, "lr": 8.146611990894683e-06, "epoch": 4.392, "percentage": 73.2, "elapsed_time": "3:20:41", "remaining_time": "1:13:28"}
{"current_steps": 2750, "total_steps": 3750, "loss": 0.357, "lr": 8.071766341406363e-06, "epoch": 4.4, "percentage": 73.33, "elapsed_time": "3:21:01", "remaining_time": "1:13:05"}
{"current_steps": 2755, "total_steps": 3750, "loss": 0.3297, "lr": 7.997179077070092e-06, "epoch": 4.408, "percentage": 73.47, "elapsed_time": "3:21:16", "remaining_time": "1:12:41"}
{"current_steps": 2760, "total_steps": 3750, "loss": 0.3463, "lr": 7.92285181356864e-06, "epoch": 4.416, "percentage": 73.6, "elapsed_time": "3:21:36", "remaining_time": "1:12:19"}
{"current_steps": 2765, "total_steps": 3750, "loss": 0.337, "lr": 7.848786160952726e-06, "epoch": 4.424, "percentage": 73.73, "elapsed_time": "3:21:55", "remaining_time": "1:11:55"}
{"current_steps": 2770, "total_steps": 3750, "loss": 0.3269, "lr": 7.77498372360617e-06, "epoch": 4.432, "percentage": 73.87, "elapsed_time": "3:22:11", "remaining_time": "1:11:31"}
{"current_steps": 2775, "total_steps": 3750, "loss": 0.3389, "lr": 7.701446100211095e-06, "epoch": 4.44, "percentage": 74.0, "elapsed_time": "3:22:32", "remaining_time": "1:11:09"}
{"current_steps": 2780, "total_steps": 3750, "loss": 0.3373, "lr": 7.628174883713322e-06, "epoch": 4.448, "percentage": 74.13, "elapsed_time": "3:22:50", "remaining_time": "1:10:46"}
{"current_steps": 2785, "total_steps": 3750, "loss": 0.3407, "lr": 7.555171661287875e-06, "epoch": 4.456, "percentage": 74.27, "elapsed_time": "3:23:05", "remaining_time": "1:10:22"}
{"current_steps": 2790, "total_steps": 3750, "loss": 0.3449, "lr": 7.482438014304567e-06, "epoch": 4.464, "percentage": 74.4, "elapsed_time": "3:23:20", "remaining_time": "1:09:58"}
{"current_steps": 2795, "total_steps": 3750, "loss": 0.3215, "lr": 7.4099755182937685e-06, "epoch": 4.4719999999999995, "percentage": 74.53, "elapsed_time": "3:23:38", "remaining_time": "1:09:34"}
{"current_steps": 2800, "total_steps": 3750, "loss": 0.3406, "lr": 7.337785742912289e-06, "epoch": 4.48, "percentage": 74.67, "elapsed_time": "3:23:59", "remaining_time": "1:09:12"}
{"current_steps": 2805, "total_steps": 3750, "loss": 0.34, "lr": 7.265870251909335e-06, "epoch": 4.4879999999999995, "percentage": 74.8, "elapsed_time": "3:25:19", "remaining_time": "1:09:10"}
{"current_steps": 2810, "total_steps": 3750, "loss": 0.3363, "lr": 7.194230603092697e-06, "epoch": 4.496, "percentage": 74.93, "elapsed_time": "3:25:34", "remaining_time": "1:08:46"}
{"current_steps": 2815, "total_steps": 3750, "loss": 0.3489, "lr": 7.122868348294927e-06, "epoch": 4.504, "percentage": 75.07, "elapsed_time": "3:25:51", "remaining_time": "1:08:22"}
{"current_steps": 2820, "total_steps": 3750, "loss": 0.3667, "lr": 7.051785033339804e-06, "epoch": 4.5120000000000005, "percentage": 75.2, "elapsed_time": "3:26:09", "remaining_time": "1:07:59"}
{"current_steps": 2825, "total_steps": 3750, "loss": 0.3234, "lr": 6.980982198008785e-06, "epoch": 4.52, "percentage": 75.33, "elapsed_time": "3:26:27", "remaining_time": "1:07:36"}
{"current_steps": 2830, "total_steps": 3750, "loss": 0.3502, "lr": 6.910461376007704e-06, "epoch": 4.5280000000000005, "percentage": 75.47, "elapsed_time": "3:26:47", "remaining_time": "1:07:13"}
{"current_steps": 2835, "total_steps": 3750, "loss": 0.337, "lr": 6.840224094933501e-06, "epoch": 4.536, "percentage": 75.6, "elapsed_time": "3:27:04", "remaining_time": "1:06:50"}
{"current_steps": 2840, "total_steps": 3750, "loss": 0.367, "lr": 6.7702718762411505e-06, "epoch": 4.5440000000000005, "percentage": 75.73, "elapsed_time": "3:27:22", "remaining_time": "1:06:26"}
{"current_steps": 2845, "total_steps": 3750, "loss": 0.3323, "lr": 6.700606235210731e-06, "epoch": 4.552, "percentage": 75.87, "elapsed_time": "3:27:41", "remaining_time": "1:06:03"}
{"current_steps": 2850, "total_steps": 3750, "loss": 0.3447, "lr": 6.631228680914558e-06, "epoch": 4.5600000000000005, "percentage": 76.0, "elapsed_time": "3:28:01", "remaining_time": "1:05:41"}
{"current_steps": 2855, "total_steps": 3750, "loss": 0.3384, "lr": 6.562140716184515e-06, "epoch": 4.568, "percentage": 76.13, "elapsed_time": "3:28:19", "remaining_time": "1:05:18"}
{"current_steps": 2860, "total_steps": 3750, "loss": 0.3455, "lr": 6.493343837579511e-06, "epoch": 4.576, "percentage": 76.27, "elapsed_time": "3:28:36", "remaining_time": "1:04:55"}
{"current_steps": 2865, "total_steps": 3750, "loss": 0.3326, "lr": 6.424839535353045e-06, "epoch": 4.584, "percentage": 76.4, "elapsed_time": "3:28:55", "remaining_time": "1:04:32"}
{"current_steps": 2870, "total_steps": 3750, "loss": 0.3303, "lr": 6.356629293420926e-06, "epoch": 4.592, "percentage": 76.53, "elapsed_time": "3:29:11", "remaining_time": "1:04:08"}
{"current_steps": 2875, "total_steps": 3750, "loss": 0.3412, "lr": 6.28871458932913e-06, "epoch": 4.6, "percentage": 76.67, "elapsed_time": "3:29:30", "remaining_time": "1:03:45"}
{"current_steps": 2880, "total_steps": 3750, "loss": 0.3349, "lr": 6.2210968942218206e-06, "epoch": 4.608, "percentage": 76.8, "elapsed_time": "3:29:50", "remaining_time": "1:03:23"}
{"current_steps": 2885, "total_steps": 3750, "loss": 0.3407, "lr": 6.153777672809438e-06, "epoch": 4.616, "percentage": 76.93, "elapsed_time": "3:30:07", "remaining_time": "1:03:00"}
{"current_steps": 2890, "total_steps": 3750, "loss": 0.3434, "lr": 6.086758383336984e-06, "epoch": 4.624, "percentage": 77.07, "elapsed_time": "3:30:23", "remaining_time": "1:02:36"}
{"current_steps": 2895, "total_steps": 3750, "loss": 0.3379, "lr": 6.0200404775524715e-06, "epoch": 4.632, "percentage": 77.2, "elapsed_time": "3:30:40", "remaining_time": "1:02:13"}
{"current_steps": 2900, "total_steps": 3750, "loss": 0.3272, "lr": 5.9536254006754155e-06, "epoch": 4.64, "percentage": 77.33, "elapsed_time": "3:31:01", "remaining_time": "1:01:51"}
{"current_steps": 2905, "total_steps": 3750, "loss": 0.3221, "lr": 5.887514591365593e-06, "epoch": 4.648, "percentage": 77.47, "elapsed_time": "3:32:20", "remaining_time": "1:01:46"}
{"current_steps": 2910, "total_steps": 3750, "loss": 0.3408, "lr": 5.821709481691798e-06, "epoch": 4.656, "percentage": 77.6, "elapsed_time": "3:32:37", "remaining_time": "1:01:22"}
{"current_steps": 2915, "total_steps": 3750, "loss": 0.3398, "lr": 5.75621149710091e-06, "epoch": 4.664, "percentage": 77.73, "elapsed_time": "3:32:57", "remaining_time": "1:01:00"}
{"current_steps": 2920, "total_steps": 3750, "loss": 0.3142, "lr": 5.691022056386961e-06, "epoch": 4.672, "percentage": 77.87, "elapsed_time": "3:33:18", "remaining_time": "1:00:37"}
{"current_steps": 2925, "total_steps": 3750, "loss": 0.3279, "lr": 5.6261425716604136e-06, "epoch": 4.68, "percentage": 78.0, "elapsed_time": "3:33:34", "remaining_time": "1:00:14"}
{"current_steps": 2930, "total_steps": 3750, "loss": 0.3434, "lr": 5.56157444831757e-06, "epoch": 4.688, "percentage": 78.13, "elapsed_time": "3:33:52", "remaining_time": "0:59:51"}
{"current_steps": 2935, "total_steps": 3750, "loss": 0.3393, "lr": 5.4973190850101334e-06, "epoch": 4.696, "percentage": 78.27, "elapsed_time": "3:34:08", "remaining_time": "0:59:27"}
{"current_steps": 2940, "total_steps": 3750, "loss": 0.3554, "lr": 5.433377873614925e-06, "epoch": 4.704, "percentage": 78.4, "elapsed_time": "3:34:27", "remaining_time": "0:59:05"}
{"current_steps": 2945, "total_steps": 3750, "loss": 0.3521, "lr": 5.369752199203702e-06, "epoch": 4.712, "percentage": 78.53, "elapsed_time": "3:34:44", "remaining_time": "0:58:41"}
{"current_steps": 2950, "total_steps": 3750, "loss": 0.338, "lr": 5.306443440013171e-06, "epoch": 4.72, "percentage": 78.67, "elapsed_time": "3:35:01", "remaining_time": "0:58:18"}
{"current_steps": 2955, "total_steps": 3750, "loss": 0.3398, "lr": 5.243452967415155e-06, "epoch": 4.728, "percentage": 78.8, "elapsed_time": "3:35:19", "remaining_time": "0:57:55"}
{"current_steps": 2960, "total_steps": 3750, "loss": 0.3363, "lr": 5.180782145886846e-06, "epoch": 4.736, "percentage": 78.93, "elapsed_time": "3:35:37", "remaining_time": "0:57:32"}
{"current_steps": 2965, "total_steps": 3750, "loss": 0.3177, "lr": 5.118432332981273e-06, "epoch": 4.744, "percentage": 79.07, "elapsed_time": "3:35:57", "remaining_time": "0:57:10"}
{"current_steps": 2970, "total_steps": 3750, "loss": 0.334, "lr": 5.056404879297887e-06, "epoch": 4.752, "percentage": 79.2, "elapsed_time": "3:36:14", "remaining_time": "0:56:47"}
{"current_steps": 2975, "total_steps": 3750, "loss": 0.3332, "lr": 4.994701128453325e-06, "epoch": 4.76, "percentage": 79.33, "elapsed_time": "3:36:32", "remaining_time": "0:56:24"}
{"current_steps": 2980, "total_steps": 3750, "loss": 0.313, "lr": 4.933322417052269e-06, "epoch": 4.768, "percentage": 79.47, "elapsed_time": "3:36:50", "remaining_time": "0:56:01"}
{"current_steps": 2985, "total_steps": 3750, "loss": 0.3583, "lr": 4.8722700746585135e-06, "epoch": 4.776, "percentage": 79.6, "elapsed_time": "3:37:08", "remaining_time": "0:55:38"}
{"current_steps": 2990, "total_steps": 3750, "loss": 0.3498, "lr": 4.811545423766184e-06, "epoch": 4.784, "percentage": 79.73, "elapsed_time": "3:37:23", "remaining_time": "0:55:15"}
{"current_steps": 2995, "total_steps": 3750, "loss": 0.3399, "lr": 4.75114977977104e-06, "epoch": 4.792, "percentage": 79.87, "elapsed_time": "3:37:40", "remaining_time": "0:54:52"}
{"current_steps": 3000, "total_steps": 3750, "loss": 0.3341, "lr": 4.691084450942047e-06, "epoch": 4.8, "percentage": 80.0, "elapsed_time": "3:38:02", "remaining_time": "0:54:30"}
{"current_steps": 3005, "total_steps": 3750, "loss": 0.3357, "lr": 4.631350738392955e-06, "epoch": 4.808, "percentage": 80.13, "elapsed_time": "3:39:20", "remaining_time": "0:54:22"}
{"current_steps": 3010, "total_steps": 3750, "loss": 0.3496, "lr": 4.571949936054197e-06, "epoch": 4.816, "percentage": 80.27, "elapsed_time": "3:39:36", "remaining_time": "0:53:59"}
{"current_steps": 3015, "total_steps": 3750, "loss": 0.3405, "lr": 4.512883330644815e-06, "epoch": 4.824, "percentage": 80.4, "elapsed_time": "3:39:55", "remaining_time": "0:53:36"}
{"current_steps": 3020, "total_steps": 3750, "loss": 0.3339, "lr": 4.454152201644591e-06, "epoch": 4.832, "percentage": 80.53, "elapsed_time": "3:40:11", "remaining_time": "0:53:13"}
{"current_steps": 3025, "total_steps": 3750, "loss": 0.3356, "lr": 4.395757821266333e-06, "epoch": 4.84, "percentage": 80.67, "elapsed_time": "3:40:28", "remaining_time": "0:52:50"}
{"current_steps": 3030, "total_steps": 3750, "loss": 0.3451, "lr": 4.337701454428322e-06, "epoch": 4.848, "percentage": 80.8, "elapsed_time": "3:40:44", "remaining_time": "0:52:27"}
{"current_steps": 3035, "total_steps": 3750, "loss": 0.3104, "lr": 4.279984358726925e-06, "epoch": 4.856, "percentage": 80.93, "elapsed_time": "3:41:03", "remaining_time": "0:52:04"}
{"current_steps": 3040, "total_steps": 3750, "loss": 0.325, "lr": 4.2226077844093205e-06, "epoch": 4.864, "percentage": 81.07, "elapsed_time": "3:41:19", "remaining_time": "0:51:41"}
{"current_steps": 3045, "total_steps": 3750, "loss": 0.3406, "lr": 4.165572974346435e-06, "epoch": 4.872, "percentage": 81.2, "elapsed_time": "3:41:35", "remaining_time": "0:51:18"}
{"current_steps": 3050, "total_steps": 3750, "loss": 0.3355, "lr": 4.108881164006033e-06, "epoch": 4.88, "percentage": 81.33, "elapsed_time": "3:41:55", "remaining_time": "0:50:55"}
{"current_steps": 3055, "total_steps": 3750, "loss": 0.3505, "lr": 4.05253358142593e-06, "epoch": 4.888, "percentage": 81.47, "elapsed_time": "3:42:11", "remaining_time": "0:50:32"}
{"current_steps": 3060, "total_steps": 3750, "loss": 0.3437, "lr": 3.9965314471874035e-06, "epoch": 4.896, "percentage": 81.6, "elapsed_time": "3:42:29", "remaining_time": "0:50:10"}
{"current_steps": 3065, "total_steps": 3750, "loss": 0.3517, "lr": 3.940875974388749e-06, "epoch": 4.904, "percentage": 81.73, "elapsed_time": "3:42:43", "remaining_time": "0:49:46"}
{"current_steps": 3070, "total_steps": 3750, "loss": 0.3474, "lr": 3.885568368619013e-06, "epoch": 4.912, "percentage": 81.87, "elapsed_time": "3:42:59", "remaining_time": "0:49:23"}
{"current_steps": 3075, "total_steps": 3750, "loss": 0.346, "lr": 3.830609827931877e-06, "epoch": 4.92, "percentage": 82.0, "elapsed_time": "3:43:16", "remaining_time": "0:49:00"}
{"current_steps": 3080, "total_steps": 3750, "loss": 0.3382, "lr": 3.7760015428196694e-06, "epoch": 4.928, "percentage": 82.13, "elapsed_time": "3:43:35", "remaining_time": "0:48:38"}
{"current_steps": 3085, "total_steps": 3750, "loss": 0.3418, "lr": 3.7217446961876413e-06, "epoch": 4.936, "percentage": 82.27, "elapsed_time": "3:43:53", "remaining_time": "0:48:15"}
{"current_steps": 3090, "total_steps": 3750, "loss": 0.3384, "lr": 3.6678404633282826e-06, "epoch": 4.944, "percentage": 82.4, "elapsed_time": "3:44:09", "remaining_time": "0:47:52"}
{"current_steps": 3095, "total_steps": 3750, "loss": 0.3463, "lr": 3.6142900118959158e-06, "epoch": 4.952, "percentage": 82.53, "elapsed_time": "3:44:24", "remaining_time": "0:47:29"}
{"current_steps": 3100, "total_steps": 3750, "loss": 0.3249, "lr": 3.561094501881339e-06, "epoch": 4.96, "percentage": 82.67, "elapsed_time": "3:44:44", "remaining_time": "0:47:07"}
{"current_steps": 3105, "total_steps": 3750, "loss": 0.3571, "lr": 3.5082550855867693e-06, "epoch": 4.968, "percentage": 82.8, "elapsed_time": "3:46:02", "remaining_time": "0:46:57"}
{"current_steps": 3110, "total_steps": 3750, "loss": 0.3519, "lr": 3.455772907600841e-06, "epoch": 4.976, "percentage": 82.93, "elapsed_time": "3:46:18", "remaining_time": "0:46:34"}
{"current_steps": 3115, "total_steps": 3750, "loss": 0.3298, "lr": 3.4036491047738075e-06, "epoch": 4.984, "percentage": 83.07, "elapsed_time": "3:46:37", "remaining_time": "0:46:11"}
{"current_steps": 3120, "total_steps": 3750, "loss": 0.3398, "lr": 3.351884806192933e-06, "epoch": 4.992, "percentage": 83.2, "elapsed_time": "3:46:52", "remaining_time": "0:45:48"}
{"current_steps": 3125, "total_steps": 3750, "loss": 0.3541, "lr": 3.3004811331580268e-06, "epoch": 5.0, "percentage": 83.33, "elapsed_time": "3:47:09", "remaining_time": "0:45:25"}
{"current_steps": 3130, "total_steps": 3750, "loss": 0.3318, "lr": 3.249439199157167e-06, "epoch": 5.008, "percentage": 83.47, "elapsed_time": "3:47:26", "remaining_time": "0:45:03"}
{"current_steps": 3135, "total_steps": 3750, "loss": 0.3418, "lr": 3.198760109842558e-06, "epoch": 5.016, "percentage": 83.6, "elapsed_time": "3:47:43", "remaining_time": "0:44:40"}
{"current_steps": 3140, "total_steps": 3750, "loss": 0.3523, "lr": 3.1484449630065894e-06, "epoch": 5.024, "percentage": 83.73, "elapsed_time": "3:48:03", "remaining_time": "0:44:18"}
{"current_steps": 3145, "total_steps": 3750, "loss": 0.3208, "lr": 3.0984948485580736e-06, "epoch": 5.032, "percentage": 83.87, "elapsed_time": "3:48:21", "remaining_time": "0:43:55"}
{"current_steps": 3150, "total_steps": 3750, "loss": 0.3195, "lr": 3.048910848498605e-06, "epoch": 5.04, "percentage": 84.0, "elapsed_time": "3:48:38", "remaining_time": "0:43:33"}
{"current_steps": 3155, "total_steps": 3750, "loss": 0.3182, "lr": 2.9996940368991477e-06, "epoch": 5.048, "percentage": 84.13, "elapsed_time": "3:48:55", "remaining_time": "0:43:10"}
{"current_steps": 3160, "total_steps": 3750, "loss": 0.335, "lr": 2.9508454798767516e-06, "epoch": 5.056, "percentage": 84.27, "elapsed_time": "3:49:12", "remaining_time": "0:42:47"}
{"current_steps": 3165, "total_steps": 3750, "loss": 0.322, "lr": 2.9023662355714766e-06, "epoch": 5.064, "percentage": 84.4, "elapsed_time": "3:49:29", "remaining_time": "0:42:25"}
{"current_steps": 3170, "total_steps": 3750, "loss": 0.3494, "lr": 2.8542573541234707e-06, "epoch": 5.072, "percentage": 84.53, "elapsed_time": "3:49:46", "remaining_time": "0:42:02"}
{"current_steps": 3175, "total_steps": 3750, "loss": 0.3435, "lr": 2.80651987765018e-06, "epoch": 5.08, "percentage": 84.67, "elapsed_time": "3:50:03", "remaining_time": "0:41:39"}
{"current_steps": 3180, "total_steps": 3750, "loss": 0.318, "lr": 2.759154840223843e-06, "epoch": 5.088, "percentage": 84.8, "elapsed_time": "3:50:20", "remaining_time": "0:41:17"}
{"current_steps": 3185, "total_steps": 3750, "loss": 0.3382, "lr": 2.7121632678490327e-06, "epoch": 5.096, "percentage": 84.93, "elapsed_time": "3:50:38", "remaining_time": "0:40:54"}
{"current_steps": 3190, "total_steps": 3750, "loss": 0.325, "lr": 2.6655461784404768e-06, "epoch": 5.104, "percentage": 85.07, "elapsed_time": "3:50:57", "remaining_time": "0:40:32"}
{"current_steps": 3195, "total_steps": 3750, "loss": 0.3231, "lr": 2.6193045818009654e-06, "epoch": 5.112, "percentage": 85.2, "elapsed_time": "3:51:15", "remaining_time": "0:40:10"}
{"current_steps": 3200, "total_steps": 3750, "loss": 0.3169, "lr": 2.5734394795995066e-06, "epoch": 5.12, "percentage": 85.33, "elapsed_time": "3:51:32", "remaining_time": "0:39:47"}
{"current_steps": 3205, "total_steps": 3750, "loss": 0.3427, "lr": 2.5279518653496272e-06, "epoch": 5.128, "percentage": 85.47, "elapsed_time": "3:52:48", "remaining_time": "0:39:35"}
{"current_steps": 3210, "total_steps": 3750, "loss": 0.3258, "lr": 2.4828427243878307e-06, "epoch": 5.136, "percentage": 85.6, "elapsed_time": "3:53:05", "remaining_time": "0:39:12"}
{"current_steps": 3215, "total_steps": 3750, "loss": 0.3112, "lr": 2.4381130338522762e-06, "epoch": 5.144, "percentage": 85.73, "elapsed_time": "3:53:22", "remaining_time": "0:38:50"}
{"current_steps": 3220, "total_steps": 3750, "loss": 0.3527, "lr": 2.393763762661596e-06, "epoch": 5.152, "percentage": 85.87, "elapsed_time": "3:53:42", "remaining_time": "0:38:28"}
{"current_steps": 3225, "total_steps": 3750, "loss": 0.313, "lr": 2.349795871493925e-06, "epoch": 5.16, "percentage": 86.0, "elapsed_time": "3:53:59", "remaining_time": "0:38:05"}
{"current_steps": 3230, "total_steps": 3750, "loss": 0.343, "lr": 2.3062103127660686e-06, "epoch": 5.168, "percentage": 86.13, "elapsed_time": "3:54:15", "remaining_time": "0:37:42"}
{"current_steps": 3235, "total_steps": 3750, "loss": 0.3361, "lr": 2.2630080306128833e-06, "epoch": 5.176, "percentage": 86.27, "elapsed_time": "3:54:35", "remaining_time": "0:37:20"}
{"current_steps": 3240, "total_steps": 3750, "loss": 0.3201, "lr": 2.2201899608668365e-06, "epoch": 5.184, "percentage": 86.4, "elapsed_time": "3:54:56", "remaining_time": "0:36:58"}
{"current_steps": 3245, "total_steps": 3750, "loss": 0.3604, "lr": 2.1777570310377084e-06, "epoch": 5.192, "percentage": 86.53, "elapsed_time": "3:55:13", "remaining_time": "0:36:36"}
{"current_steps": 3250, "total_steps": 3750, "loss": 0.3304, "lr": 2.1357101602925323e-06, "epoch": 5.2, "percentage": 86.67, "elapsed_time": "3:55:29", "remaining_time": "0:36:13"}
{"current_steps": 3255, "total_steps": 3750, "loss": 0.3424, "lr": 2.0940502594356427e-06, "epoch": 5.208, "percentage": 86.8, "elapsed_time": "3:55:46", "remaining_time": "0:35:51"}
{"current_steps": 3260, "total_steps": 3750, "loss": 0.3176, "lr": 2.052778230888994e-06, "epoch": 5.216, "percentage": 86.93, "elapsed_time": "3:56:06", "remaining_time": "0:35:29"}
{"current_steps": 3265, "total_steps": 3750, "loss": 0.325, "lr": 2.0118949686725786e-06, "epoch": 5.224, "percentage": 87.07, "elapsed_time": "3:56:21", "remaining_time": "0:35:06"}
{"current_steps": 3270, "total_steps": 3750, "loss": 0.3163, "lr": 1.971401358385072e-06, "epoch": 5.232, "percentage": 87.2, "elapsed_time": "3:56:42", "remaining_time": "0:34:44"}
{"current_steps": 3275, "total_steps": 3750, "loss": 0.3234, "lr": 1.9312982771846435e-06, "epoch": 5.24, "percentage": 87.33, "elapsed_time": "3:57:00", "remaining_time": "0:34:22"}
{"current_steps": 3280, "total_steps": 3750, "loss": 0.3396, "lr": 1.8915865937699652e-06, "epoch": 5.248, "percentage": 87.47, "elapsed_time": "3:57:18", "remaining_time": "0:34:00"}
{"current_steps": 3285, "total_steps": 3750, "loss": 0.3384, "lr": 1.8522671683613946e-06, "epoch": 5.256, "percentage": 87.6, "elapsed_time": "3:57:35", "remaining_time": "0:33:37"}
{"current_steps": 3290, "total_steps": 3750, "loss": 0.3374, "lr": 1.8133408526823283e-06, "epoch": 5.264, "percentage": 87.73, "elapsed_time": "3:57:52", "remaining_time": "0:33:15"}
{"current_steps": 3295, "total_steps": 3750, "loss": 0.3275, "lr": 1.7748084899407558e-06, "epoch": 5.272, "percentage": 87.87, "elapsed_time": "3:58:10", "remaining_time": "0:32:53"}
{"current_steps": 3300, "total_steps": 3750, "loss": 0.3439, "lr": 1.7366709148110118e-06, "epoch": 5.28, "percentage": 88.0, "elapsed_time": "3:58:29", "remaining_time": "0:32:31"}
{"current_steps": 3305, "total_steps": 3750, "loss": 0.3228, "lr": 1.698928953415675e-06, "epoch": 5.288, "percentage": 88.13, "elapsed_time": "3:59:43", "remaining_time": "0:32:16"}
{"current_steps": 3310, "total_steps": 3750, "loss": 0.3281, "lr": 1.6615834233076756e-06, "epoch": 5.296, "percentage": 88.27, "elapsed_time": "4:00:02", "remaining_time": "0:31:54"}
{"current_steps": 3315, "total_steps": 3750, "loss": 0.3411, "lr": 1.6246351334525944e-06, "epoch": 5.304, "percentage": 88.4, "elapsed_time": "4:00:18", "remaining_time": "0:31:32"}
{"current_steps": 3320, "total_steps": 3750, "loss": 0.3246, "lr": 1.5880848842111362e-06, "epoch": 5.312, "percentage": 88.53, "elapsed_time": "4:00:36", "remaining_time": "0:31:09"}
{"current_steps": 3325, "total_steps": 3750, "loss": 0.3429, "lr": 1.5519334673218023e-06, "epoch": 5.32, "percentage": 88.67, "elapsed_time": "4:00:53", "remaining_time": "0:30:47"}
{"current_steps": 3330, "total_steps": 3750, "loss": 0.3289, "lr": 1.5161816658837002e-06, "epoch": 5.328, "percentage": 88.8, "elapsed_time": "4:01:08", "remaining_time": "0:30:24"}
{"current_steps": 3335, "total_steps": 3750, "loss": 0.3307, "lr": 1.4808302543396423e-06, "epoch": 5.336, "percentage": 88.93, "elapsed_time": "4:01:29", "remaining_time": "0:30:03"}
{"current_steps": 3340, "total_steps": 3750, "loss": 0.3205, "lr": 1.445879998459314e-06, "epoch": 5.344, "percentage": 89.07, "elapsed_time": "4:01:51", "remaining_time": "0:29:41"}
{"current_steps": 3345, "total_steps": 3750, "loss": 0.3384, "lr": 1.4113316553227296e-06, "epoch": 5.352, "percentage": 89.2, "elapsed_time": "4:02:06", "remaining_time": "0:29:18"}
{"current_steps": 3350, "total_steps": 3750, "loss": 0.3316, "lr": 1.3771859733037896e-06, "epoch": 5.36, "percentage": 89.33, "elapsed_time": "4:02:22", "remaining_time": "0:28:56"}
{"current_steps": 3355, "total_steps": 3750, "loss": 0.3532, "lr": 1.3434436920541072e-06, "epoch": 5.368, "percentage": 89.47, "elapsed_time": "4:02:41", "remaining_time": "0:28:34"}
{"current_steps": 3360, "total_steps": 3750, "loss": 0.3253, "lr": 1.3101055424869768e-06, "epoch": 5.376, "percentage": 89.6, "elapsed_time": "4:03:03", "remaining_time": "0:28:12"}
{"current_steps": 3365, "total_steps": 3750, "loss": 0.3361, "lr": 1.2771722467615266e-06, "epoch": 5.384, "percentage": 89.73, "elapsed_time": "4:03:19", "remaining_time": "0:27:50"}
{"current_steps": 3370, "total_steps": 3750, "loss": 0.3231, "lr": 1.2446445182670818e-06, "epoch": 5.392, "percentage": 89.87, "elapsed_time": "4:03:35", "remaining_time": "0:27:28"}
{"current_steps": 3375, "total_steps": 3750, "loss": 0.3273, "lr": 1.21252306160772e-06, "epoch": 5.4, "percentage": 90.0, "elapsed_time": "4:03:55", "remaining_time": "0:27:06"}
{"current_steps": 3380, "total_steps": 3750, "loss": 0.3374, "lr": 1.1808085725870088e-06, "epoch": 5.408, "percentage": 90.13, "elapsed_time": "4:04:13", "remaining_time": "0:26:44"}
{"current_steps": 3385, "total_steps": 3750, "loss": 0.3348, "lr": 1.1495017381929197e-06, "epoch": 5.416, "percentage": 90.27, "elapsed_time": "4:04:31", "remaining_time": "0:26:22"}
{"current_steps": 3390, "total_steps": 3750, "loss": 0.3141, "lr": 1.1186032365829514e-06, "epoch": 5.424, "percentage": 90.4, "elapsed_time": "4:04:53", "remaining_time": "0:26:00"}
{"current_steps": 3395, "total_steps": 3750, "loss": 0.3457, "lr": 1.088113737069456e-06, "epoch": 5.432, "percentage": 90.53, "elapsed_time": "4:05:09", "remaining_time": "0:25:38"}
{"current_steps": 3400, "total_steps": 3750, "loss": 0.3361, "lr": 1.0580339001051153e-06, "epoch": 5.44, "percentage": 90.67, "elapsed_time": "4:05:24", "remaining_time": "0:25:15"}
{"current_steps": 3405, "total_steps": 3750, "loss": 0.3331, "lr": 1.0283643772686535e-06, "epoch": 5.448, "percentage": 90.8, "elapsed_time": "4:06:38", "remaining_time": "0:24:59"}
{"current_steps": 3410, "total_steps": 3750, "loss": 0.3285, "lr": 9.991058112507113e-07, "epoch": 5.456, "percentage": 90.93, "elapsed_time": "4:06:56", "remaining_time": "0:24:37"}
{"current_steps": 3415, "total_steps": 3750, "loss": 0.3383, "lr": 9.702588358399345e-07, "epoch": 5.464, "percentage": 91.07, "elapsed_time": "4:07:15", "remaining_time": "0:24:15"}
{"current_steps": 3420, "total_steps": 3750, "loss": 0.3292, "lr": 9.418240759092434e-07, "epoch": 5.4719999999999995, "percentage": 91.2, "elapsed_time": "4:07:34", "remaining_time": "0:23:53"}
{"current_steps": 3425, "total_steps": 3750, "loss": 0.3233, "lr": 9.138021474022763e-07, "epoch": 5.48, "percentage": 91.33, "elapsed_time": "4:07:52", "remaining_time": "0:23:31"}
{"current_steps": 3430, "total_steps": 3750, "loss": 0.3402, "lr": 8.861936573200825e-07, "epoch": 5.4879999999999995, "percentage": 91.47, "elapsed_time": "4:08:11", "remaining_time": "0:23:09"}
{"current_steps": 3435, "total_steps": 3750, "loss": 0.329, "lr": 8.58999203707942e-07, "epoch": 5.496, "percentage": 91.6, "elapsed_time": "4:08:27", "remaining_time": "0:22:47"}
{"current_steps": 3440, "total_steps": 3750, "loss": 0.322, "lr": 8.322193756424401e-07, "epoch": 5.504, "percentage": 91.73, "elapsed_time": "4:08:48", "remaining_time": "0:22:25"}
{"current_steps": 3445, "total_steps": 3750, "loss": 0.3221, "lr": 8.058547532186667e-07, "epoch": 5.5120000000000005, "percentage": 91.87, "elapsed_time": "4:09:08", "remaining_time": "0:22:03"}
{"current_steps": 3450, "total_steps": 3750, "loss": 0.3226, "lr": 7.799059075376991e-07, "epoch": 5.52, "percentage": 92.0, "elapsed_time": "4:09:26", "remaining_time": "0:21:41"}
{"current_steps": 3455, "total_steps": 3750, "loss": 0.3234, "lr": 7.54373400694195e-07, "epoch": 5.5280000000000005, "percentage": 92.13, "elapsed_time": "4:09:43", "remaining_time": "0:21:19"}
{"current_steps": 3460, "total_steps": 3750, "loss": 0.3306, "lr": 7.292577857642302e-07, "epoch": 5.536, "percentage": 92.27, "elapsed_time": "4:10:01", "remaining_time": "0:20:57"}
{"current_steps": 3465, "total_steps": 3750, "loss": 0.3287, "lr": 7.045596067933158e-07, "epoch": 5.5440000000000005, "percentage": 92.4, "elapsed_time": "4:10:19", "remaining_time": "0:20:35"}
{"current_steps": 3470, "total_steps": 3750, "loss": 0.3311, "lr": 6.80279398784609e-07, "epoch": 5.552, "percentage": 92.53, "elapsed_time": "4:10:35", "remaining_time": "0:20:13"}
{"current_steps": 3475, "total_steps": 3750, "loss": 0.3301, "lr": 6.56417687687343e-07, "epoch": 5.5600000000000005, "percentage": 92.67, "elapsed_time": "4:10:52", "remaining_time": "0:19:51"}
{"current_steps": 3480, "total_steps": 3750, "loss": 0.3111, "lr": 6.329749903854066e-07, "epoch": 5.568, "percentage": 92.8, "elapsed_time": "4:11:14", "remaining_time": "0:19:29"}
{"current_steps": 3485, "total_steps": 3750, "loss": 0.3338, "lr": 6.099518146861628e-07, "epoch": 5.576, "percentage": 92.93, "elapsed_time": "4:11:31", "remaining_time": "0:19:07"}
{"current_steps": 3490, "total_steps": 3750, "loss": 0.3387, "lr": 5.873486593094546e-07, "epoch": 5.584, "percentage": 93.07, "elapsed_time": "4:11:47", "remaining_time": "0:18:45"}
{"current_steps": 3495, "total_steps": 3750, "loss": 0.3262, "lr": 5.651660138767834e-07, "epoch": 5.592, "percentage": 93.2, "elapsed_time": "4:12:06", "remaining_time": "0:18:23"}
{"current_steps": 3500, "total_steps": 3750, "loss": 0.3262, "lr": 5.434043589007232e-07, "epoch": 5.6, "percentage": 93.33, "elapsed_time": "4:12:23", "remaining_time": "0:18:01"}
{"current_steps": 3505, "total_steps": 3750, "loss": 0.3128, "lr": 5.220641657744963e-07, "epoch": 5.608, "percentage": 93.47, "elapsed_time": "4:13:42", "remaining_time": "0:17:44"}
{"current_steps": 3510, "total_steps": 3750, "loss": 0.3318, "lr": 5.0114589676177e-07, "epoch": 5.616, "percentage": 93.6, "elapsed_time": "4:14:01", "remaining_time": "0:17:22"}
{"current_steps": 3515, "total_steps": 3750, "loss": 0.3355, "lr": 4.806500049866492e-07, "epoch": 5.624, "percentage": 93.73, "elapsed_time": "4:14:19", "remaining_time": "0:17:00"}
{"current_steps": 3520, "total_steps": 3750, "loss": 0.3165, "lr": 4.6057693442383756e-07, "epoch": 5.632, "percentage": 93.87, "elapsed_time": "4:14:37", "remaining_time": "0:16:38"}
{"current_steps": 3525, "total_steps": 3750, "loss": 0.324, "lr": 4.409271198890519e-07, "epoch": 5.64, "percentage": 94.0, "elapsed_time": "4:14:54", "remaining_time": "0:16:16"}
{"current_steps": 3530, "total_steps": 3750, "loss": 0.3437, "lr": 4.217009870295763e-07, "epoch": 5.648, "percentage": 94.13, "elapsed_time": "4:15:12", "remaining_time": "0:15:54"}
{"current_steps": 3535, "total_steps": 3750, "loss": 0.3166, "lr": 4.028989523150628e-07, "epoch": 5.656, "percentage": 94.27, "elapsed_time": "4:15:32", "remaining_time": "0:15:32"}
{"current_steps": 3540, "total_steps": 3750, "loss": 0.3266, "lr": 3.8452142302849216e-07, "epoch": 5.664, "percentage": 94.4, "elapsed_time": "4:15:48", "remaining_time": "0:15:10"}
{"current_steps": 3545, "total_steps": 3750, "loss": 0.3379, "lr": 3.665687972573606e-07, "epoch": 5.672, "percentage": 94.53, "elapsed_time": "4:16:06", "remaining_time": "0:14:48"}
{"current_steps": 3550, "total_steps": 3750, "loss": 0.3226, "lr": 3.4904146388506475e-07, "epoch": 5.68, "percentage": 94.67, "elapsed_time": "4:16:23", "remaining_time": "0:14:26"}
{"current_steps": 3555, "total_steps": 3750, "loss": 0.326, "lr": 3.319398025824572e-07, "epoch": 5.688, "percentage": 94.8, "elapsed_time": "4:16:39", "remaining_time": "0:14:04"}
{"current_steps": 3560, "total_steps": 3750, "loss": 0.3314, "lr": 3.152641837996373e-07, "epoch": 5.696, "percentage": 94.93, "elapsed_time": "4:16:54", "remaining_time": "0:13:42"}
{"current_steps": 3565, "total_steps": 3750, "loss": 0.335, "lr": 2.990149687579247e-07, "epoch": 5.704, "percentage": 95.07, "elapsed_time": "4:17:12", "remaining_time": "0:13:20"}
{"current_steps": 3570, "total_steps": 3750, "loss": 0.3357, "lr": 2.8319250944203625e-07, "epoch": 5.712, "percentage": 95.2, "elapsed_time": "4:17:28", "remaining_time": "0:12:58"}
{"current_steps": 3575, "total_steps": 3750, "loss": 0.3269, "lr": 2.677971485924502e-07, "epoch": 5.72, "percentage": 95.33, "elapsed_time": "4:17:43", "remaining_time": "0:12:36"}
{"current_steps": 3580, "total_steps": 3750, "loss": 0.3039, "lr": 2.52829219697992e-07, "epoch": 5.728, "percentage": 95.47, "elapsed_time": "4:18:00", "remaining_time": "0:12:15"}
{"current_steps": 3585, "total_steps": 3750, "loss": 0.3188, "lr": 2.3828904698861565e-07, "epoch": 5.736, "percentage": 95.6, "elapsed_time": "4:18:17", "remaining_time": "0:11:53"}
{"current_steps": 3590, "total_steps": 3750, "loss": 0.3468, "lr": 2.2417694542836489e-07, "epoch": 5.744, "percentage": 95.73, "elapsed_time": "4:18:36", "remaining_time": "0:11:31"}
{"current_steps": 3595, "total_steps": 3750, "loss": 0.3187, "lr": 2.104932207085586e-07, "epoch": 5.752, "percentage": 95.87, "elapsed_time": "4:18:55", "remaining_time": "0:11:09"}
{"current_steps": 3600, "total_steps": 3750, "loss": 0.3364, "lr": 1.97238169241174e-07, "epoch": 5.76, "percentage": 96.0, "elapsed_time": "4:19:14", "remaining_time": "0:10:48"}
{"current_steps": 3605, "total_steps": 3750, "loss": 0.3186, "lr": 1.8441207815241613e-07, "epoch": 5.768, "percentage": 96.13, "elapsed_time": "4:20:29", "remaining_time": "0:10:28"}
{"current_steps": 3610, "total_steps": 3750, "loss": 0.3252, "lr": 1.720152252765095e-07, "epoch": 5.776, "percentage": 96.27, "elapsed_time": "4:20:47", "remaining_time": "0:10:06"}
{"current_steps": 3615, "total_steps": 3750, "loss": 0.3178, "lr": 1.600478791496629e-07, "epoch": 5.784, "percentage": 96.4, "elapsed_time": "4:21:07", "remaining_time": "0:09:45"}
{"current_steps": 3620, "total_steps": 3750, "loss": 0.3064, "lr": 1.4851029900427415e-07, "epoch": 5.792, "percentage": 96.53, "elapsed_time": "4:21:27", "remaining_time": "0:09:23"}
{"current_steps": 3625, "total_steps": 3750, "loss": 0.3158, "lr": 1.3740273476329224e-07, "epoch": 5.8, "percentage": 96.67, "elapsed_time": "4:21:43", "remaining_time": "0:09:01"}
{"current_steps": 3630, "total_steps": 3750, "loss": 0.3332, "lr": 1.2672542703482616e-07, "epoch": 5.808, "percentage": 96.8, "elapsed_time": "4:22:02", "remaining_time": "0:08:39"}
{"current_steps": 3635, "total_steps": 3750, "loss": 0.3257, "lr": 1.164786071069135e-07, "epoch": 5.816, "percentage": 96.93, "elapsed_time": "4:22:18", "remaining_time": "0:08:17"}
{"current_steps": 3640, "total_steps": 3750, "loss": 0.3336, "lr": 1.0666249694251785e-07, "epoch": 5.824, "percentage": 97.07, "elapsed_time": "4:22:34", "remaining_time": "0:07:56"}
{"current_steps": 3645, "total_steps": 3750, "loss": 0.3174, "lr": 9.72773091747281e-08, "epoch": 5.832, "percentage": 97.2, "elapsed_time": "4:22:53", "remaining_time": "0:07:34"}
{"current_steps": 3650, "total_steps": 3750, "loss": 0.3382, "lr": 8.832324710214002e-08, "epoch": 5.84, "percentage": 97.33, "elapsed_time": "4:23:11", "remaining_time": "0:07:12"}
{"current_steps": 3655, "total_steps": 3750, "loss": 0.336, "lr": 7.980050468445744e-08, "epoch": 5.848, "percentage": 97.47, "elapsed_time": "4:23:30", "remaining_time": "0:06:50"}
{"current_steps": 3660, "total_steps": 3750, "loss": 0.3574, "lr": 7.170926653829347e-08, "epoch": 5.856, "percentage": 97.6, "elapsed_time": "4:23:47", "remaining_time": "0:06:29"}
{"current_steps": 3665, "total_steps": 3750, "loss": 0.3261, "lr": 6.404970793317145e-08, "epoch": 5.864, "percentage": 97.73, "elapsed_time": "4:24:04", "remaining_time": "0:06:07"}
{"current_steps": 3670, "total_steps": 3750, "loss": 0.3331, "lr": 5.682199478772133e-08, "epoch": 5.872, "percentage": 97.87, "elapsed_time": "4:24:20", "remaining_time": "0:05:45"}
{"current_steps": 3675, "total_steps": 3750, "loss": 0.3309, "lr": 5.0026283666093635e-08, "epoch": 5.88, "percentage": 98.0, "elapsed_time": "4:24:37", "remaining_time": "0:05:24"}
{"current_steps": 3680, "total_steps": 3750, "loss": 0.332, "lr": 4.366272177456665e-08, "epoch": 5.888, "percentage": 98.13, "elapsed_time": "4:24:57", "remaining_time": "0:05:02"}
{"current_steps": 3685, "total_steps": 3750, "loss": 0.3028, "lr": 3.773144695834674e-08, "epoch": 5.896, "percentage": 98.27, "elapsed_time": "4:25:15", "remaining_time": "0:04:40"}
{"current_steps": 3690, "total_steps": 3750, "loss": 0.3259, "lr": 3.223258769860405e-08, "epoch": 5.904, "percentage": 98.4, "elapsed_time": "4:25:33", "remaining_time": "0:04:19"}
{"current_steps": 3695, "total_steps": 3750, "loss": 0.3296, "lr": 2.716626310966808e-08, "epoch": 5.912, "percentage": 98.53, "elapsed_time": "4:25:52", "remaining_time": "0:03:57"}
{"current_steps": 3700, "total_steps": 3750, "loss": 0.3219, "lr": 2.253258293645866e-08, "epoch": 5.92, "percentage": 98.67, "elapsed_time": "4:26:12", "remaining_time": "0:03:35"}
{"current_steps": 3705, "total_steps": 3750, "loss": 0.3286, "lr": 1.8331647552110033e-08, "epoch": 5.928, "percentage": 98.8, "elapsed_time": "4:27:32", "remaining_time": "0:03:14"}
{"current_steps": 3710, "total_steps": 3750, "loss": 0.3228, "lr": 1.456354795578374e-08, "epoch": 5.936, "percentage": 98.93, "elapsed_time": "4:27:49", "remaining_time": "0:02:53"}
{"current_steps": 3715, "total_steps": 3750, "loss": 0.346, "lr": 1.1228365770714622e-08, "epoch": 5.944, "percentage": 99.07, "elapsed_time": "4:28:07", "remaining_time": "0:02:31"}
{"current_steps": 3720, "total_steps": 3750, "loss": 0.337, "lr": 8.326173242432233e-09, "epoch": 5.952, "percentage": 99.2, "elapsed_time": "4:28:23", "remaining_time": "0:02:09"}
{"current_steps": 3725, "total_steps": 3750, "loss": 0.3268, "lr": 5.857033237199883e-09, "epoch": 5.96, "percentage": 99.33, "elapsed_time": "4:28:41", "remaining_time": "0:01:48"}
{"current_steps": 3730, "total_steps": 3750, "loss": 0.326, "lr": 3.820999240644608e-09, "epoch": 5.968, "percentage": 99.47, "elapsed_time": "4:28:56", "remaining_time": "0:01:26"}
{"current_steps": 3735, "total_steps": 3750, "loss": 0.3276, "lr": 2.2181153566158687e-09, "epoch": 5.976, "percentage": 99.6, "elapsed_time": "4:29:15", "remaining_time": "0:01:04"}
{"current_steps": 3740, "total_steps": 3750, "loss": 0.3181, "lr": 1.0484163062107755e-09, "epoch": 5.984, "percentage": 99.73, "elapsed_time": "4:29:31", "remaining_time": "0:00:43"}
{"current_steps": 3745, "total_steps": 3750, "loss": 0.3225, "lr": 3.11927427034675e-10, "epoch": 5.992, "percentage": 99.87, "elapsed_time": "4:29:49", "remaining_time": "0:00:21"}
{"current_steps": 3750, "total_steps": 3750, "loss": 0.3141, "lr": 8.664672648261985e-12, "epoch": 6.0, "percentage": 100.0, "elapsed_time": "4:30:06", "remaining_time": "0:00:00"}
{"current_steps": 3750, "total_steps": 3750, "epoch": 6.0, "percentage": 100.0, "elapsed_time": "4:31:12", "remaining_time": "0:00:00"}