full_sft_v0.4_args / trainer_log.jsonl
yueqis's picture
Upload trainer_log.jsonl with huggingface_hub
a06b423 verified
{"current_steps": 10, "total_steps": 2470, "loss": 0.8275, "lr": 7.258064516129033e-07, "epoch": 0.004048582995951417, "percentage": 0.4, "elapsed_time": "0:03:18", "remaining_time": "13:31:55"}
{"current_steps": 20, "total_steps": 2470, "loss": 0.7256, "lr": 1.5322580645161292e-06, "epoch": 0.008097165991902834, "percentage": 0.81, "elapsed_time": "0:05:41", "remaining_time": "11:37:54"}
{"current_steps": 30, "total_steps": 2470, "loss": 0.5483, "lr": 2.338709677419355e-06, "epoch": 0.012145748987854251, "percentage": 1.21, "elapsed_time": "0:08:22", "remaining_time": "11:21:41"}
{"current_steps": 40, "total_steps": 2470, "loss": 0.5483, "lr": 3.145161290322581e-06, "epoch": 0.016194331983805668, "percentage": 1.62, "elapsed_time": "0:11:09", "remaining_time": "11:17:27"}
{"current_steps": 50, "total_steps": 2470, "loss": 0.4507, "lr": 3.951612903225807e-06, "epoch": 0.020242914979757085, "percentage": 2.02, "elapsed_time": "0:13:29", "remaining_time": "10:52:47"}
{"current_steps": 60, "total_steps": 2470, "loss": 0.5085, "lr": 4.758064516129033e-06, "epoch": 0.024291497975708502, "percentage": 2.43, "elapsed_time": "0:16:39", "remaining_time": "11:09:19"}
{"current_steps": 70, "total_steps": 2470, "loss": 0.5205, "lr": 5.564516129032258e-06, "epoch": 0.02834008097165992, "percentage": 2.83, "elapsed_time": "0:19:11", "remaining_time": "10:58:12"}
{"current_steps": 80, "total_steps": 2470, "loss": 0.4227, "lr": 6.370967741935485e-06, "epoch": 0.032388663967611336, "percentage": 3.24, "elapsed_time": "0:21:45", "remaining_time": "10:50:01"}
{"current_steps": 90, "total_steps": 2470, "loss": 0.4632, "lr": 7.177419354838711e-06, "epoch": 0.03643724696356275, "percentage": 3.64, "elapsed_time": "0:24:32", "remaining_time": "10:49:07"}
{"current_steps": 100, "total_steps": 2470, "loss": 0.3617, "lr": 7.983870967741935e-06, "epoch": 0.04048582995951417, "percentage": 4.05, "elapsed_time": "0:26:57", "remaining_time": "10:39:05"}
{"current_steps": 110, "total_steps": 2470, "loss": 0.401, "lr": 8.790322580645163e-06, "epoch": 0.044534412955465584, "percentage": 4.45, "elapsed_time": "0:29:57", "remaining_time": "10:42:38"}
{"current_steps": 120, "total_steps": 2470, "loss": 0.4275, "lr": 9.596774193548389e-06, "epoch": 0.048582995951417005, "percentage": 4.86, "elapsed_time": "0:32:17", "remaining_time": "10:32:14"}
{"current_steps": 130, "total_steps": 2470, "loss": 0.3987, "lr": 9.999887921547818e-06, "epoch": 0.05263157894736842, "percentage": 5.26, "elapsed_time": "0:35:02", "remaining_time": "10:30:53"}
{"current_steps": 140, "total_steps": 2470, "loss": 0.4308, "lr": 9.998991324077906e-06, "epoch": 0.05668016194331984, "percentage": 5.67, "elapsed_time": "0:37:49", "remaining_time": "10:29:38"}
{"current_steps": 150, "total_steps": 2470, "loss": 0.3664, "lr": 9.997198289919097e-06, "epoch": 0.06072874493927125, "percentage": 6.07, "elapsed_time": "0:40:07", "remaining_time": "10:20:33"}
{"current_steps": 160, "total_steps": 2470, "loss": 0.367, "lr": 9.994509140604573e-06, "epoch": 0.06477732793522267, "percentage": 6.48, "elapsed_time": "0:43:00", "remaining_time": "10:20:54"}
{"current_steps": 170, "total_steps": 2470, "loss": 0.4213, "lr": 9.990924358362037e-06, "epoch": 0.06882591093117409, "percentage": 6.88, "elapsed_time": "0:45:26", "remaining_time": "10:14:45"}
{"current_steps": 180, "total_steps": 2470, "loss": 0.3967, "lr": 9.986444586027236e-06, "epoch": 0.0728744939271255, "percentage": 7.29, "elapsed_time": "0:48:05", "remaining_time": "10:11:52"}
{"current_steps": 190, "total_steps": 2470, "loss": 0.394, "lr": 9.981070626928688e-06, "epoch": 0.07692307692307693, "percentage": 7.69, "elapsed_time": "0:50:47", "remaining_time": "10:09:28"}
{"current_steps": 200, "total_steps": 2470, "loss": 0.4059, "lr": 9.974803444743617e-06, "epoch": 0.08097165991902834, "percentage": 8.1, "elapsed_time": "0:53:08", "remaining_time": "10:03:12"}
{"current_steps": 210, "total_steps": 2470, "loss": 0.4162, "lr": 9.967644163325157e-06, "epoch": 0.08502024291497975, "percentage": 8.5, "elapsed_time": "0:56:06", "remaining_time": "10:03:51"}
{"current_steps": 220, "total_steps": 2470, "loss": 0.4101, "lr": 9.959594066500805e-06, "epoch": 0.08906882591093117, "percentage": 8.91, "elapsed_time": "0:58:30", "remaining_time": "9:58:20"}
{"current_steps": 230, "total_steps": 2470, "loss": 0.3829, "lr": 9.950654597842209e-06, "epoch": 0.0931174089068826, "percentage": 9.31, "elapsed_time": "1:01:04", "remaining_time": "9:54:48"}
{"current_steps": 240, "total_steps": 2470, "loss": 0.412, "lr": 9.940827360406297e-06, "epoch": 0.09716599190283401, "percentage": 9.72, "elapsed_time": "1:03:55", "remaining_time": "9:53:58"}
{"current_steps": 250, "total_steps": 2470, "loss": 0.3582, "lr": 9.93011411644782e-06, "epoch": 0.10121457489878542, "percentage": 10.12, "elapsed_time": "1:06:27", "remaining_time": "9:50:09"}
{"current_steps": 260, "total_steps": 2470, "loss": 0.387, "lr": 9.918516787103322e-06, "epoch": 0.10526315789473684, "percentage": 10.53, "elapsed_time": "1:09:31", "remaining_time": "9:51:00"}
{"current_steps": 270, "total_steps": 2470, "loss": 0.4085, "lr": 9.906037452046655e-06, "epoch": 0.10931174089068826, "percentage": 10.93, "elapsed_time": "1:11:56", "remaining_time": "9:46:15"}
{"current_steps": 280, "total_steps": 2470, "loss": 0.3689, "lr": 9.892678349116026e-06, "epoch": 0.11336032388663968, "percentage": 11.34, "elapsed_time": "1:14:43", "remaining_time": "9:44:23"}
{"current_steps": 290, "total_steps": 2470, "loss": 0.4033, "lr": 9.878441873912712e-06, "epoch": 0.11740890688259109, "percentage": 11.74, "elapsed_time": "1:17:27", "remaining_time": "9:42:18"}
{"current_steps": 300, "total_steps": 2470, "loss": 0.3417, "lr": 9.863330579371469e-06, "epoch": 0.1214574898785425, "percentage": 12.15, "elapsed_time": "1:19:39", "remaining_time": "9:36:12"}
{"current_steps": 310, "total_steps": 2470, "loss": 0.3646, "lr": 9.847347175302728e-06, "epoch": 0.12550607287449392, "percentage": 12.55, "elapsed_time": "1:22:39", "remaining_time": "9:35:57"}
{"current_steps": 320, "total_steps": 2470, "loss": 0.402, "lr": 9.830494527906671e-06, "epoch": 0.12955465587044535, "percentage": 12.96, "elapsed_time": "1:25:01", "remaining_time": "9:31:14"}
{"current_steps": 330, "total_steps": 2470, "loss": 0.361, "lr": 9.812775659259236e-06, "epoch": 0.13360323886639677, "percentage": 13.36, "elapsed_time": "1:27:34", "remaining_time": "9:27:55"}
{"current_steps": 340, "total_steps": 2470, "loss": 0.3861, "lr": 9.794193746770216e-06, "epoch": 0.13765182186234817, "percentage": 13.77, "elapsed_time": "1:30:24", "remaining_time": "9:26:22"}
{"current_steps": 350, "total_steps": 2470, "loss": 0.3589, "lr": 9.77475212261344e-06, "epoch": 0.1417004048582996, "percentage": 14.17, "elapsed_time": "1:32:38", "remaining_time": "9:21:09"}
{"current_steps": 360, "total_steps": 2470, "loss": 0.4093, "lr": 9.754454273129267e-06, "epoch": 0.145748987854251, "percentage": 14.57, "elapsed_time": "1:35:40", "remaining_time": "9:20:48"}
{"current_steps": 370, "total_steps": 2470, "loss": 0.3897, "lr": 9.733303838199387e-06, "epoch": 0.14979757085020243, "percentage": 14.98, "elapsed_time": "1:38:09", "remaining_time": "9:17:08"}
{"current_steps": 380, "total_steps": 2470, "loss": 0.3791, "lr": 9.711304610594104e-06, "epoch": 0.15384615384615385, "percentage": 15.38, "elapsed_time": "1:40:49", "remaining_time": "9:14:34"}
{"current_steps": 390, "total_steps": 2470, "loss": 0.4034, "lr": 9.68846053529221e-06, "epoch": 0.15789473684210525, "percentage": 15.79, "elapsed_time": "1:43:32", "remaining_time": "9:12:10"}
{"current_steps": 400, "total_steps": 2470, "loss": 0.3867, "lr": 9.664775708773554e-06, "epoch": 0.16194331983805668, "percentage": 16.19, "elapsed_time": "1:45:49", "remaining_time": "9:07:39"}
{"current_steps": 410, "total_steps": 2470, "loss": 0.3891, "lr": 9.640254378284447e-06, "epoch": 0.1659919028340081, "percentage": 16.6, "elapsed_time": "1:48:58", "remaining_time": "9:07:31"}
{"current_steps": 420, "total_steps": 2470, "loss": 0.3972, "lr": 9.614900941076036e-06, "epoch": 0.1700404858299595, "percentage": 17.0, "elapsed_time": "1:51:27", "remaining_time": "9:04:00"}
{"current_steps": 430, "total_steps": 2470, "loss": 0.357, "lr": 9.58871994361576e-06, "epoch": 0.17408906882591094, "percentage": 17.41, "elapsed_time": "1:54:05", "remaining_time": "9:01:15"}
{"current_steps": 440, "total_steps": 2470, "loss": 0.3767, "lr": 9.561716080772072e-06, "epoch": 0.17813765182186234, "percentage": 17.81, "elapsed_time": "1:56:47", "remaining_time": "8:58:51"}
{"current_steps": 450, "total_steps": 2470, "loss": 0.3636, "lr": 9.533894194972541e-06, "epoch": 0.18218623481781376, "percentage": 18.22, "elapsed_time": "1:59:08", "remaining_time": "8:54:47"}
{"current_steps": 460, "total_steps": 2470, "loss": 0.379, "lr": 9.505259275335488e-06, "epoch": 0.1862348178137652, "percentage": 18.62, "elapsed_time": "2:02:06", "remaining_time": "8:53:35"}
{"current_steps": 470, "total_steps": 2470, "loss": 0.3398, "lr": 9.475816456775313e-06, "epoch": 0.1902834008097166, "percentage": 19.03, "elapsed_time": "2:04:29", "remaining_time": "8:49:43"}
{"current_steps": 480, "total_steps": 2470, "loss": 0.3348, "lr": 9.44557101908169e-06, "epoch": 0.19433198380566802, "percentage": 19.43, "elapsed_time": "2:07:07", "remaining_time": "8:47:00"}
{"current_steps": 490, "total_steps": 2470, "loss": 0.3666, "lr": 9.41452838597278e-06, "epoch": 0.19838056680161945, "percentage": 19.84, "elapsed_time": "2:10:00", "remaining_time": "8:45:21"}
{"current_steps": 500, "total_steps": 2470, "loss": 0.3947, "lr": 9.382694124122624e-06, "epoch": 0.20242914979757085, "percentage": 20.24, "elapsed_time": "2:12:16", "remaining_time": "8:41:08"}
{"current_steps": 510, "total_steps": 2470, "loss": 0.3838, "lr": 9.350073942162911e-06, "epoch": 0.20647773279352227, "percentage": 20.65, "elapsed_time": "2:18:30", "remaining_time": "8:52:18"}
{"current_steps": 520, "total_steps": 2470, "loss": 0.3967, "lr": 9.316673689659285e-06, "epoch": 0.21052631578947367, "percentage": 21.05, "elapsed_time": "2:20:52", "remaining_time": "8:48:18"}
{"current_steps": 530, "total_steps": 2470, "loss": 0.3461, "lr": 9.282499356062385e-06, "epoch": 0.2145748987854251, "percentage": 21.46, "elapsed_time": "2:23:43", "remaining_time": "8:46:06"}
{"current_steps": 540, "total_steps": 2470, "loss": 0.4016, "lr": 9.247557069633784e-06, "epoch": 0.21862348178137653, "percentage": 21.86, "elapsed_time": "2:26:31", "remaining_time": "8:43:40"}
{"current_steps": 550, "total_steps": 2470, "loss": 0.3532, "lr": 9.211853096347059e-06, "epoch": 0.22267206477732793, "percentage": 22.27, "elapsed_time": "2:28:48", "remaining_time": "8:39:30"}
{"current_steps": 560, "total_steps": 2470, "loss": 0.3521, "lr": 9.175393838764153e-06, "epoch": 0.22672064777327935, "percentage": 22.67, "elapsed_time": "2:31:52", "remaining_time": "8:38:00"}
{"current_steps": 570, "total_steps": 2470, "loss": 0.3887, "lr": 9.138185834887241e-06, "epoch": 0.23076923076923078, "percentage": 23.08, "elapsed_time": "2:34:15", "remaining_time": "8:34:11"}
{"current_steps": 580, "total_steps": 2470, "loss": 0.4027, "lr": 9.100235756986312e-06, "epoch": 0.23481781376518218, "percentage": 23.48, "elapsed_time": "2:37:00", "remaining_time": "8:31:37"}
{"current_steps": 590, "total_steps": 2470, "loss": 0.3744, "lr": 9.061550410402677e-06, "epoch": 0.2388663967611336, "percentage": 23.89, "elapsed_time": "2:39:37", "remaining_time": "8:28:37"}
{"current_steps": 600, "total_steps": 2470, "loss": 0.3713, "lr": 9.022136732328618e-06, "epoch": 0.242914979757085, "percentage": 24.29, "elapsed_time": "2:41:49", "remaining_time": "8:24:19"}
{"current_steps": 610, "total_steps": 2470, "loss": 0.3554, "lr": 8.982001790563364e-06, "epoch": 0.24696356275303644, "percentage": 24.7, "elapsed_time": "2:44:48", "remaining_time": "8:22:32"}
{"current_steps": 620, "total_steps": 2470, "loss": 0.3473, "lr": 8.9411527822457e-06, "epoch": 0.25101214574898784, "percentage": 25.1, "elapsed_time": "2:47:15", "remaining_time": "8:19:04"}
{"current_steps": 630, "total_steps": 2470, "loss": 0.3743, "lr": 8.899597032563318e-06, "epoch": 0.2550607287449393, "percentage": 25.51, "elapsed_time": "2:49:50", "remaining_time": "8:16:02"}
{"current_steps": 640, "total_steps": 2470, "loss": 0.3655, "lr": 8.857341993439273e-06, "epoch": 0.2591093117408907, "percentage": 25.91, "elapsed_time": "2:52:33", "remaining_time": "8:13:24"}
{"current_steps": 650, "total_steps": 2470, "loss": 0.3423, "lr": 8.814395242195642e-06, "epoch": 0.2631578947368421, "percentage": 26.32, "elapsed_time": "2:54:44", "remaining_time": "8:09:17"}
{"current_steps": 660, "total_steps": 2470, "loss": 0.3257, "lr": 8.770764480194762e-06, "epoch": 0.26720647773279355, "percentage": 26.72, "elapsed_time": "2:57:44", "remaining_time": "8:07:27"}
{"current_steps": 670, "total_steps": 2470, "loss": 0.3319, "lr": 8.726457531458174e-06, "epoch": 0.27125506072874495, "percentage": 27.13, "elapsed_time": "3:00:10", "remaining_time": "8:04:01"}
{"current_steps": 680, "total_steps": 2470, "loss": 0.336, "lr": 8.68148234126361e-06, "epoch": 0.27530364372469635, "percentage": 27.53, "elapsed_time": "3:02:50", "remaining_time": "8:01:17"}
{"current_steps": 690, "total_steps": 2470, "loss": 0.3705, "lr": 8.635846974720196e-06, "epoch": 0.2793522267206478, "percentage": 27.94, "elapsed_time": "3:05:38", "remaining_time": "7:58:52"}
{"current_steps": 700, "total_steps": 2470, "loss": 0.3611, "lr": 8.58955961532221e-06, "epoch": 0.2834008097165992, "percentage": 28.34, "elapsed_time": "3:08:09", "remaining_time": "7:55:46"}
{"current_steps": 710, "total_steps": 2470, "loss": 0.3277, "lr": 8.542628563481577e-06, "epoch": 0.2874493927125506, "percentage": 28.74, "elapsed_time": "3:11:12", "remaining_time": "7:53:57"}
{"current_steps": 720, "total_steps": 2470, "loss": 0.3713, "lr": 8.49506223503941e-06, "epoch": 0.291497975708502, "percentage": 29.15, "elapsed_time": "3:13:41", "remaining_time": "7:50:47"}
{"current_steps": 730, "total_steps": 2470, "loss": 0.3915, "lr": 8.44686915975686e-06, "epoch": 0.29554655870445345, "percentage": 29.55, "elapsed_time": "3:16:19", "remaining_time": "7:47:57"}
{"current_steps": 740, "total_steps": 2470, "loss": 0.4059, "lr": 8.398057979785515e-06, "epoch": 0.29959514170040485, "percentage": 29.96, "elapsed_time": "3:18:58", "remaining_time": "7:45:09"}
{"current_steps": 750, "total_steps": 2470, "loss": 0.3455, "lr": 8.348637448117676e-06, "epoch": 0.30364372469635625, "percentage": 30.36, "elapsed_time": "3:21:12", "remaining_time": "7:41:26"}
{"current_steps": 760, "total_steps": 2470, "loss": 0.379, "lr": 8.298616427016726e-06, "epoch": 0.3076923076923077, "percentage": 30.77, "elapsed_time": "3:24:16", "remaining_time": "7:39:36"}
{"current_steps": 770, "total_steps": 2470, "loss": 0.3442, "lr": 8.248003886427927e-06, "epoch": 0.3117408906882591, "percentage": 31.17, "elapsed_time": "3:26:43", "remaining_time": "7:36:25"}
{"current_steps": 780, "total_steps": 2470, "loss": 0.3228, "lr": 8.196808902369889e-06, "epoch": 0.3157894736842105, "percentage": 31.58, "elapsed_time": "3:29:22", "remaining_time": "7:33:37"}
{"current_steps": 790, "total_steps": 2470, "loss": 0.3733, "lr": 8.145040655307035e-06, "epoch": 0.31983805668016196, "percentage": 31.98, "elapsed_time": "3:32:07", "remaining_time": "7:31:06"}
{"current_steps": 800, "total_steps": 2470, "loss": 0.339, "lr": 8.092708428503324e-06, "epoch": 0.32388663967611336, "percentage": 32.39, "elapsed_time": "3:34:25", "remaining_time": "7:27:36"}
{"current_steps": 810, "total_steps": 2470, "loss": 0.3637, "lr": 8.039821606357544e-06, "epoch": 0.32793522267206476, "percentage": 32.79, "elapsed_time": "3:37:22", "remaining_time": "7:25:29"}
{"current_steps": 820, "total_steps": 2470, "loss": 0.35, "lr": 7.986389672720465e-06, "epoch": 0.3319838056680162, "percentage": 33.2, "elapsed_time": "3:39:39", "remaining_time": "7:22:00"}
{"current_steps": 830, "total_steps": 2470, "loss": 0.3387, "lr": 7.93242220919417e-06, "epoch": 0.3360323886639676, "percentage": 33.6, "elapsed_time": "3:42:12", "remaining_time": "7:19:03"}
{"current_steps": 840, "total_steps": 2470, "loss": 0.3862, "lr": 7.87792889341384e-06, "epoch": 0.340080971659919, "percentage": 34.01, "elapsed_time": "3:44:59", "remaining_time": "7:16:34"}
{"current_steps": 850, "total_steps": 2470, "loss": 0.3085, "lr": 7.82291949731233e-06, "epoch": 0.3441295546558704, "percentage": 34.41, "elapsed_time": "3:47:17", "remaining_time": "7:13:11"}
{"current_steps": 860, "total_steps": 2470, "loss": 0.3836, "lr": 7.767403885367832e-06, "epoch": 0.3481781376518219, "percentage": 34.82, "elapsed_time": "3:50:18", "remaining_time": "7:11:09"}
{"current_steps": 870, "total_steps": 2470, "loss": 0.3341, "lr": 7.711392012834945e-06, "epoch": 0.3522267206477733, "percentage": 35.22, "elapsed_time": "3:52:39", "remaining_time": "7:07:53"}
{"current_steps": 880, "total_steps": 2470, "loss": 0.3435, "lr": 7.654893923959452e-06, "epoch": 0.3562753036437247, "percentage": 35.63, "elapsed_time": "3:55:29", "remaining_time": "7:05:29"}
{"current_steps": 890, "total_steps": 2470, "loss": 0.3876, "lr": 7.597919750177168e-06, "epoch": 0.3603238866396761, "percentage": 36.03, "elapsed_time": "3:58:12", "remaining_time": "7:02:53"}
{"current_steps": 900, "total_steps": 2470, "loss": 0.3105, "lr": 7.540479708297123e-06, "epoch": 0.3643724696356275, "percentage": 36.44, "elapsed_time": "4:00:24", "remaining_time": "6:59:23"}
{"current_steps": 910, "total_steps": 2470, "loss": 0.3256, "lr": 7.48258409866945e-06, "epoch": 0.3684210526315789, "percentage": 36.84, "elapsed_time": "4:03:18", "remaining_time": "6:57:05"}
{"current_steps": 920, "total_steps": 2470, "loss": 0.3667, "lr": 7.42424330333829e-06, "epoch": 0.3724696356275304, "percentage": 37.25, "elapsed_time": "4:05:45", "remaining_time": "6:54:02"}
{"current_steps": 930, "total_steps": 2470, "loss": 0.3186, "lr": 7.365467784180051e-06, "epoch": 0.3765182186234818, "percentage": 37.65, "elapsed_time": "4:08:27", "remaining_time": "6:51:25"}
{"current_steps": 940, "total_steps": 2470, "loss": 0.3572, "lr": 7.306268081027347e-06, "epoch": 0.3805668016194332, "percentage": 38.06, "elapsed_time": "4:11:07", "remaining_time": "6:48:45"}
{"current_steps": 950, "total_steps": 2470, "loss": 0.3602, "lr": 7.246654809778951e-06, "epoch": 0.38461538461538464, "percentage": 38.46, "elapsed_time": "4:13:27", "remaining_time": "6:45:31"}
{"current_steps": 960, "total_steps": 2470, "loss": 0.3739, "lr": 7.186638660496125e-06, "epoch": 0.38866396761133604, "percentage": 38.87, "elapsed_time": "4:16:24", "remaining_time": "6:43:18"}
{"current_steps": 970, "total_steps": 2470, "loss": 0.3369, "lr": 7.1262303954856335e-06, "epoch": 0.39271255060728744, "percentage": 39.27, "elapsed_time": "4:18:43", "remaining_time": "6:40:06"}
{"current_steps": 980, "total_steps": 2470, "loss": 0.3192, "lr": 7.0654408473698084e-06, "epoch": 0.3967611336032389, "percentage": 39.68, "elapsed_time": "4:21:25", "remaining_time": "6:37:28"}
{"current_steps": 990, "total_steps": 2470, "loss": 0.3704, "lr": 7.004280917144015e-06, "epoch": 0.4008097165991903, "percentage": 40.08, "elapsed_time": "4:24:03", "remaining_time": "6:34:45"}
{"current_steps": 1000, "total_steps": 2470, "loss": 0.3427, "lr": 6.942761572221833e-06, "epoch": 0.4048582995951417, "percentage": 40.49, "elapsed_time": "4:26:10", "remaining_time": "6:31:16"}
{"current_steps": 1000, "total_steps": 2470, "eval_loss": 0.367609441280365, "epoch": 0.4048582995951417, "percentage": 40.49, "elapsed_time": "4:26:25", "remaining_time": "6:31:37"}
{"current_steps": 1010, "total_steps": 2470, "loss": 0.3523, "lr": 6.8808938444683505e-06, "epoch": 0.4089068825910931, "percentage": 40.89, "elapsed_time": "4:32:59", "remaining_time": "6:34:37"}
{"current_steps": 1020, "total_steps": 2470, "loss": 0.3391, "lr": 6.81868882822189e-06, "epoch": 0.41295546558704455, "percentage": 41.3, "elapsed_time": "4:35:20", "remaining_time": "6:31:24"}
{"current_steps": 1030, "total_steps": 2470, "loss": 0.3116, "lr": 6.756157678304531e-06, "epoch": 0.41700404858299595, "percentage": 41.7, "elapsed_time": "4:37:52", "remaining_time": "6:28:28"}
{"current_steps": 1040, "total_steps": 2470, "loss": 0.3261, "lr": 6.69331160802179e-06, "epoch": 0.42105263157894735, "percentage": 42.11, "elapsed_time": "4:40:36", "remaining_time": "6:25:49"}
{"current_steps": 1050, "total_steps": 2470, "loss": 0.3165, "lr": 6.630161887151806e-06, "epoch": 0.4251012145748988, "percentage": 42.51, "elapsed_time": "4:43:03", "remaining_time": "6:22:48"}
{"current_steps": 1060, "total_steps": 2470, "loss": 0.3801, "lr": 6.566719839924412e-06, "epoch": 0.4291497975708502, "percentage": 42.91, "elapsed_time": "4:46:16", "remaining_time": "6:20:47"}
{"current_steps": 1070, "total_steps": 2470, "loss": 0.368, "lr": 6.502996842990431e-06, "epoch": 0.4331983805668016, "percentage": 43.32, "elapsed_time": "4:48:44", "remaining_time": "6:17:47"}
{"current_steps": 1080, "total_steps": 2470, "loss": 0.3221, "lr": 6.43900432338157e-06, "epoch": 0.43724696356275305, "percentage": 43.72, "elapsed_time": "4:51:22", "remaining_time": "6:15:00"}
{"current_steps": 1090, "total_steps": 2470, "loss": 0.3687, "lr": 6.374753756461295e-06, "epoch": 0.44129554655870445, "percentage": 44.13, "elapsed_time": "4:54:03", "remaining_time": "6:12:17"}
{"current_steps": 1100, "total_steps": 2470, "loss": 0.318, "lr": 6.310256663867019e-06, "epoch": 0.44534412955465585, "percentage": 44.53, "elapsed_time": "4:56:27", "remaining_time": "6:09:12"}
{"current_steps": 1110, "total_steps": 2470, "loss": 0.3322, "lr": 6.245524611444005e-06, "epoch": 0.4493927125506073, "percentage": 44.94, "elapsed_time": "4:59:22", "remaining_time": "6:06:48"}
{"current_steps": 1120, "total_steps": 2470, "loss": 0.3637, "lr": 6.180569207171338e-06, "epoch": 0.4534412955465587, "percentage": 45.34, "elapsed_time": "5:01:40", "remaining_time": "6:03:37"}
{"current_steps": 1130, "total_steps": 2470, "loss": 0.3171, "lr": 6.115402099080345e-06, "epoch": 0.4574898785425101, "percentage": 45.75, "elapsed_time": "5:04:16", "remaining_time": "6:00:49"}
{"current_steps": 1140, "total_steps": 2470, "loss": 0.3466, "lr": 6.05003497316582e-06, "epoch": 0.46153846153846156, "percentage": 46.15, "elapsed_time": "5:06:54", "remaining_time": "5:58:03"}
{"current_steps": 1150, "total_steps": 2470, "loss": 0.3241, "lr": 5.984479551290459e-06, "epoch": 0.46558704453441296, "percentage": 46.56, "elapsed_time": "5:09:03", "remaining_time": "5:54:44"}
{"current_steps": 1160, "total_steps": 2470, "loss": 0.3249, "lr": 5.918747589082853e-06, "epoch": 0.46963562753036436, "percentage": 46.96, "elapsed_time": "5:12:10", "remaining_time": "5:52:32"}
{"current_steps": 1170, "total_steps": 2470, "loss": 0.331, "lr": 5.852850873829421e-06, "epoch": 0.47368421052631576, "percentage": 47.37, "elapsed_time": "5:14:37", "remaining_time": "5:49:35"}
{"current_steps": 1180, "total_steps": 2470, "loss": 0.3332, "lr": 5.786801222360682e-06, "epoch": 0.4777327935222672, "percentage": 47.77, "elapsed_time": "5:17:11", "remaining_time": "5:46:45"}
{"current_steps": 1190, "total_steps": 2470, "loss": 0.3958, "lr": 5.720610478932211e-06, "epoch": 0.4817813765182186, "percentage": 48.18, "elapsed_time": "5:19:49", "remaining_time": "5:44:01"}
{"current_steps": 1200, "total_steps": 2470, "loss": 0.3196, "lr": 5.654290513100691e-06, "epoch": 0.48582995951417, "percentage": 48.58, "elapsed_time": "5:22:05", "remaining_time": "5:40:53"}
{"current_steps": 1210, "total_steps": 2470, "loss": 0.3399, "lr": 5.587853217595418e-06, "epoch": 0.4898785425101215, "percentage": 48.99, "elapsed_time": "5:25:03", "remaining_time": "5:38:29"}
{"current_steps": 1220, "total_steps": 2470, "loss": 0.3297, "lr": 5.521310506185661e-06, "epoch": 0.4939271255060729, "percentage": 49.39, "elapsed_time": "5:27:25", "remaining_time": "5:35:28"}
{"current_steps": 1230, "total_steps": 2470, "loss": 0.3187, "lr": 5.454674311544236e-06, "epoch": 0.4979757085020243, "percentage": 49.8, "elapsed_time": "5:30:11", "remaining_time": "5:32:52"}
{"current_steps": 1240, "total_steps": 2470, "loss": 0.3775, "lr": 5.387956583107702e-06, "epoch": 0.5020242914979757, "percentage": 50.2, "elapsed_time": "5:33:00", "remaining_time": "5:30:19"}
{"current_steps": 1250, "total_steps": 2470, "loss": 0.3101, "lr": 5.321169284933543e-06, "epoch": 0.5060728744939271, "percentage": 50.61, "elapsed_time": "5:35:19", "remaining_time": "5:27:16"}
{"current_steps": 1260, "total_steps": 2470, "loss": 0.3213, "lr": 5.2543243935547385e-06, "epoch": 0.5101214574898786, "percentage": 51.01, "elapsed_time": "5:38:27", "remaining_time": "5:25:01"}
{"current_steps": 1270, "total_steps": 2470, "loss": 0.3492, "lr": 5.187433895832075e-06, "epoch": 0.5141700404858299, "percentage": 51.42, "elapsed_time": "5:40:51", "remaining_time": "5:22:04"}
{"current_steps": 1280, "total_steps": 2470, "loss": 0.3692, "lr": 5.120509786804635e-06, "epoch": 0.5182186234817814, "percentage": 51.82, "elapsed_time": "5:43:29", "remaining_time": "5:19:20"}
{"current_steps": 1290, "total_steps": 2470, "loss": 0.3925, "lr": 5.053564067538797e-06, "epoch": 0.5222672064777328, "percentage": 52.23, "elapsed_time": "5:46:19", "remaining_time": "5:16:47"}
{"current_steps": 1300, "total_steps": 2470, "loss": 0.3188, "lr": 4.986608742976164e-06, "epoch": 0.5263157894736842, "percentage": 52.63, "elapsed_time": "5:48:41", "remaining_time": "5:13:49"}
{"current_steps": 1310, "total_steps": 2470, "loss": 0.3225, "lr": 4.919655819780792e-06, "epoch": 0.5303643724696356, "percentage": 53.04, "elapsed_time": "5:51:48", "remaining_time": "5:11:31"}
{"current_steps": 1320, "total_steps": 2470, "loss": 0.3307, "lr": 4.852717304186119e-06, "epoch": 0.5344129554655871, "percentage": 53.44, "elapsed_time": "5:54:15", "remaining_time": "5:08:38"}
{"current_steps": 1330, "total_steps": 2470, "loss": 0.401, "lr": 4.785805199841956e-06, "epoch": 0.5384615384615384, "percentage": 53.85, "elapsed_time": "5:57:02", "remaining_time": "5:06:02"}
{"current_steps": 1340, "total_steps": 2470, "loss": 0.3371, "lr": 4.718931505661961e-06, "epoch": 0.5425101214574899, "percentage": 54.25, "elapsed_time": "5:59:47", "remaining_time": "5:03:24"}
{"current_steps": 1350, "total_steps": 2470, "loss": 0.3067, "lr": 4.652108213671947e-06, "epoch": 0.5465587044534413, "percentage": 54.66, "elapsed_time": "6:02:02", "remaining_time": "5:00:21"}
{"current_steps": 1360, "total_steps": 2470, "loss": 0.3075, "lr": 4.585347306859423e-06, "epoch": 0.5506072874493927, "percentage": 55.06, "elapsed_time": "6:05:02", "remaining_time": "4:57:56"}
{"current_steps": 1370, "total_steps": 2470, "loss": 0.3369, "lr": 4.518660757024774e-06, "epoch": 0.5546558704453441, "percentage": 55.47, "elapsed_time": "6:07:25", "remaining_time": "4:55:00"}
{"current_steps": 1380, "total_steps": 2470, "loss": 0.3196, "lr": 4.452060522634431e-06, "epoch": 0.5587044534412956, "percentage": 55.87, "elapsed_time": "6:10:00", "remaining_time": "4:52:14"}
{"current_steps": 1390, "total_steps": 2470, "loss": 0.3291, "lr": 4.3855585466764305e-06, "epoch": 0.562753036437247, "percentage": 56.28, "elapsed_time": "6:12:47", "remaining_time": "4:49:38"}
{"current_steps": 1400, "total_steps": 2470, "loss": 0.3306, "lr": 4.319166754518768e-06, "epoch": 0.5668016194331984, "percentage": 56.68, "elapsed_time": "6:14:59", "remaining_time": "4:46:35"}
{"current_steps": 1410, "total_steps": 2470, "loss": 0.322, "lr": 4.25289705177089e-06, "epoch": 0.5708502024291497, "percentage": 57.09, "elapsed_time": "6:18:01", "remaining_time": "4:44:10"}
{"current_steps": 1420, "total_steps": 2470, "loss": 0.3538, "lr": 4.186761322148741e-06, "epoch": 0.5748987854251012, "percentage": 57.49, "elapsed_time": "6:20:26", "remaining_time": "4:41:18"}
{"current_steps": 1430, "total_steps": 2470, "loss": 0.3138, "lr": 4.120771425343733e-06, "epoch": 0.5789473684210527, "percentage": 57.89, "elapsed_time": "6:23:12", "remaining_time": "4:38:41"}
{"current_steps": 1440, "total_steps": 2470, "loss": 0.37, "lr": 4.0549391948960275e-06, "epoch": 0.582995951417004, "percentage": 58.3, "elapsed_time": "6:25:57", "remaining_time": "4:36:04"}
{"current_steps": 1450, "total_steps": 2470, "loss": 0.3303, "lr": 3.9892764360725e-06, "epoch": 0.5870445344129555, "percentage": 58.7, "elapsed_time": "6:28:12", "remaining_time": "4:33:05"}
{"current_steps": 1460, "total_steps": 2470, "loss": 0.2951, "lr": 3.923794923749775e-06, "epoch": 0.5910931174089069, "percentage": 59.11, "elapsed_time": "6:31:17", "remaining_time": "4:30:41"}
{"current_steps": 1470, "total_steps": 2470, "loss": 0.3287, "lr": 3.8585064003027236e-06, "epoch": 0.5951417004048583, "percentage": 59.51, "elapsed_time": "6:33:46", "remaining_time": "4:27:52"}
{"current_steps": 1480, "total_steps": 2470, "loss": 0.3211, "lr": 3.793422573498771e-06, "epoch": 0.5991902834008097, "percentage": 59.92, "elapsed_time": "6:36:22", "remaining_time": "4:25:08"}
{"current_steps": 1490, "total_steps": 2470, "loss": 0.3742, "lr": 3.728555114398419e-06, "epoch": 0.6032388663967612, "percentage": 60.32, "elapsed_time": "6:39:09", "remaining_time": "4:22:31"}
{"current_steps": 1500, "total_steps": 2470, "loss": 0.3284, "lr": 3.6639156552623557e-06, "epoch": 0.6072874493927125, "percentage": 60.73, "elapsed_time": "6:41:26", "remaining_time": "4:19:36"}
{"current_steps": 1510, "total_steps": 2470, "loss": 0.3014, "lr": 3.5995157874655134e-06, "epoch": 0.611336032388664, "percentage": 61.13, "elapsed_time": "6:47:50", "remaining_time": "4:19:17"}
{"current_steps": 1520, "total_steps": 2470, "loss": 0.3416, "lr": 3.5353670594184623e-06, "epoch": 0.6153846153846154, "percentage": 61.54, "elapsed_time": "6:50:18", "remaining_time": "4:16:26"}
{"current_steps": 1530, "total_steps": 2470, "loss": 0.3168, "lr": 3.471480974496513e-06, "epoch": 0.6194331983805668, "percentage": 61.94, "elapsed_time": "6:53:02", "remaining_time": "4:13:46"}
{"current_steps": 1540, "total_steps": 2470, "loss": 0.3258, "lr": 3.4078689889768867e-06, "epoch": 0.6234817813765182, "percentage": 62.35, "elapsed_time": "6:55:45", "remaining_time": "4:11:04"}
{"current_steps": 1550, "total_steps": 2470, "loss": 0.3209, "lr": 3.3445425099843343e-06, "epoch": 0.6275303643724697, "percentage": 62.75, "elapsed_time": "6:57:53", "remaining_time": "4:08:02"}
{"current_steps": 1560, "total_steps": 2470, "loss": 0.3064, "lr": 3.2815128934455774e-06, "epoch": 0.631578947368421, "percentage": 63.16, "elapsed_time": "7:00:53", "remaining_time": "4:05:31"}
{"current_steps": 1570, "total_steps": 2470, "loss": 0.31, "lr": 3.2187914420529176e-06, "epoch": 0.6356275303643725, "percentage": 63.56, "elapsed_time": "7:03:20", "remaining_time": "4:02:40"}
{"current_steps": 1580, "total_steps": 2470, "loss": 0.3385, "lr": 3.1563894032373977e-06, "epoch": 0.6396761133603239, "percentage": 63.97, "elapsed_time": "7:05:55", "remaining_time": "3:59:55"}
{"current_steps": 1590, "total_steps": 2470, "loss": 0.331, "lr": 3.094317967151876e-06, "epoch": 0.6437246963562753, "percentage": 64.37, "elapsed_time": "7:08:44", "remaining_time": "3:57:17"}
{"current_steps": 1600, "total_steps": 2470, "loss": 0.323, "lr": 3.0325882646643713e-06, "epoch": 0.6477732793522267, "percentage": 64.78, "elapsed_time": "7:11:01", "remaining_time": "3:54:22"}
{"current_steps": 1610, "total_steps": 2470, "loss": 0.3539, "lr": 2.971211365362028e-06, "epoch": 0.6518218623481782, "percentage": 65.18, "elapsed_time": "7:14:10", "remaining_time": "3:51:54"}
{"current_steps": 1620, "total_steps": 2470, "loss": 0.3446, "lr": 2.910198275566085e-06, "epoch": 0.6558704453441295, "percentage": 65.59, "elapsed_time": "7:16:36", "remaining_time": "3:49:05"}
{"current_steps": 1630, "total_steps": 2470, "loss": 0.2856, "lr": 2.8495599363581816e-06, "epoch": 0.659919028340081, "percentage": 65.99, "elapsed_time": "7:19:20", "remaining_time": "3:46:24"}
{"current_steps": 1640, "total_steps": 2470, "loss": 0.3514, "lr": 2.789307221618369e-06, "epoch": 0.6639676113360324, "percentage": 66.4, "elapsed_time": "7:22:04", "remaining_time": "3:43:43"}
{"current_steps": 1650, "total_steps": 2470, "loss": 0.3434, "lr": 2.72945093607516e-06, "epoch": 0.6680161943319838, "percentage": 66.8, "elapsed_time": "7:24:13", "remaining_time": "3:40:45"}
{"current_steps": 1660, "total_steps": 2470, "loss": 0.3168, "lr": 2.6700018133679883e-06, "epoch": 0.6720647773279352, "percentage": 67.21, "elapsed_time": "7:27:13", "remaining_time": "3:38:13"}
{"current_steps": 1670, "total_steps": 2470, "loss": 0.3325, "lr": 2.6109705141224255e-06, "epoch": 0.6761133603238867, "percentage": 67.61, "elapsed_time": "7:29:41", "remaining_time": "3:35:25"}
{"current_steps": 1680, "total_steps": 2470, "loss": 0.3139, "lr": 2.5523676240384652e-06, "epoch": 0.680161943319838, "percentage": 68.02, "elapsed_time": "7:32:23", "remaining_time": "3:32:43"}
{"current_steps": 1690, "total_steps": 2470, "loss": 0.3088, "lr": 2.494203651992265e-06, "epoch": 0.6842105263157895, "percentage": 68.42, "elapsed_time": "7:35:08", "remaining_time": "3:30:03"}
{"current_steps": 1700, "total_steps": 2470, "loss": 0.3054, "lr": 2.4364890281516633e-06, "epoch": 0.6882591093117408, "percentage": 68.83, "elapsed_time": "7:37:18", "remaining_time": "3:27:07"}
{"current_steps": 1710, "total_steps": 2470, "loss": 0.3181, "lr": 2.3792341021057917e-06, "epoch": 0.6923076923076923, "percentage": 69.23, "elapsed_time": "7:40:28", "remaining_time": "3:24:39"}
{"current_steps": 1720, "total_steps": 2470, "loss": 0.3351, "lr": 2.3224491410091664e-06, "epoch": 0.6963562753036437, "percentage": 69.64, "elapsed_time": "7:42:53", "remaining_time": "3:21:50"}
{"current_steps": 1730, "total_steps": 2470, "loss": 0.2898, "lr": 2.266144327740531e-06, "epoch": 0.7004048582995951, "percentage": 70.04, "elapsed_time": "7:45:33", "remaining_time": "3:19:08"}
{"current_steps": 1740, "total_steps": 2470, "loss": 0.3462, "lr": 2.2103297590768334e-06, "epoch": 0.7044534412955465, "percentage": 70.45, "elapsed_time": "7:48:14", "remaining_time": "3:16:26"}
{"current_steps": 1750, "total_steps": 2470, "loss": 0.3417, "lr": 2.155015443882644e-06, "epoch": 0.708502024291498, "percentage": 70.85, "elapsed_time": "7:50:32", "remaining_time": "3:13:35"}
{"current_steps": 1760, "total_steps": 2470, "loss": 0.3136, "lr": 2.100211301315315e-06, "epoch": 0.7125506072874493, "percentage": 71.26, "elapsed_time": "7:53:31", "remaining_time": "3:11:01"}
{"current_steps": 1770, "total_steps": 2470, "loss": 0.3124, "lr": 2.045927159046252e-06, "epoch": 0.7165991902834008, "percentage": 71.66, "elapsed_time": "7:55:55", "remaining_time": "3:08:13"}
{"current_steps": 1780, "total_steps": 2470, "loss": 0.2817, "lr": 1.9921727514985857e-06, "epoch": 0.7206477732793523, "percentage": 72.06, "elapsed_time": "7:58:40", "remaining_time": "3:05:33"}
{"current_steps": 1790, "total_steps": 2470, "loss": 0.3343, "lr": 1.9389577181015496e-06, "epoch": 0.7246963562753036, "percentage": 72.47, "elapsed_time": "8:01:19", "remaining_time": "3:02:51"}
{"current_steps": 1800, "total_steps": 2470, "loss": 0.2932, "lr": 1.8862916015619093e-06, "epoch": 0.728744939271255, "percentage": 72.87, "elapsed_time": "8:03:36", "remaining_time": "3:00:00"}
{"current_steps": 1810, "total_steps": 2470, "loss": 0.2659, "lr": 1.8341838461527344e-06, "epoch": 0.7327935222672065, "percentage": 73.28, "elapsed_time": "8:06:35", "remaining_time": "2:57:25"}
{"current_steps": 1820, "total_steps": 2470, "loss": 0.3147, "lr": 1.782643796019814e-06, "epoch": 0.7368421052631579, "percentage": 73.68, "elapsed_time": "8:08:55", "remaining_time": "2:54:37"}
{"current_steps": 1830, "total_steps": 2470, "loss": 0.2962, "lr": 1.7316806935060298e-06, "epoch": 0.7408906882591093, "percentage": 74.09, "elapsed_time": "8:11:32", "remaining_time": "2:51:54"}
{"current_steps": 1840, "total_steps": 2470, "loss": 0.3507, "lr": 1.6813036774939894e-06, "epoch": 0.7449392712550608, "percentage": 74.49, "elapsed_time": "8:14:15", "remaining_time": "2:49:13"}
{"current_steps": 1850, "total_steps": 2470, "loss": 0.3013, "lr": 1.6315217817672142e-06, "epoch": 0.7489878542510121, "percentage": 74.9, "elapsed_time": "8:16:36", "remaining_time": "2:46:25"}
{"current_steps": 1860, "total_steps": 2470, "loss": 0.2863, "lr": 1.5823439333901591e-06, "epoch": 0.7530364372469636, "percentage": 75.3, "elapsed_time": "8:19:28", "remaining_time": "2:43:48"}
{"current_steps": 1870, "total_steps": 2470, "loss": 0.3043, "lr": 1.5337789511073881e-06, "epoch": 0.757085020242915, "percentage": 75.71, "elapsed_time": "8:21:52", "remaining_time": "2:41:01"}
{"current_steps": 1880, "total_steps": 2470, "loss": 0.2814, "lr": 1.4858355437621663e-06, "epoch": 0.7611336032388664, "percentage": 76.11, "elapsed_time": "8:24:31", "remaining_time": "2:38:19"}
{"current_steps": 1890, "total_steps": 2470, "loss": 0.3551, "lr": 1.4385223087347533e-06, "epoch": 0.7651821862348178, "percentage": 76.52, "elapsed_time": "8:27:16", "remaining_time": "2:35:40"}
{"current_steps": 1900, "total_steps": 2470, "loss": 0.3204, "lr": 1.3918477304006956e-06, "epoch": 0.7692307692307693, "percentage": 76.92, "elapsed_time": "8:29:27", "remaining_time": "2:32:50"}
{"current_steps": 1910, "total_steps": 2470, "loss": 0.3572, "lr": 1.3458201786093795e-06, "epoch": 0.7732793522267206, "percentage": 77.33, "elapsed_time": "8:32:29", "remaining_time": "2:30:15"}
{"current_steps": 1920, "total_steps": 2470, "loss": 0.3235, "lr": 1.3004479071831161e-06, "epoch": 0.7773279352226721, "percentage": 77.73, "elapsed_time": "8:34:57", "remaining_time": "2:27:30"}
{"current_steps": 1930, "total_steps": 2470, "loss": 0.2956, "lr": 1.2557390524370371e-06, "epoch": 0.7813765182186235, "percentage": 78.14, "elapsed_time": "8:37:42", "remaining_time": "2:24:51"}
{"current_steps": 1940, "total_steps": 2470, "loss": 0.3123, "lr": 1.2117016317200702e-06, "epoch": 0.7854251012145749, "percentage": 78.54, "elapsed_time": "8:40:29", "remaining_time": "2:22:11"}
{"current_steps": 1950, "total_steps": 2470, "loss": 0.3165, "lr": 1.1683435419772282e-06, "epoch": 0.7894736842105263, "percentage": 78.95, "elapsed_time": "8:42:54", "remaining_time": "2:19:26"}
{"current_steps": 1960, "total_steps": 2470, "loss": 0.3207, "lr": 1.125672558333507e-06, "epoch": 0.7935222672064778, "percentage": 79.35, "elapsed_time": "8:45:55", "remaining_time": "2:16:50"}
{"current_steps": 1970, "total_steps": 2470, "loss": 0.3195, "lr": 1.083696332699628e-06, "epoch": 0.7975708502024291, "percentage": 79.76, "elapsed_time": "8:48:24", "remaining_time": "2:14:06"}
{"current_steps": 1980, "total_steps": 2470, "loss": 0.3292, "lr": 1.0424223923998572e-06, "epoch": 0.8016194331983806, "percentage": 80.16, "elapsed_time": "8:51:06", "remaining_time": "2:11:26"}
{"current_steps": 1990, "total_steps": 2470, "loss": 0.3595, "lr": 1.0018581388221942e-06, "epoch": 0.805668016194332, "percentage": 80.57, "elapsed_time": "8:53:49", "remaining_time": "2:08:45"}
{"current_steps": 2000, "total_steps": 2470, "loss": 0.3254, "lr": 9.620108460911181e-07, "epoch": 0.8097165991902834, "percentage": 80.97, "elapsed_time": "8:56:04", "remaining_time": "2:05:58"}
{"current_steps": 2000, "total_steps": 2470, "eval_loss": 0.3475629687309265, "epoch": 0.8097165991902834, "percentage": 80.97, "elapsed_time": "8:56:19", "remaining_time": "2:06:02"}
{"current_steps": 2010, "total_steps": 2470, "loss": 0.3207, "lr": 9.228876597631686e-07, "epoch": 0.8137651821862348, "percentage": 81.38, "elapsed_time": "9:02:44", "remaining_time": "2:04:12"}
{"current_steps": 2020, "total_steps": 2470, "loss": 0.2986, "lr": 8.844955955455859e-07, "epoch": 0.8178137651821862, "percentage": 81.78, "elapsed_time": "9:05:06", "remaining_time": "2:01:26"}
{"current_steps": 2030, "total_steps": 2470, "loss": 0.3022, "lr": 8.4684153803822e-07, "epoch": 0.8218623481781376, "percentage": 82.19, "elapsed_time": "9:07:47", "remaining_time": "1:58:44"}
{"current_steps": 2040, "total_steps": 2470, "loss": 0.3395, "lr": 8.099322394989645e-07, "epoch": 0.8259109311740891, "percentage": 82.59, "elapsed_time": "9:10:27", "remaining_time": "1:56:01"}
{"current_steps": 2050, "total_steps": 2470, "loss": 0.2974, "lr": 7.737743186329222e-07, "epoch": 0.8299595141700404, "percentage": 83.0, "elapsed_time": "9:12:43", "remaining_time": "1:53:14"}
{"current_steps": 2060, "total_steps": 2470, "loss": 0.3039, "lr": 7.383742594055077e-07, "epoch": 0.8340080971659919, "percentage": 83.4, "elapsed_time": "9:15:46", "remaining_time": "1:50:36"}
{"current_steps": 2070, "total_steps": 2470, "loss": 0.3029, "lr": 7.037384098797235e-07, "epoch": 0.8380566801619433, "percentage": 83.81, "elapsed_time": "9:18:15", "remaining_time": "1:47:52"}
{"current_steps": 2080, "total_steps": 2470, "loss": 0.2824, "lr": 6.698729810778065e-07, "epoch": 0.8421052631578947, "percentage": 84.21, "elapsed_time": "9:20:56", "remaining_time": "1:45:10"}
{"current_steps": 2090, "total_steps": 2470, "loss": 0.3344, "lr": 6.367840458674401e-07, "epoch": 0.8461538461538461, "percentage": 84.62, "elapsed_time": "9:23:38", "remaining_time": "1:42:28"}
{"current_steps": 2100, "total_steps": 2470, "loss": 0.2838, "lr": 6.044775378727474e-07, "epoch": 0.8502024291497976, "percentage": 85.02, "elapsed_time": "9:25:56", "remaining_time": "1:39:42"}
{"current_steps": 2110, "total_steps": 2470, "loss": 0.3043, "lr": 5.729592504102577e-07, "epoch": 0.854251012145749, "percentage": 85.43, "elapsed_time": "9:28:54", "remaining_time": "1:37:03"}
{"current_steps": 2120, "total_steps": 2470, "loss": 0.3722, "lr": 5.422348354500217e-07, "epoch": 0.8582995951417004, "percentage": 85.83, "elapsed_time": "9:31:18", "remaining_time": "1:34:19"}
{"current_steps": 2130, "total_steps": 2470, "loss": 0.3269, "lr": 5.12309802602084e-07, "epoch": 0.8623481781376519, "percentage": 86.23, "elapsed_time": "9:33:50", "remaining_time": "1:31:35"}
{"current_steps": 2140, "total_steps": 2470, "loss": 0.3336, "lr": 4.831895181284818e-07, "epoch": 0.8663967611336032, "percentage": 86.64, "elapsed_time": "9:36:29", "remaining_time": "1:28:53"}
{"current_steps": 2150, "total_steps": 2470, "loss": 0.2869, "lr": 4.5487920398094465e-07, "epoch": 0.8704453441295547, "percentage": 87.04, "elapsed_time": "9:38:46", "remaining_time": "1:26:08"}
{"current_steps": 2160, "total_steps": 2470, "loss": 0.3126, "lr": 4.273839368644778e-07, "epoch": 0.8744939271255061, "percentage": 87.45, "elapsed_time": "9:41:56", "remaining_time": "1:23:31"}
{"current_steps": 2170, "total_steps": 2470, "loss": 0.3288, "lr": 4.0070864732698945e-07, "epoch": 0.8785425101214575, "percentage": 87.85, "elapsed_time": "9:44:23", "remaining_time": "1:20:47"}
{"current_steps": 2180, "total_steps": 2470, "loss": 0.3102, "lr": 3.7485811887512714e-07, "epoch": 0.8825910931174089, "percentage": 88.26, "elapsed_time": "9:47:00", "remaining_time": "1:18:05"}
{"current_steps": 2190, "total_steps": 2470, "loss": 0.3266, "lr": 3.498369871164803e-07, "epoch": 0.8866396761133604, "percentage": 88.66, "elapsed_time": "9:49:43", "remaining_time": "1:15:23"}
{"current_steps": 2200, "total_steps": 2470, "loss": 0.2953, "lr": 3.256497389283142e-07, "epoch": 0.8906882591093117, "percentage": 89.07, "elapsed_time": "9:52:04", "remaining_time": "1:12:39"}
{"current_steps": 2210, "total_steps": 2470, "loss": 0.3171, "lr": 3.0230071165295804e-07, "epoch": 0.8947368421052632, "percentage": 89.47, "elapsed_time": "9:55:06", "remaining_time": "1:10:00"}
{"current_steps": 2220, "total_steps": 2470, "loss": 0.2901, "lr": 2.797940923200215e-07, "epoch": 0.8987854251012146, "percentage": 89.88, "elapsed_time": "9:57:33", "remaining_time": "1:07:17"}
{"current_steps": 2230, "total_steps": 2470, "loss": 0.3274, "lr": 2.58133916895566e-07, "epoch": 0.902834008097166, "percentage": 90.28, "elapsed_time": "10:00:12", "remaining_time": "1:04:35"}
{"current_steps": 2240, "total_steps": 2470, "loss": 0.3384, "lr": 2.373240695583534e-07, "epoch": 0.9068825910931174, "percentage": 90.69, "elapsed_time": "10:03:02", "remaining_time": "1:01:55"}
{"current_steps": 2250, "total_steps": 2470, "loss": 0.3575, "lr": 2.1736828200332628e-07, "epoch": 0.9109311740890689, "percentage": 91.09, "elapsed_time": "10:05:13", "remaining_time": "0:59:10"}
{"current_steps": 2260, "total_steps": 2470, "loss": 0.3151, "lr": 1.9827013277242736e-07, "epoch": 0.9149797570850202, "percentage": 91.5, "elapsed_time": "10:08:20", "remaining_time": "0:56:31"}
{"current_steps": 2270, "total_steps": 2470, "loss": 0.338, "lr": 1.800330466128808e-07, "epoch": 0.9190283400809717, "percentage": 91.9, "elapsed_time": "10:10:43", "remaining_time": "0:53:48"}
{"current_steps": 2280, "total_steps": 2470, "loss": 0.2969, "lr": 1.6266029386305448e-07, "epoch": 0.9230769230769231, "percentage": 92.31, "elapsed_time": "10:13:18", "remaining_time": "0:51:06"}
{"current_steps": 2290, "total_steps": 2470, "loss": 0.2982, "lr": 1.4615498986601362e-07, "epoch": 0.9271255060728745, "percentage": 92.71, "elapsed_time": "10:15:59", "remaining_time": "0:48:25"}
{"current_steps": 2300, "total_steps": 2470, "loss": 0.3464, "lr": 1.3052009441086533e-07, "epoch": 0.9311740890688259, "percentage": 93.12, "elapsed_time": "10:18:12", "remaining_time": "0:45:41"}
{"current_steps": 2310, "total_steps": 2470, "loss": 0.3107, "lr": 1.157584112019966e-07, "epoch": 0.9352226720647774, "percentage": 93.52, "elapsed_time": "10:21:12", "remaining_time": "0:43:01"}
{"current_steps": 2320, "total_steps": 2470, "loss": 0.3002, "lr": 1.0187258735630867e-07, "epoch": 0.9392712550607287, "percentage": 93.93, "elapsed_time": "10:23:36", "remaining_time": "0:40:19"}
{"current_steps": 2330, "total_steps": 2470, "loss": 0.299, "lr": 8.886511292852395e-08, "epoch": 0.9433198380566802, "percentage": 94.33, "elapsed_time": "10:26:19", "remaining_time": "0:37:37"}
{"current_steps": 2340, "total_steps": 2470, "loss": 0.37, "lr": 7.673832046465879e-08, "epoch": 0.9473684210526315, "percentage": 94.74, "elapsed_time": "10:29:02", "remaining_time": "0:34:56"}
{"current_steps": 2350, "total_steps": 2470, "loss": 0.3078, "lr": 6.549438458374857e-08, "epoch": 0.951417004048583, "percentage": 95.14, "elapsed_time": "10:31:30", "remaining_time": "0:32:14"}
{"current_steps": 2360, "total_steps": 2470, "loss": 0.3015, "lr": 5.513532158788193e-08, "epoch": 0.9554655870445344, "percentage": 95.55, "elapsed_time": "10:34:36", "remaining_time": "0:29:34"}
{"current_steps": 2370, "total_steps": 2470, "loss": 0.3385, "lr": 4.566298910063327e-08, "epoch": 0.9595141700404858, "percentage": 95.95, "elapsed_time": "10:36:58", "remaining_time": "0:26:52"}
{"current_steps": 2380, "total_steps": 2470, "loss": 0.3094, "lr": 3.707908573394703e-08, "epoch": 0.9635627530364372, "percentage": 96.36, "elapsed_time": "10:39:42", "remaining_time": "0:24:11"}
{"current_steps": 2390, "total_steps": 2470, "loss": 0.3348, "lr": 2.938515078353521e-08, "epoch": 0.9676113360323887, "percentage": 96.76, "elapsed_time": "10:42:34", "remaining_time": "0:21:30"}
{"current_steps": 2400, "total_steps": 2470, "loss": 0.322, "lr": 2.258256395284708e-08, "epoch": 0.97165991902834, "percentage": 97.17, "elapsed_time": "10:44:55", "remaining_time": "0:18:48"}
{"current_steps": 2410, "total_steps": 2470, "loss": 0.3143, "lr": 1.6672545105654857e-08, "epoch": 0.9757085020242915, "percentage": 97.57, "elapsed_time": "10:47:53", "remaining_time": "0:16:07"}
{"current_steps": 2420, "total_steps": 2470, "loss": 0.333, "lr": 1.1656154047303691e-08, "epoch": 0.979757085020243, "percentage": 97.98, "elapsed_time": "10:50:10", "remaining_time": "0:13:25"}
{"current_steps": 2430, "total_steps": 2470, "loss": 0.2787, "lr": 7.534290334664795e-09, "epoch": 0.9838056680161943, "percentage": 98.38, "elapsed_time": "10:52:54", "remaining_time": "0:10:44"}
{"current_steps": 2440, "total_steps": 2470, "loss": 0.3433, "lr": 4.307693114821154e-09, "epoch": 0.9878542510121457, "percentage": 98.79, "elapsed_time": "10:55:35", "remaining_time": "0:08:03"}
{"current_steps": 2450, "total_steps": 2470, "loss": 0.3547, "lr": 1.976940992523546e-09, "epoch": 0.9919028340080972, "percentage": 99.19, "elapsed_time": "10:57:49", "remaining_time": "0:05:22"}
{"current_steps": 2460, "total_steps": 2470, "loss": 0.344, "lr": 5.424519264324301e-10, "epoch": 0.9959514170040485, "percentage": 99.6, "elapsed_time": "11:00:49", "remaining_time": "0:02:41"}
{"current_steps": 2470, "total_steps": 2470, "loss": 0.3343, "lr": 4.4831541662349046e-12, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "11:03:06", "remaining_time": "0:00:00"}
{"current_steps": 2470, "total_steps": 2470, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "11:06:30", "remaining_time": "0:00:00"}