diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -1,775 +1,6 @@ -{"current_steps": 10, "total_steps": 6450, "loss": 1.587, "lr": 1.550387596899225e-06, "epoch": 0.015503875968992248, "percentage": 0.16, "elapsed_time": "0:01:21", "remaining_time": "14:32:54"} -{"current_steps": 20, "total_steps": 6450, "loss": 1.5507, "lr": 3.10077519379845e-06, "epoch": 0.031007751937984496, "percentage": 0.31, "elapsed_time": "0:02:42", "remaining_time": "14:29:20"} -{"current_steps": 30, "total_steps": 6450, "loss": 1.4835, "lr": 4.651162790697674e-06, "epoch": 0.046511627906976744, "percentage": 0.47, "elapsed_time": "0:04:03", "remaining_time": "14:28:08"} -{"current_steps": 40, "total_steps": 6450, "loss": 1.2778, "lr": 6.2015503875969e-06, "epoch": 0.06201550387596899, "percentage": 0.62, "elapsed_time": "0:05:24", "remaining_time": "14:26:52"} -{"current_steps": 50, "total_steps": 6450, "loss": 0.8365, "lr": 7.751937984496124e-06, "epoch": 0.07751937984496124, "percentage": 0.78, "elapsed_time": "0:06:45", "remaining_time": "14:24:56"} -{"current_steps": 50, "total_steps": 6450, "eval_loss": 0.720068097114563, "epoch": 0.07751937984496124, "percentage": 0.78, "elapsed_time": "0:09:29", "remaining_time": "20:15:27"} -{"current_steps": 60, "total_steps": 6450, "loss": 0.7544, "lr": 9.302325581395349e-06, "epoch": 0.09302325581395349, "percentage": 0.93, "elapsed_time": "0:10:54", "remaining_time": "19:21:18"} -{"current_steps": 70, "total_steps": 6450, "loss": 0.5623, "lr": 1.0852713178294575e-05, "epoch": 0.10852713178294573, "percentage": 1.09, "elapsed_time": "0:12:15", "remaining_time": "18:36:33"} -{"current_steps": 80, "total_steps": 6450, "loss": 0.3632, "lr": 1.24031007751938e-05, "epoch": 0.12403100775193798, "percentage": 1.24, "elapsed_time": "0:13:35", "remaining_time": "18:02:42"} -{"current_steps": 90, "total_steps": 6450, "loss": 0.2516, "lr": 1.3953488372093024e-05, "epoch": 0.13953488372093023, "percentage": 1.4, "elapsed_time": "0:14:56", "remaining_time": "17:35:56"} -{"current_steps": 100, "total_steps": 6450, "loss": 0.1902, "lr": 1.5503875968992248e-05, "epoch": 0.15503875968992248, "percentage": 1.55, "elapsed_time": "0:16:17", "remaining_time": "17:14:15"} -{"current_steps": 100, "total_steps": 6450, "eval_loss": 0.1545812040567398, "epoch": 0.15503875968992248, "percentage": 1.55, "elapsed_time": "0:19:01", "remaining_time": "20:07:52"} -{"current_steps": 110, "total_steps": 6450, "loss": 0.168, "lr": 1.7054263565891473e-05, "epoch": 0.17054263565891473, "percentage": 1.71, "elapsed_time": "0:20:26", "remaining_time": "19:38:31"} -{"current_steps": 120, "total_steps": 6450, "loss": 0.1196, "lr": 1.8604651162790697e-05, "epoch": 0.18604651162790697, "percentage": 1.86, "elapsed_time": "0:21:47", "remaining_time": "19:09:50"} -{"current_steps": 130, "total_steps": 6450, "loss": 0.1045, "lr": 2.0155038759689922e-05, "epoch": 0.20155038759689922, "percentage": 2.02, "elapsed_time": "0:23:08", "remaining_time": "18:44:54"} -{"current_steps": 140, "total_steps": 6450, "loss": 0.1011, "lr": 2.170542635658915e-05, "epoch": 0.21705426356589147, "percentage": 2.17, "elapsed_time": "0:24:28", "remaining_time": "18:23:17"} -{"current_steps": 150, "total_steps": 6450, "loss": 0.0775, "lr": 2.3255813953488374e-05, "epoch": 0.23255813953488372, "percentage": 2.33, "elapsed_time": "0:25:48", "remaining_time": "18:04:13"} -{"current_steps": 150, "total_steps": 6450, "eval_loss": 0.07378725707530975, "epoch": 0.23255813953488372, "percentage": 2.33, "elapsed_time": "0:28:32", "remaining_time": "19:58:53"} -{"current_steps": 160, "total_steps": 6450, "loss": 0.0897, "lr": 2.48062015503876e-05, "epoch": 0.24806201550387597, "percentage": 2.48, "elapsed_time": "0:29:56", "remaining_time": "19:37:20"} -{"current_steps": 170, "total_steps": 6450, "loss": 0.0751, "lr": 2.6356589147286826e-05, "epoch": 0.26356589147286824, "percentage": 2.64, "elapsed_time": "0:31:17", "remaining_time": "19:16:07"} -{"current_steps": 180, "total_steps": 6450, "loss": 0.0688, "lr": 2.7906976744186048e-05, "epoch": 0.27906976744186046, "percentage": 2.79, "elapsed_time": "0:32:38", "remaining_time": "18:57:02"} -{"current_steps": 190, "total_steps": 6450, "loss": 0.0744, "lr": 2.9457364341085275e-05, "epoch": 0.29457364341085274, "percentage": 2.95, "elapsed_time": "0:33:59", "remaining_time": "18:39:48"} -{"current_steps": 200, "total_steps": 6450, "loss": 0.0669, "lr": 3.1007751937984497e-05, "epoch": 0.31007751937984496, "percentage": 3.1, "elapsed_time": "0:35:19", "remaining_time": "18:23:58"} -{"current_steps": 200, "total_steps": 6450, "eval_loss": 0.0612422414124012, "epoch": 0.31007751937984496, "percentage": 3.1, "elapsed_time": "0:38:03", "remaining_time": "19:49:20"} -{"current_steps": 210, "total_steps": 6450, "loss": 0.0615, "lr": 3.2558139534883724e-05, "epoch": 0.32558139534883723, "percentage": 3.26, "elapsed_time": "0:39:28", "remaining_time": "19:32:55"} -{"current_steps": 220, "total_steps": 6450, "loss": 0.0618, "lr": 3.4108527131782945e-05, "epoch": 0.34108527131782945, "percentage": 3.41, "elapsed_time": "0:40:49", "remaining_time": "19:15:54"} -{"current_steps": 230, "total_steps": 6450, "loss": 0.0657, "lr": 3.565891472868217e-05, "epoch": 0.35658914728682173, "percentage": 3.57, "elapsed_time": "0:42:09", "remaining_time": "19:00:04"} -{"current_steps": 240, "total_steps": 6450, "loss": 0.0813, "lr": 3.7209302325581394e-05, "epoch": 0.37209302325581395, "percentage": 3.72, "elapsed_time": "0:43:29", "remaining_time": "18:45:33"} -{"current_steps": 250, "total_steps": 6450, "loss": 0.0712, "lr": 3.875968992248062e-05, "epoch": 0.3875968992248062, "percentage": 3.88, "elapsed_time": "0:44:50", "remaining_time": "18:32:12"} -{"current_steps": 250, "total_steps": 6450, "eval_loss": 0.055263448506593704, "epoch": 0.3875968992248062, "percentage": 3.88, "elapsed_time": "0:47:34", "remaining_time": "19:40:00"} -{"current_steps": 260, "total_steps": 6450, "loss": 0.0548, "lr": 4.0310077519379843e-05, "epoch": 0.40310077519379844, "percentage": 4.03, "elapsed_time": "0:48:59", "remaining_time": "19:26:20"} -{"current_steps": 270, "total_steps": 6450, "loss": 0.0502, "lr": 4.186046511627907e-05, "epoch": 0.4186046511627907, "percentage": 4.19, "elapsed_time": "0:50:20", "remaining_time": "19:12:15"} -{"current_steps": 280, "total_steps": 6450, "loss": 0.0849, "lr": 4.34108527131783e-05, "epoch": 0.43410852713178294, "percentage": 4.34, "elapsed_time": "0:51:41", "remaining_time": "18:58:54"} -{"current_steps": 290, "total_steps": 6450, "loss": 0.0645, "lr": 4.496124031007753e-05, "epoch": 0.4496124031007752, "percentage": 4.5, "elapsed_time": "0:53:01", "remaining_time": "18:46:21"} -{"current_steps": 300, "total_steps": 6450, "loss": 0.0514, "lr": 4.651162790697675e-05, "epoch": 0.46511627906976744, "percentage": 4.65, "elapsed_time": "0:54:22", "remaining_time": "18:34:31"} -{"current_steps": 300, "total_steps": 6450, "eval_loss": 0.04920719936490059, "epoch": 0.46511627906976744, "percentage": 4.65, "elapsed_time": "0:57:06", "remaining_time": "19:30:33"} -{"current_steps": 310, "total_steps": 6450, "loss": 0.057, "lr": 4.8062015503875976e-05, "epoch": 0.4806201550387597, "percentage": 4.81, "elapsed_time": "0:58:30", "remaining_time": "19:18:54"} -{"current_steps": 320, "total_steps": 6450, "loss": 0.0407, "lr": 4.96124031007752e-05, "epoch": 0.49612403100775193, "percentage": 4.96, "elapsed_time": "0:59:51", "remaining_time": "19:06:41"} -{"current_steps": 330, "total_steps": 6450, "loss": 0.051, "lr": 5.1162790697674425e-05, "epoch": 0.5116279069767442, "percentage": 5.12, "elapsed_time": "1:01:12", "remaining_time": "18:55:00"} -{"current_steps": 340, "total_steps": 6450, "loss": 0.0581, "lr": 5.271317829457365e-05, "epoch": 0.5271317829457365, "percentage": 5.27, "elapsed_time": "1:02:32", "remaining_time": "18:43:52"} -{"current_steps": 350, "total_steps": 6450, "loss": 0.0468, "lr": 5.426356589147287e-05, "epoch": 0.5426356589147286, "percentage": 5.43, "elapsed_time": "1:03:52", "remaining_time": "18:33:19"} -{"current_steps": 350, "total_steps": 6450, "eval_loss": 0.04546884447336197, "epoch": 0.5426356589147286, "percentage": 5.43, "elapsed_time": "1:06:36", "remaining_time": "19:20:58"} -{"current_steps": 360, "total_steps": 6450, "loss": 0.0489, "lr": 5.5813953488372095e-05, "epoch": 0.5581395348837209, "percentage": 5.58, "elapsed_time": "1:08:01", "remaining_time": "19:10:50"} -{"current_steps": 370, "total_steps": 6450, "loss": 0.0631, "lr": 5.736434108527132e-05, "epoch": 0.5736434108527132, "percentage": 5.74, "elapsed_time": "1:09:22", "remaining_time": "19:00:06"} -{"current_steps": 380, "total_steps": 6450, "loss": 0.0668, "lr": 5.891472868217055e-05, "epoch": 0.5891472868217055, "percentage": 5.89, "elapsed_time": "1:10:43", "remaining_time": "18:49:45"} -{"current_steps": 390, "total_steps": 6450, "loss": 0.0601, "lr": 6.0465116279069765e-05, "epoch": 0.6046511627906976, "percentage": 6.05, "elapsed_time": "1:12:04", "remaining_time": "18:39:51"} -{"current_steps": 400, "total_steps": 6450, "loss": 0.0575, "lr": 6.201550387596899e-05, "epoch": 0.6201550387596899, "percentage": 6.2, "elapsed_time": "1:13:24", "remaining_time": "18:30:20"} -{"current_steps": 400, "total_steps": 6450, "eval_loss": 0.04904007911682129, "epoch": 0.6201550387596899, "percentage": 6.2, "elapsed_time": "1:16:08", "remaining_time": "19:11:40"} -{"current_steps": 410, "total_steps": 6450, "loss": 0.0598, "lr": 6.356589147286823e-05, "epoch": 0.6356589147286822, "percentage": 6.36, "elapsed_time": "1:17:33", "remaining_time": "19:02:32"} -{"current_steps": 420, "total_steps": 6450, "loss": 0.0531, "lr": 6.511627906976745e-05, "epoch": 0.6511627906976745, "percentage": 6.51, "elapsed_time": "1:18:54", "remaining_time": "18:52:54"} -{"current_steps": 430, "total_steps": 6450, "loss": 0.0547, "lr": 6.666666666666667e-05, "epoch": 0.6666666666666666, "percentage": 6.67, "elapsed_time": "1:20:15", "remaining_time": "18:43:37"} -{"current_steps": 440, "total_steps": 6450, "loss": 0.0666, "lr": 6.821705426356589e-05, "epoch": 0.6821705426356589, "percentage": 6.82, "elapsed_time": "1:21:36", "remaining_time": "18:34:40"} -{"current_steps": 450, "total_steps": 6450, "loss": 0.0488, "lr": 6.976744186046513e-05, "epoch": 0.6976744186046512, "percentage": 6.98, "elapsed_time": "1:22:56", "remaining_time": "18:25:54"} -{"current_steps": 450, "total_steps": 6450, "eval_loss": 0.04147861525416374, "epoch": 0.6976744186046512, "percentage": 6.98, "elapsed_time": "1:25:40", "remaining_time": "19:02:20"} -{"current_steps": 460, "total_steps": 6450, "loss": 0.0529, "lr": 7.131782945736435e-05, "epoch": 0.7131782945736435, "percentage": 7.13, "elapsed_time": "1:27:05", "remaining_time": "18:54:03"} -{"current_steps": 470, "total_steps": 6450, "loss": 0.0469, "lr": 7.286821705426357e-05, "epoch": 0.7286821705426356, "percentage": 7.29, "elapsed_time": "1:28:26", "remaining_time": "18:45:11"} -{"current_steps": 480, "total_steps": 6450, "loss": 0.0513, "lr": 7.441860465116279e-05, "epoch": 0.7441860465116279, "percentage": 7.44, "elapsed_time": "1:29:47", "remaining_time": "18:36:41"} -{"current_steps": 490, "total_steps": 6450, "loss": 0.0456, "lr": 7.596899224806202e-05, "epoch": 0.7596899224806202, "percentage": 7.6, "elapsed_time": "1:31:07", "remaining_time": "18:28:25"} -{"current_steps": 500, "total_steps": 6450, "loss": 0.0531, "lr": 7.751937984496124e-05, "epoch": 0.7751937984496124, "percentage": 7.75, "elapsed_time": "1:32:28", "remaining_time": "18:20:28"} -{"current_steps": 500, "total_steps": 6450, "eval_loss": 0.04052061215043068, "epoch": 0.7751937984496124, "percentage": 7.75, "elapsed_time": "1:35:12", "remaining_time": "18:52:59"} -{"current_steps": 510, "total_steps": 6450, "loss": 0.045, "lr": 7.906976744186047e-05, "epoch": 0.7906976744186046, "percentage": 7.91, "elapsed_time": "1:36:36", "remaining_time": "18:45:12"} -{"current_steps": 520, "total_steps": 6450, "loss": 0.0412, "lr": 8.062015503875969e-05, "epoch": 0.8062015503875969, "percentage": 8.06, "elapsed_time": "1:37:57", "remaining_time": "18:37:01"} -{"current_steps": 530, "total_steps": 6450, "loss": 0.0522, "lr": 8.217054263565892e-05, "epoch": 0.8217054263565892, "percentage": 8.22, "elapsed_time": "1:39:17", "remaining_time": "18:29:07"} -{"current_steps": 540, "total_steps": 6450, "loss": 0.042, "lr": 8.372093023255814e-05, "epoch": 0.8372093023255814, "percentage": 8.37, "elapsed_time": "1:40:38", "remaining_time": "18:21:26"} -{"current_steps": 550, "total_steps": 6450, "loss": 0.0495, "lr": 8.527131782945736e-05, "epoch": 0.8527131782945736, "percentage": 8.53, "elapsed_time": "1:41:58", "remaining_time": "18:13:57"} -{"current_steps": 550, "total_steps": 6450, "eval_loss": 0.04120254144072533, "epoch": 0.8527131782945736, "percentage": 8.53, "elapsed_time": "1:44:42", "remaining_time": "18:43:15"} -{"current_steps": 560, "total_steps": 6450, "loss": 0.0517, "lr": 8.68217054263566e-05, "epoch": 0.8682170542635659, "percentage": 8.68, "elapsed_time": "1:46:07", "remaining_time": "18:36:11"} -{"current_steps": 570, "total_steps": 6450, "loss": 0.049, "lr": 8.837209302325582e-05, "epoch": 0.8837209302325582, "percentage": 8.84, "elapsed_time": "1:47:28", "remaining_time": "18:28:40"} -{"current_steps": 580, "total_steps": 6450, "loss": 0.0373, "lr": 8.992248062015505e-05, "epoch": 0.8992248062015504, "percentage": 8.99, "elapsed_time": "1:48:49", "remaining_time": "18:21:19"} -{"current_steps": 590, "total_steps": 6450, "loss": 0.0398, "lr": 9.147286821705426e-05, "epoch": 0.9147286821705426, "percentage": 9.15, "elapsed_time": "1:50:09", "remaining_time": "18:14:08"} -{"current_steps": 600, "total_steps": 6450, "loss": 0.0682, "lr": 9.30232558139535e-05, "epoch": 0.9302325581395349, "percentage": 9.3, "elapsed_time": "1:51:30", "remaining_time": "18:07:09"} -{"current_steps": 600, "total_steps": 6450, "eval_loss": 0.05146737024188042, "epoch": 0.9302325581395349, "percentage": 9.3, "elapsed_time": "1:54:14", "remaining_time": "18:33:49"} -{"current_steps": 610, "total_steps": 6450, "loss": 0.0478, "lr": 9.457364341085272e-05, "epoch": 0.9457364341085271, "percentage": 9.46, "elapsed_time": "1:55:39", "remaining_time": "18:27:16"} -{"current_steps": 620, "total_steps": 6450, "loss": 0.0433, "lr": 9.612403100775195e-05, "epoch": 0.9612403100775194, "percentage": 9.61, "elapsed_time": "1:57:00", "remaining_time": "18:20:16"} -{"current_steps": 630, "total_steps": 6450, "loss": 0.0428, "lr": 9.767441860465116e-05, "epoch": 0.9767441860465116, "percentage": 9.77, "elapsed_time": "1:58:21", "remaining_time": "18:13:22"} -{"current_steps": 640, "total_steps": 6450, "loss": 0.055, "lr": 9.92248062015504e-05, "epoch": 0.9922480620155039, "percentage": 9.92, "elapsed_time": "1:59:42", "remaining_time": "18:06:40"} -{"current_steps": 650, "total_steps": 6450, "loss": 0.0391, "lr": 9.99998169477592e-05, "epoch": 1.0077519379844961, "percentage": 10.08, "elapsed_time": "2:01:02", "remaining_time": "18:00:04"} -{"current_steps": 650, "total_steps": 6450, "eval_loss": 0.038673676550388336, "epoch": 1.0077519379844961, "percentage": 10.08, "elapsed_time": "2:03:46", "remaining_time": "18:24:27"} -{"current_steps": 660, "total_steps": 6450, "loss": 0.0371, "lr": 9.999835253787473e-05, "epoch": 1.0232558139534884, "percentage": 10.23, "elapsed_time": "2:05:11", "remaining_time": "18:18:15"} -{"current_steps": 670, "total_steps": 6450, "loss": 0.0537, "lr": 9.999542376099589e-05, "epoch": 1.0387596899224807, "percentage": 10.39, "elapsed_time": "2:06:32", "remaining_time": "18:11:40"} -{"current_steps": 680, "total_steps": 6450, "loss": 0.0294, "lr": 9.999103070290155e-05, "epoch": 1.054263565891473, "percentage": 10.54, "elapsed_time": "2:07:53", "remaining_time": "18:05:12"} -{"current_steps": 690, "total_steps": 6450, "loss": 0.0394, "lr": 9.998517349225698e-05, "epoch": 1.069767441860465, "percentage": 10.7, "elapsed_time": "2:09:14", "remaining_time": "17:58:51"} -{"current_steps": 700, "total_steps": 6450, "loss": 0.0372, "lr": 9.997785230060993e-05, "epoch": 1.0852713178294573, "percentage": 10.85, "elapsed_time": "2:10:34", "remaining_time": "17:52:35"} -{"current_steps": 700, "total_steps": 6450, "eval_loss": 0.040567439049482346, "epoch": 1.0852713178294573, "percentage": 10.85, "elapsed_time": "2:13:18", "remaining_time": "18:15:02"} -{"current_steps": 710, "total_steps": 6450, "loss": 0.0325, "lr": 9.996906734238567e-05, "epoch": 1.1007751937984496, "percentage": 11.01, "elapsed_time": "2:14:43", "remaining_time": "18:09:08"} -{"current_steps": 720, "total_steps": 6450, "loss": 0.0416, "lr": 9.99588188748808e-05, "epoch": 1.1162790697674418, "percentage": 11.16, "elapsed_time": "2:16:04", "remaining_time": "18:02:52"} -{"current_steps": 730, "total_steps": 6450, "loss": 0.0375, "lr": 9.994710719825549e-05, "epoch": 1.1317829457364341, "percentage": 11.32, "elapsed_time": "2:17:24", "remaining_time": "17:56:42"} -{"current_steps": 740, "total_steps": 6450, "loss": 0.0512, "lr": 9.993393265552493e-05, "epoch": 1.1472868217054264, "percentage": 11.47, "elapsed_time": "2:18:45", "remaining_time": "17:50:41"} -{"current_steps": 750, "total_steps": 6450, "loss": 0.0337, "lr": 9.991929563254914e-05, "epoch": 1.1627906976744187, "percentage": 11.63, "elapsed_time": "2:20:05", "remaining_time": "17:44:45"} -{"current_steps": 750, "total_steps": 6450, "eval_loss": 0.03701839596033096, "epoch": 1.1627906976744187, "percentage": 11.63, "elapsed_time": "2:22:49", "remaining_time": "18:05:30"} -{"current_steps": 760, "total_steps": 6450, "loss": 0.043, "lr": 9.990319655802171e-05, "epoch": 1.178294573643411, "percentage": 11.78, "elapsed_time": "2:24:15", "remaining_time": "18:00:03"} -{"current_steps": 770, "total_steps": 6450, "loss": 0.0359, "lr": 9.988563590345727e-05, "epoch": 1.193798449612403, "percentage": 11.94, "elapsed_time": "2:25:36", "remaining_time": "17:54:05"} -{"current_steps": 780, "total_steps": 6450, "loss": 0.0354, "lr": 9.986661418317759e-05, "epoch": 1.2093023255813953, "percentage": 12.09, "elapsed_time": "2:26:57", "remaining_time": "17:48:16"} -{"current_steps": 790, "total_steps": 6450, "loss": 0.0389, "lr": 9.984613195429662e-05, "epoch": 1.2248062015503876, "percentage": 12.25, "elapsed_time": "2:28:18", "remaining_time": "17:42:33"} -{"current_steps": 800, "total_steps": 6450, "loss": 0.0292, "lr": 9.982418981670414e-05, "epoch": 1.2403100775193798, "percentage": 12.4, "elapsed_time": "2:29:39", "remaining_time": "17:36:56"} -{"current_steps": 800, "total_steps": 6450, "eval_loss": 0.04220827668905258, "epoch": 1.2403100775193798, "percentage": 12.4, "elapsed_time": "2:32:23", "remaining_time": "17:56:16"} -{"current_steps": 810, "total_steps": 6450, "loss": 0.0349, "lr": 9.980078841304816e-05, "epoch": 1.255813953488372, "percentage": 12.56, "elapsed_time": "2:33:48", "remaining_time": "17:51:00"} -{"current_steps": 820, "total_steps": 6450, "loss": 0.041, "lr": 9.977592842871611e-05, "epoch": 1.2713178294573644, "percentage": 12.71, "elapsed_time": "2:35:09", "remaining_time": "17:45:17"} -{"current_steps": 830, "total_steps": 6450, "loss": 0.0453, "lr": 9.974961059181482e-05, "epoch": 1.2868217054263567, "percentage": 12.87, "elapsed_time": "2:36:30", "remaining_time": "17:39:43"} -{"current_steps": 840, "total_steps": 6450, "loss": 0.0398, "lr": 9.97218356731491e-05, "epoch": 1.302325581395349, "percentage": 13.02, "elapsed_time": "2:37:51", "remaining_time": "17:34:15"} -{"current_steps": 850, "total_steps": 6450, "loss": 0.0394, "lr": 9.969260448619924e-05, "epoch": 1.3178294573643412, "percentage": 13.18, "elapsed_time": "2:39:11", "remaining_time": "17:28:50"} -{"current_steps": 850, "total_steps": 6450, "eval_loss": 0.035287585109472275, "epoch": 1.3178294573643412, "percentage": 13.18, "elapsed_time": "2:41:56", "remaining_time": "17:46:52"} -{"current_steps": 860, "total_steps": 6450, "loss": 0.0377, "lr": 9.966191788709716e-05, "epoch": 1.3333333333333333, "percentage": 13.33, "elapsed_time": "2:43:20", "remaining_time": "17:41:45"} -{"current_steps": 870, "total_steps": 6450, "loss": 0.0298, "lr": 9.962977677460132e-05, "epoch": 1.3488372093023255, "percentage": 13.49, "elapsed_time": "2:44:41", "remaining_time": "17:36:18"} -{"current_steps": 880, "total_steps": 6450, "loss": 0.0501, "lr": 9.959618209007044e-05, "epoch": 1.3643410852713178, "percentage": 13.64, "elapsed_time": "2:46:02", "remaining_time": "17:30:58"} -{"current_steps": 890, "total_steps": 6450, "loss": 0.0325, "lr": 9.956113481743589e-05, "epoch": 1.37984496124031, "percentage": 13.8, "elapsed_time": "2:47:23", "remaining_time": "17:25:42"} -{"current_steps": 900, "total_steps": 6450, "loss": 0.0454, "lr": 9.952463598317285e-05, "epoch": 1.3953488372093024, "percentage": 13.95, "elapsed_time": "2:48:43", "remaining_time": "17:20:28"} -{"current_steps": 900, "total_steps": 6450, "eval_loss": 0.036218829452991486, "epoch": 1.3953488372093024, "percentage": 13.95, "elapsed_time": "2:51:27", "remaining_time": "17:37:21"} -{"current_steps": 910, "total_steps": 6450, "loss": 0.0332, "lr": 9.948668665627034e-05, "epoch": 1.4108527131782946, "percentage": 14.11, "elapsed_time": "2:52:52", "remaining_time": "17:32:26"} -{"current_steps": 920, "total_steps": 6450, "loss": 0.0342, "lr": 9.94472879481998e-05, "epoch": 1.4263565891472867, "percentage": 14.26, "elapsed_time": "2:54:13", "remaining_time": "17:27:12"} -{"current_steps": 930, "total_steps": 6450, "loss": 0.0371, "lr": 9.940644101288259e-05, "epoch": 1.441860465116279, "percentage": 14.42, "elapsed_time": "2:55:33", "remaining_time": "17:22:04"} -{"current_steps": 940, "total_steps": 6450, "loss": 0.0378, "lr": 9.936414704665622e-05, "epoch": 1.4573643410852712, "percentage": 14.57, "elapsed_time": "2:56:55", "remaining_time": "17:17:04"} -{"current_steps": 950, "total_steps": 6450, "loss": 0.0457, "lr": 9.932040728823929e-05, "epoch": 1.4728682170542635, "percentage": 14.73, "elapsed_time": "2:58:16", "remaining_time": "17:12:04"} -{"current_steps": 950, "total_steps": 6450, "eval_loss": 0.037599749863147736, "epoch": 1.4728682170542635, "percentage": 14.73, "elapsed_time": "3:01:00", "remaining_time": "17:27:55"} -{"current_steps": 960, "total_steps": 6450, "loss": 0.042, "lr": 9.927522301869515e-05, "epoch": 1.4883720930232558, "percentage": 14.88, "elapsed_time": "3:02:26", "remaining_time": "17:23:17"} -{"current_steps": 970, "total_steps": 6450, "loss": 0.0362, "lr": 9.922859556139446e-05, "epoch": 1.503875968992248, "percentage": 15.04, "elapsed_time": "3:03:46", "remaining_time": "17:18:15"} -{"current_steps": 980, "total_steps": 6450, "loss": 0.041, "lr": 9.918052628197645e-05, "epoch": 1.5193798449612403, "percentage": 15.19, "elapsed_time": "3:05:07", "remaining_time": "17:13:19"} -{"current_steps": 990, "total_steps": 6450, "loss": 0.0307, "lr": 9.91310165883088e-05, "epoch": 1.5348837209302326, "percentage": 15.35, "elapsed_time": "3:06:28", "remaining_time": "17:08:26"} -{"current_steps": 1000, "total_steps": 6450, "loss": 0.0299, "lr": 9.90800679304465e-05, "epoch": 1.550387596899225, "percentage": 15.5, "elapsed_time": "3:07:49", "remaining_time": "17:03:37"} -{"current_steps": 1000, "total_steps": 6450, "eval_loss": 0.038449838757514954, "epoch": 1.550387596899225, "percentage": 15.5, "elapsed_time": "3:10:33", "remaining_time": "17:18:32"} -{"current_steps": 1010, "total_steps": 6450, "loss": 0.0461, "lr": 9.902768180058941e-05, "epoch": 1.5658914728682172, "percentage": 15.66, "elapsed_time": "3:11:58", "remaining_time": "17:13:58"} -{"current_steps": 1020, "total_steps": 6450, "loss": 0.0441, "lr": 9.897385973303845e-05, "epoch": 1.5813953488372094, "percentage": 15.81, "elapsed_time": "3:13:18", "remaining_time": "17:09:07"} -{"current_steps": 1030, "total_steps": 6450, "loss": 0.0351, "lr": 9.891860330415077e-05, "epoch": 1.5968992248062015, "percentage": 15.97, "elapsed_time": "3:14:40", "remaining_time": "17:04:23"} -{"current_steps": 1040, "total_steps": 6450, "loss": 0.0379, "lr": 9.886191413229349e-05, "epoch": 1.6124031007751938, "percentage": 16.12, "elapsed_time": "3:16:01", "remaining_time": "16:59:40"} -{"current_steps": 1050, "total_steps": 6450, "loss": 0.0375, "lr": 9.880379387779637e-05, "epoch": 1.627906976744186, "percentage": 16.28, "elapsed_time": "3:17:21", "remaining_time": "16:55:00"} -{"current_steps": 1050, "total_steps": 6450, "eval_loss": 0.03629838302731514, "epoch": 1.627906976744186, "percentage": 16.28, "elapsed_time": "3:20:06", "remaining_time": "17:09:05"} -{"current_steps": 1060, "total_steps": 6450, "loss": 0.0333, "lr": 9.874424424290313e-05, "epoch": 1.6434108527131783, "percentage": 16.43, "elapsed_time": "3:21:31", "remaining_time": "17:04:44"} -{"current_steps": 1070, "total_steps": 6450, "loss": 0.0313, "lr": 9.868326697172164e-05, "epoch": 1.6589147286821704, "percentage": 16.59, "elapsed_time": "3:22:53", "remaining_time": "17:00:06"} -{"current_steps": 1080, "total_steps": 6450, "loss": 0.0398, "lr": 9.862086385017283e-05, "epoch": 1.6744186046511627, "percentage": 16.74, "elapsed_time": "3:24:14", "remaining_time": "16:55:31"} -{"current_steps": 1090, "total_steps": 6450, "loss": 0.038, "lr": 9.855703670593834e-05, "epoch": 1.689922480620155, "percentage": 16.9, "elapsed_time": "3:25:34", "remaining_time": "16:50:56"} -{"current_steps": 1100, "total_steps": 6450, "loss": 0.0266, "lr": 9.849178740840701e-05, "epoch": 1.7054263565891472, "percentage": 17.05, "elapsed_time": "3:26:55", "remaining_time": "16:46:24"} -{"current_steps": 1100, "total_steps": 6450, "eval_loss": 0.03744375705718994, "epoch": 1.7054263565891472, "percentage": 17.05, "elapsed_time": "3:29:39", "remaining_time": "16:59:42"} -{"current_steps": 1110, "total_steps": 6450, "loss": 0.0531, "lr": 9.842511786862019e-05, "epoch": 1.7209302325581395, "percentage": 17.21, "elapsed_time": "3:31:04", "remaining_time": "16:55:24"} -{"current_steps": 1120, "total_steps": 6450, "loss": 0.0381, "lr": 9.835703003921568e-05, "epoch": 1.7364341085271318, "percentage": 17.36, "elapsed_time": "3:32:25", "remaining_time": "16:50:53"} -{"current_steps": 1130, "total_steps": 6450, "loss": 0.0345, "lr": 9.828752591437061e-05, "epoch": 1.751937984496124, "percentage": 17.52, "elapsed_time": "3:33:45", "remaining_time": "16:46:22"} -{"current_steps": 1140, "total_steps": 6450, "loss": 0.0318, "lr": 9.821660752974293e-05, "epoch": 1.7674418604651163, "percentage": 17.67, "elapsed_time": "3:35:06", "remaining_time": "16:41:56"} -{"current_steps": 1150, "total_steps": 6450, "loss": 0.0385, "lr": 9.814427696241196e-05, "epoch": 1.7829457364341086, "percentage": 17.83, "elapsed_time": "3:36:27", "remaining_time": "16:37:33"} -{"current_steps": 1150, "total_steps": 6450, "eval_loss": 0.03696512430906296, "epoch": 1.7829457364341086, "percentage": 17.83, "elapsed_time": "3:39:11", "remaining_time": "16:50:10"} -{"current_steps": 1160, "total_steps": 6450, "loss": 0.025, "lr": 9.807053633081739e-05, "epoch": 1.7984496124031009, "percentage": 17.98, "elapsed_time": "3:40:36", "remaining_time": "16:46:04"} -{"current_steps": 1170, "total_steps": 6450, "loss": 0.0299, "lr": 9.799538779469734e-05, "epoch": 1.8139534883720931, "percentage": 18.14, "elapsed_time": "3:41:57", "remaining_time": "16:41:41"} -{"current_steps": 1180, "total_steps": 6450, "loss": 0.029, "lr": 9.791883355502502e-05, "epoch": 1.8294573643410854, "percentage": 18.29, "elapsed_time": "3:43:18", "remaining_time": "16:37:20"} -{"current_steps": 1190, "total_steps": 6450, "loss": 0.0329, "lr": 9.784087585394437e-05, "epoch": 1.8449612403100775, "percentage": 18.45, "elapsed_time": "3:44:39", "remaining_time": "16:33:01"} -{"current_steps": 1200, "total_steps": 6450, "loss": 0.0365, "lr": 9.77615169747043e-05, "epoch": 1.8604651162790697, "percentage": 18.6, "elapsed_time": "3:46:00", "remaining_time": "16:28:46"} -{"current_steps": 1200, "total_steps": 6450, "eval_loss": 0.03505348786711693, "epoch": 1.8604651162790697, "percentage": 18.6, "elapsed_time": "3:48:44", "remaining_time": "16:40:44"} -{"current_steps": 1210, "total_steps": 6450, "loss": 0.0324, "lr": 9.768075924159185e-05, "epoch": 1.875968992248062, "percentage": 18.76, "elapsed_time": "3:50:09", "remaining_time": "16:36:45"} -{"current_steps": 1220, "total_steps": 6450, "loss": 0.0427, "lr": 9.759860501986417e-05, "epoch": 1.8914728682170543, "percentage": 18.91, "elapsed_time": "3:51:30", "remaining_time": "16:32:28"} -{"current_steps": 1230, "total_steps": 6450, "loss": 0.0374, "lr": 9.751505671567913e-05, "epoch": 1.9069767441860463, "percentage": 19.07, "elapsed_time": "3:52:51", "remaining_time": "16:28:14"} -{"current_steps": 1240, "total_steps": 6450, "loss": 0.0343, "lr": 9.743011677602493e-05, "epoch": 1.9224806201550386, "percentage": 19.22, "elapsed_time": "3:54:12", "remaining_time": "16:24:02"} -{"current_steps": 1250, "total_steps": 6450, "loss": 0.0399, "lr": 9.734378768864843e-05, "epoch": 1.937984496124031, "percentage": 19.38, "elapsed_time": "3:55:33", "remaining_time": "16:19:54"} -{"current_steps": 1250, "total_steps": 6450, "eval_loss": 0.03432035446166992, "epoch": 1.937984496124031, "percentage": 19.38, "elapsed_time": "3:58:17", "remaining_time": "16:31:18"} -{"current_steps": 1260, "total_steps": 6450, "loss": 0.0524, "lr": 9.725607198198227e-05, "epoch": 1.9534883720930232, "percentage": 19.53, "elapsed_time": "3:59:42", "remaining_time": "16:27:24"} -{"current_steps": 1270, "total_steps": 6450, "loss": 0.0377, "lr": 9.71669722250708e-05, "epoch": 1.9689922480620154, "percentage": 19.69, "elapsed_time": "4:01:04", "remaining_time": "16:23:14"} -{"current_steps": 1280, "total_steps": 6450, "loss": 0.0428, "lr": 9.707649102749489e-05, "epoch": 1.9844961240310077, "percentage": 19.84, "elapsed_time": "4:02:24", "remaining_time": "16:19:06"} -{"current_steps": 1290, "total_steps": 6450, "loss": 0.0369, "lr": 9.698463103929542e-05, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "4:03:45", "remaining_time": "16:15:01"} -{"current_steps": 1300, "total_steps": 6450, "loss": 0.0331, "lr": 9.689139495089575e-05, "epoch": 2.0155038759689923, "percentage": 20.16, "elapsed_time": "4:05:06", "remaining_time": "16:10:58"} -{"current_steps": 1300, "total_steps": 6450, "eval_loss": 0.03468600660562515, "epoch": 2.0155038759689923, "percentage": 20.16, "elapsed_time": "4:07:50", "remaining_time": "16:21:49"} -{"current_steps": 1310, "total_steps": 6450, "loss": 0.0289, "lr": 9.679678549302287e-05, "epoch": 2.0310077519379846, "percentage": 20.31, "elapsed_time": "4:09:16", "remaining_time": "16:18:03"} -{"current_steps": 1320, "total_steps": 6450, "loss": 0.0249, "lr": 9.67008054366274e-05, "epoch": 2.046511627906977, "percentage": 20.47, "elapsed_time": "4:10:37", "remaining_time": "16:14:00"} -{"current_steps": 1330, "total_steps": 6450, "loss": 0.0192, "lr": 9.660345759280254e-05, "epoch": 2.062015503875969, "percentage": 20.62, "elapsed_time": "4:11:57", "remaining_time": "16:09:58"} -{"current_steps": 1340, "total_steps": 6450, "loss": 0.026, "lr": 9.650474481270158e-05, "epoch": 2.0775193798449614, "percentage": 20.78, "elapsed_time": "4:13:18", "remaining_time": "16:05:59"} -{"current_steps": 1350, "total_steps": 6450, "loss": 0.0234, "lr": 9.640466998745456e-05, "epoch": 2.0930232558139537, "percentage": 20.93, "elapsed_time": "4:14:39", "remaining_time": "16:02:03"} -{"current_steps": 1350, "total_steps": 6450, "eval_loss": 0.03671898692846298, "epoch": 2.0930232558139537, "percentage": 20.93, "elapsed_time": "4:17:24", "remaining_time": "16:12:24"} -{"current_steps": 1360, "total_steps": 6450, "loss": 0.0301, "lr": 9.630323604808344e-05, "epoch": 2.108527131782946, "percentage": 21.09, "elapsed_time": "4:18:49", "remaining_time": "16:08:42"} -{"current_steps": 1370, "total_steps": 6450, "loss": 0.0237, "lr": 9.62004459654164e-05, "epoch": 2.124031007751938, "percentage": 21.24, "elapsed_time": "4:20:10", "remaining_time": "16:04:45"} -{"current_steps": 1380, "total_steps": 6450, "loss": 0.0269, "lr": 9.609630275000072e-05, "epoch": 2.13953488372093, "percentage": 21.4, "elapsed_time": "4:21:31", "remaining_time": "16:00:51"} -{"current_steps": 1390, "total_steps": 6450, "loss": 0.0247, "lr": 9.599080945201462e-05, "epoch": 2.1550387596899223, "percentage": 21.55, "elapsed_time": "4:22:53", "remaining_time": "15:56:59"} -{"current_steps": 1400, "total_steps": 6450, "loss": 0.0241, "lr": 9.588396916117799e-05, "epoch": 2.1705426356589146, "percentage": 21.71, "elapsed_time": "4:24:13", "remaining_time": "15:53:07"} -{"current_steps": 1400, "total_steps": 6450, "eval_loss": 0.03474796190857887, "epoch": 2.1705426356589146, "percentage": 21.71, "elapsed_time": "4:26:58", "remaining_time": "16:03:00"} -{"current_steps": 1410, "total_steps": 6450, "loss": 0.0217, "lr": 9.577578500666187e-05, "epoch": 2.186046511627907, "percentage": 21.86, "elapsed_time": "4:28:23", "remaining_time": "15:59:21"} -{"current_steps": 1420, "total_steps": 6450, "loss": 0.0223, "lr": 9.566626015699672e-05, "epoch": 2.201550387596899, "percentage": 22.02, "elapsed_time": "4:29:44", "remaining_time": "15:55:28"} -{"current_steps": 1430, "total_steps": 6450, "loss": 0.0366, "lr": 9.555539781997977e-05, "epoch": 2.2170542635658914, "percentage": 22.17, "elapsed_time": "4:31:04", "remaining_time": "15:51:38"} -{"current_steps": 1440, "total_steps": 6450, "loss": 0.0265, "lr": 9.544320124258092e-05, "epoch": 2.2325581395348837, "percentage": 22.33, "elapsed_time": "4:32:25", "remaining_time": "15:47:48"} -{"current_steps": 1450, "total_steps": 6450, "loss": 0.0208, "lr": 9.532967371084778e-05, "epoch": 2.248062015503876, "percentage": 22.48, "elapsed_time": "4:33:46", "remaining_time": "15:44:03"} -{"current_steps": 1450, "total_steps": 6450, "eval_loss": 0.03416348248720169, "epoch": 2.248062015503876, "percentage": 22.48, "elapsed_time": "4:36:30", "remaining_time": "15:53:30"} -{"current_steps": 1460, "total_steps": 6450, "loss": 0.0227, "lr": 9.521481854980929e-05, "epoch": 2.2635658914728682, "percentage": 22.64, "elapsed_time": "4:37:56", "remaining_time": "15:49:57"} -{"current_steps": 1470, "total_steps": 6450, "loss": 0.0204, "lr": 9.509863912337842e-05, "epoch": 2.2790697674418605, "percentage": 22.79, "elapsed_time": "4:39:17", "remaining_time": "15:46:10"} -{"current_steps": 1480, "total_steps": 6450, "loss": 0.0364, "lr": 9.498113883425364e-05, "epoch": 2.294573643410853, "percentage": 22.95, "elapsed_time": "4:40:38", "remaining_time": "15:42:26"} -{"current_steps": 1490, "total_steps": 6450, "loss": 0.0221, "lr": 9.486232112381925e-05, "epoch": 2.310077519379845, "percentage": 23.1, "elapsed_time": "4:41:59", "remaining_time": "15:38:42"} -{"current_steps": 1500, "total_steps": 6450, "loss": 0.0321, "lr": 9.474218947204459e-05, "epoch": 2.3255813953488373, "percentage": 23.26, "elapsed_time": "4:43:20", "remaining_time": "15:35:00"} -{"current_steps": 1500, "total_steps": 6450, "eval_loss": 0.03633042424917221, "epoch": 2.3255813953488373, "percentage": 23.26, "elapsed_time": "4:46:04", "remaining_time": "15:44:03"} -{"current_steps": 1510, "total_steps": 6450, "loss": 0.0191, "lr": 9.462074739738211e-05, "epoch": 2.3410852713178296, "percentage": 23.41, "elapsed_time": "4:47:29", "remaining_time": "15:40:32"} -{"current_steps": 1520, "total_steps": 6450, "loss": 0.036, "lr": 9.44979984566643e-05, "epoch": 2.356589147286822, "percentage": 23.57, "elapsed_time": "4:48:50", "remaining_time": "15:36:49"} -{"current_steps": 1530, "total_steps": 6450, "loss": 0.0254, "lr": 9.437394624499958e-05, "epoch": 2.3720930232558137, "percentage": 23.72, "elapsed_time": "4:50:11", "remaining_time": "15:33:08"} -{"current_steps": 1540, "total_steps": 6450, "loss": 0.0243, "lr": 9.424859439566696e-05, "epoch": 2.387596899224806, "percentage": 23.88, "elapsed_time": "4:51:31", "remaining_time": "15:29:28"} -{"current_steps": 1550, "total_steps": 6450, "loss": 0.0193, "lr": 9.41219465800096e-05, "epoch": 2.4031007751937983, "percentage": 24.03, "elapsed_time": "4:52:52", "remaining_time": "15:25:50"} -{"current_steps": 1550, "total_steps": 6450, "eval_loss": 0.03856610879302025, "epoch": 2.4031007751937983, "percentage": 24.03, "elapsed_time": "4:55:36", "remaining_time": "15:34:30"} -{"current_steps": 1560, "total_steps": 6450, "loss": 0.0286, "lr": 9.399400650732735e-05, "epoch": 2.4186046511627906, "percentage": 24.19, "elapsed_time": "4:57:00", "remaining_time": "15:31:01"} -{"current_steps": 1570, "total_steps": 6450, "loss": 0.0232, "lr": 9.386477792476807e-05, "epoch": 2.434108527131783, "percentage": 24.34, "elapsed_time": "4:58:21", "remaining_time": "15:27:22"} -{"current_steps": 1580, "total_steps": 6450, "loss": 0.0223, "lr": 9.37342646172179e-05, "epoch": 2.449612403100775, "percentage": 24.5, "elapsed_time": "4:59:41", "remaining_time": "15:23:45"} -{"current_steps": 1590, "total_steps": 6450, "loss": 0.0278, "lr": 9.360247040719039e-05, "epoch": 2.4651162790697674, "percentage": 24.65, "elapsed_time": "5:01:02", "remaining_time": "15:20:10"} -{"current_steps": 1600, "total_steps": 6450, "loss": 0.0285, "lr": 9.346939915471453e-05, "epoch": 2.4806201550387597, "percentage": 24.81, "elapsed_time": "5:02:22", "remaining_time": "15:16:35"} -{"current_steps": 1600, "total_steps": 6450, "eval_loss": 0.03571667522192001, "epoch": 2.4806201550387597, "percentage": 24.81, "elapsed_time": "5:05:07", "remaining_time": "15:24:53"} -{"current_steps": 1610, "total_steps": 6450, "loss": 0.0335, "lr": 9.333505475722175e-05, "epoch": 2.496124031007752, "percentage": 24.96, "elapsed_time": "5:06:33", "remaining_time": "15:21:35"} -{"current_steps": 1620, "total_steps": 6450, "loss": 0.0248, "lr": 9.319944114943171e-05, "epoch": 2.511627906976744, "percentage": 25.12, "elapsed_time": "5:07:54", "remaining_time": "15:18:00"} -{"current_steps": 1630, "total_steps": 6450, "loss": 0.0342, "lr": 9.306256230323715e-05, "epoch": 2.5271317829457365, "percentage": 25.27, "elapsed_time": "5:09:15", "remaining_time": "15:14:28"} -{"current_steps": 1640, "total_steps": 6450, "loss": 0.029, "lr": 9.29244222275874e-05, "epoch": 2.5426356589147288, "percentage": 25.43, "elapsed_time": "5:10:35", "remaining_time": "15:10:58"} -{"current_steps": 1650, "total_steps": 6450, "loss": 0.0422, "lr": 9.278502496837116e-05, "epoch": 2.558139534883721, "percentage": 25.58, "elapsed_time": "5:11:56", "remaining_time": "15:07:28"} -{"current_steps": 1650, "total_steps": 6450, "eval_loss": 0.035971496254205704, "epoch": 2.558139534883721, "percentage": 25.58, "elapsed_time": "5:14:40", "remaining_time": "15:15:26"} -{"current_steps": 1660, "total_steps": 6450, "loss": 0.0265, "lr": 9.264437460829782e-05, "epoch": 2.5736434108527133, "percentage": 25.74, "elapsed_time": "5:16:06", "remaining_time": "15:12:08"} -{"current_steps": 1670, "total_steps": 6450, "loss": 0.0319, "lr": 9.250247526677806e-05, "epoch": 2.5891472868217056, "percentage": 25.89, "elapsed_time": "5:17:27", "remaining_time": "15:08:37"} -{"current_steps": 1680, "total_steps": 6450, "loss": 0.0239, "lr": 9.235933109980301e-05, "epoch": 2.604651162790698, "percentage": 26.05, "elapsed_time": "5:18:47", "remaining_time": "15:05:09"} -{"current_steps": 1690, "total_steps": 6450, "loss": 0.0273, "lr": 9.221494629982273e-05, "epoch": 2.62015503875969, "percentage": 26.2, "elapsed_time": "5:20:08", "remaining_time": "15:01:42"} -{"current_steps": 1700, "total_steps": 6450, "loss": 0.0223, "lr": 9.206932509562325e-05, "epoch": 2.6356589147286824, "percentage": 26.36, "elapsed_time": "5:21:29", "remaining_time": "14:58:16"} -{"current_steps": 1700, "total_steps": 6450, "eval_loss": 0.039764828979969025, "epoch": 2.6356589147286824, "percentage": 26.36, "elapsed_time": "5:24:13", "remaining_time": "15:05:55"} -{"current_steps": 1710, "total_steps": 6450, "loss": 0.0259, "lr": 9.192247175220276e-05, "epoch": 2.6511627906976747, "percentage": 26.51, "elapsed_time": "5:25:39", "remaining_time": "15:02:41"} -{"current_steps": 1720, "total_steps": 6450, "loss": 0.0228, "lr": 9.177439057064683e-05, "epoch": 2.6666666666666665, "percentage": 26.67, "elapsed_time": "5:26:59", "remaining_time": "14:59:14"} -{"current_steps": 1730, "total_steps": 6450, "loss": 0.0217, "lr": 9.16250858880022e-05, "epoch": 2.682170542635659, "percentage": 26.82, "elapsed_time": "5:28:20", "remaining_time": "14:55:49"} -{"current_steps": 1740, "total_steps": 6450, "loss": 0.025, "lr": 9.147456207714997e-05, "epoch": 2.697674418604651, "percentage": 26.98, "elapsed_time": "5:29:41", "remaining_time": "14:52:25"} -{"current_steps": 1750, "total_steps": 6450, "loss": 0.0222, "lr": 9.13228235466774e-05, "epoch": 2.7131782945736433, "percentage": 27.13, "elapsed_time": "5:31:01", "remaining_time": "14:49:02"} -{"current_steps": 1750, "total_steps": 6450, "eval_loss": 0.039446908980607986, "epoch": 2.7131782945736433, "percentage": 27.13, "elapsed_time": "5:33:46", "remaining_time": "14:56:24"} -{"current_steps": 1760, "total_steps": 6450, "loss": 0.0378, "lr": 9.116987474074884e-05, "epoch": 2.7286821705426356, "percentage": 27.29, "elapsed_time": "5:35:11", "remaining_time": "14:53:13"} -{"current_steps": 1770, "total_steps": 6450, "loss": 0.0347, "lr": 9.101572013897555e-05, "epoch": 2.744186046511628, "percentage": 27.44, "elapsed_time": "5:36:32", "remaining_time": "14:49:51"} -{"current_steps": 1780, "total_steps": 6450, "loss": 0.0334, "lr": 9.086036425628453e-05, "epoch": 2.75968992248062, "percentage": 27.6, "elapsed_time": "5:37:53", "remaining_time": "14:46:29"} -{"current_steps": 1790, "total_steps": 6450, "loss": 0.0347, "lr": 9.070381164278621e-05, "epoch": 2.7751937984496124, "percentage": 27.75, "elapsed_time": "5:39:14", "remaining_time": "14:43:08"} -{"current_steps": 1800, "total_steps": 6450, "loss": 0.0295, "lr": 9.05460668836413e-05, "epoch": 2.7906976744186047, "percentage": 27.91, "elapsed_time": "5:40:34", "remaining_time": "14:39:49"} -{"current_steps": 1800, "total_steps": 6450, "eval_loss": 0.03609917685389519, "epoch": 2.7906976744186047, "percentage": 27.91, "elapsed_time": "5:43:19", "remaining_time": "14:46:54"} -{"current_steps": 1810, "total_steps": 6450, "loss": 0.0234, "lr": 9.038713459892637e-05, "epoch": 2.806201550387597, "percentage": 28.06, "elapsed_time": "5:44:43", "remaining_time": "14:43:43"} -{"current_steps": 1820, "total_steps": 6450, "loss": 0.0322, "lr": 9.022701944349868e-05, "epoch": 2.8217054263565893, "percentage": 28.22, "elapsed_time": "5:46:04", "remaining_time": "14:40:24"} -{"current_steps": 1830, "total_steps": 6450, "loss": 0.024, "lr": 9.006572610685968e-05, "epoch": 2.8372093023255816, "percentage": 28.37, "elapsed_time": "5:47:25", "remaining_time": "14:37:06"} -{"current_steps": 1840, "total_steps": 6450, "loss": 0.0291, "lr": 8.990325931301782e-05, "epoch": 2.8527131782945734, "percentage": 28.53, "elapsed_time": "5:48:46", "remaining_time": "14:33:49"} -{"current_steps": 1850, "total_steps": 6450, "loss": 0.0254, "lr": 8.97396238203501e-05, "epoch": 2.8682170542635657, "percentage": 28.68, "elapsed_time": "5:50:07", "remaining_time": "14:30:34"} -{"current_steps": 1850, "total_steps": 6450, "eval_loss": 0.038111526519060135, "epoch": 2.8682170542635657, "percentage": 28.68, "elapsed_time": "5:52:51", "remaining_time": "14:37:22"} -{"current_steps": 1860, "total_steps": 6450, "loss": 0.0394, "lr": 8.957482442146272e-05, "epoch": 2.883720930232558, "percentage": 28.84, "elapsed_time": "5:54:15", "remaining_time": "14:34:13"} -{"current_steps": 1870, "total_steps": 6450, "loss": 0.0192, "lr": 8.94088659430507e-05, "epoch": 2.89922480620155, "percentage": 28.99, "elapsed_time": "5:55:36", "remaining_time": "14:30:56"} -{"current_steps": 1880, "total_steps": 6450, "loss": 0.0288, "lr": 8.924175324575659e-05, "epoch": 2.9147286821705425, "percentage": 29.15, "elapsed_time": "5:56:56", "remaining_time": "14:27:40"} -{"current_steps": 1890, "total_steps": 6450, "loss": 0.0219, "lr": 8.907349122402801e-05, "epoch": 2.9302325581395348, "percentage": 29.3, "elapsed_time": "5:58:17", "remaining_time": "14:24:26"} -{"current_steps": 1900, "total_steps": 6450, "loss": 0.0262, "lr": 8.890408480597436e-05, "epoch": 2.945736434108527, "percentage": 29.46, "elapsed_time": "5:59:37", "remaining_time": "14:21:12"} -{"current_steps": 1900, "total_steps": 6450, "eval_loss": 0.03564886376261711, "epoch": 2.945736434108527, "percentage": 29.46, "elapsed_time": "6:02:21", "remaining_time": "14:27:45"} -{"current_steps": 1910, "total_steps": 6450, "loss": 0.0264, "lr": 8.873353895322247e-05, "epoch": 2.9612403100775193, "percentage": 29.61, "elapsed_time": "6:03:46", "remaining_time": "14:24:40"} -{"current_steps": 1920, "total_steps": 6450, "loss": 0.032, "lr": 8.856185866077129e-05, "epoch": 2.9767441860465116, "percentage": 29.77, "elapsed_time": "6:05:07", "remaining_time": "14:21:26"} -{"current_steps": 1930, "total_steps": 6450, "loss": 0.0199, "lr": 8.838904895684555e-05, "epoch": 2.992248062015504, "percentage": 29.92, "elapsed_time": "6:06:27", "remaining_time": "14:18:14"} -{"current_steps": 1940, "total_steps": 6450, "loss": 0.0238, "lr": 8.821511490274854e-05, "epoch": 3.007751937984496, "percentage": 30.08, "elapsed_time": "6:07:48", "remaining_time": "14:15:03"} -{"current_steps": 1950, "total_steps": 6450, "loss": 0.0143, "lr": 8.80400615927139e-05, "epoch": 3.0232558139534884, "percentage": 30.23, "elapsed_time": "6:09:08", "remaining_time": "14:11:52"} -{"current_steps": 1950, "total_steps": 6450, "eval_loss": 0.03934966400265694, "epoch": 3.0232558139534884, "percentage": 30.23, "elapsed_time": "6:11:52", "remaining_time": "14:18:10"} -{"current_steps": 1960, "total_steps": 6450, "loss": 0.0207, "lr": 8.786389415375635e-05, "epoch": 3.0387596899224807, "percentage": 30.39, "elapsed_time": "6:13:17", "remaining_time": "14:15:07"} -{"current_steps": 1970, "total_steps": 6450, "loss": 0.0105, "lr": 8.768661774552154e-05, "epoch": 3.054263565891473, "percentage": 30.54, "elapsed_time": "6:14:37", "remaining_time": "14:11:56"} -{"current_steps": 1980, "total_steps": 6450, "loss": 0.02, "lr": 8.750823756013498e-05, "epoch": 3.0697674418604652, "percentage": 30.7, "elapsed_time": "6:15:58", "remaining_time": "14:08:46"} -{"current_steps": 1990, "total_steps": 6450, "loss": 0.0222, "lr": 8.732875882204993e-05, "epoch": 3.0852713178294575, "percentage": 30.85, "elapsed_time": "6:17:18", "remaining_time": "14:05:37"} -{"current_steps": 2000, "total_steps": 6450, "loss": 0.0151, "lr": 8.71481867878944e-05, "epoch": 3.10077519379845, "percentage": 31.01, "elapsed_time": "6:18:39", "remaining_time": "14:02:30"} -{"current_steps": 2000, "total_steps": 6450, "eval_loss": 0.04309219866991043, "epoch": 3.10077519379845, "percentage": 31.01, "elapsed_time": "6:21:23", "remaining_time": "14:08:36"} -{"current_steps": 2010, "total_steps": 6450, "loss": 0.0111, "lr": 8.696652674631717e-05, "epoch": 3.116279069767442, "percentage": 31.16, "elapsed_time": "6:22:48", "remaining_time": "14:05:36"} -{"current_steps": 2020, "total_steps": 6450, "loss": 0.0183, "lr": 8.678378401783294e-05, "epoch": 3.1317829457364343, "percentage": 31.32, "elapsed_time": "6:24:09", "remaining_time": "14:02:29"} -{"current_steps": 2030, "total_steps": 6450, "loss": 0.0164, "lr": 8.659996395466647e-05, "epoch": 3.147286821705426, "percentage": 31.47, "elapsed_time": "6:25:30", "remaining_time": "13:59:23"} -{"current_steps": 2040, "total_steps": 6450, "loss": 0.0163, "lr": 8.641507194059579e-05, "epoch": 3.1627906976744184, "percentage": 31.63, "elapsed_time": "6:26:51", "remaining_time": "13:56:17"} -{"current_steps": 2050, "total_steps": 6450, "loss": 0.0123, "lr": 8.622911339079464e-05, "epoch": 3.1782945736434107, "percentage": 31.78, "elapsed_time": "6:28:11", "remaining_time": "13:53:12"} -{"current_steps": 2050, "total_steps": 6450, "eval_loss": 0.04068796709179878, "epoch": 3.1782945736434107, "percentage": 31.78, "elapsed_time": "6:30:56", "remaining_time": "13:59:05"} -{"current_steps": 2060, "total_steps": 6450, "loss": 0.0126, "lr": 8.604209375167367e-05, "epoch": 3.193798449612403, "percentage": 31.94, "elapsed_time": "6:32:23", "remaining_time": "13:56:13"} -{"current_steps": 2070, "total_steps": 6450, "loss": 0.0178, "lr": 8.585401850072113e-05, "epoch": 3.2093023255813953, "percentage": 32.09, "elapsed_time": "6:33:44", "remaining_time": "13:53:08"} -{"current_steps": 2080, "total_steps": 6450, "loss": 0.0167, "lr": 8.566489314634231e-05, "epoch": 3.2248062015503876, "percentage": 32.25, "elapsed_time": "6:35:05", "remaining_time": "13:50:04"} -{"current_steps": 2090, "total_steps": 6450, "loss": 0.0134, "lr": 8.547472322769824e-05, "epoch": 3.24031007751938, "percentage": 32.4, "elapsed_time": "6:36:26", "remaining_time": "13:47:00"} -{"current_steps": 2100, "total_steps": 6450, "loss": 0.0142, "lr": 8.528351431454351e-05, "epoch": 3.255813953488372, "percentage": 32.56, "elapsed_time": "6:37:46", "remaining_time": "13:43:58"} -{"current_steps": 2100, "total_steps": 6450, "eval_loss": 0.041905563324689865, "epoch": 3.255813953488372, "percentage": 32.56, "elapsed_time": "6:40:31", "remaining_time": "13:49:38"} -{"current_steps": 2110, "total_steps": 6450, "loss": 0.0153, "lr": 8.509127200706305e-05, "epoch": 3.2713178294573644, "percentage": 32.71, "elapsed_time": "6:41:57", "remaining_time": "13:46:46"} -{"current_steps": 2120, "total_steps": 6450, "loss": 0.0201, "lr": 8.489800193570818e-05, "epoch": 3.2868217054263567, "percentage": 32.87, "elapsed_time": "6:43:18", "remaining_time": "13:43:43"} -{"current_steps": 2130, "total_steps": 6450, "loss": 0.0241, "lr": 8.47037097610317e-05, "epoch": 3.302325581395349, "percentage": 33.02, "elapsed_time": "6:44:38", "remaining_time": "13:40:41"} -{"current_steps": 2140, "total_steps": 6450, "loss": 0.0203, "lr": 8.450840117352204e-05, "epoch": 3.317829457364341, "percentage": 33.18, "elapsed_time": "6:45:59", "remaining_time": "13:37:39"} -{"current_steps": 2150, "total_steps": 6450, "loss": 0.018, "lr": 8.43120818934367e-05, "epoch": 3.3333333333333335, "percentage": 33.33, "elapsed_time": "6:47:19", "remaining_time": "13:34:39"} -{"current_steps": 2150, "total_steps": 6450, "eval_loss": 0.03900735452771187, "epoch": 3.3333333333333335, "percentage": 33.33, "elapsed_time": "6:50:04", "remaining_time": "13:40:08"} -{"current_steps": 2160, "total_steps": 6450, "loss": 0.0242, "lr": 8.411475767063455e-05, "epoch": 3.3488372093023258, "percentage": 33.49, "elapsed_time": "6:51:29", "remaining_time": "13:37:15"} -{"current_steps": 2170, "total_steps": 6450, "loss": 0.0139, "lr": 8.391643428440766e-05, "epoch": 3.3643410852713176, "percentage": 33.64, "elapsed_time": "6:52:49", "remaining_time": "13:34:14"} -{"current_steps": 2180, "total_steps": 6450, "loss": 0.0198, "lr": 8.371711754331182e-05, "epoch": 3.37984496124031, "percentage": 33.8, "elapsed_time": "6:54:10", "remaining_time": "13:31:14"} -{"current_steps": 2190, "total_steps": 6450, "loss": 0.0124, "lr": 8.35168132849965e-05, "epoch": 3.395348837209302, "percentage": 33.95, "elapsed_time": "6:55:30", "remaining_time": "13:28:15"} -{"current_steps": 2200, "total_steps": 6450, "loss": 0.0115, "lr": 8.33155273760339e-05, "epoch": 3.4108527131782944, "percentage": 34.11, "elapsed_time": "6:56:51", "remaining_time": "13:25:17"} -{"current_steps": 2200, "total_steps": 6450, "eval_loss": 0.05070589482784271, "epoch": 3.4108527131782944, "percentage": 34.11, "elapsed_time": "6:59:35", "remaining_time": "13:30:35"} -{"current_steps": 2210, "total_steps": 6450, "loss": 0.0203, "lr": 8.31132657117471e-05, "epoch": 3.4263565891472867, "percentage": 34.26, "elapsed_time": "7:01:00", "remaining_time": "13:27:44"} -{"current_steps": 2220, "total_steps": 6450, "loss": 0.0135, "lr": 8.29100342160374e-05, "epoch": 3.441860465116279, "percentage": 34.42, "elapsed_time": "7:02:21", "remaining_time": "13:24:45"} -{"current_steps": 2230, "total_steps": 6450, "loss": 0.0179, "lr": 8.270583884121082e-05, "epoch": 3.4573643410852712, "percentage": 34.57, "elapsed_time": "7:03:42", "remaining_time": "13:21:48"} -{"current_steps": 2240, "total_steps": 6450, "loss": 0.0164, "lr": 8.250068556780375e-05, "epoch": 3.4728682170542635, "percentage": 34.73, "elapsed_time": "7:05:02", "remaining_time": "13:18:51"} -{"current_steps": 2250, "total_steps": 6450, "loss": 0.0185, "lr": 8.229458040440783e-05, "epoch": 3.488372093023256, "percentage": 34.88, "elapsed_time": "7:06:22", "remaining_time": "13:15:54"} -{"current_steps": 2250, "total_steps": 6450, "eval_loss": 0.04473824426531792, "epoch": 3.488372093023256, "percentage": 34.88, "elapsed_time": "7:09:07", "remaining_time": "13:21:01"} -{"current_steps": 2260, "total_steps": 6450, "loss": 0.0119, "lr": 8.208752938749389e-05, "epoch": 3.503875968992248, "percentage": 35.04, "elapsed_time": "7:10:33", "remaining_time": "13:18:14"} -{"current_steps": 2270, "total_steps": 6450, "loss": 0.0193, "lr": 8.18795385812353e-05, "epoch": 3.5193798449612403, "percentage": 35.19, "elapsed_time": "7:11:54", "remaining_time": "13:15:18"} -{"current_steps": 2280, "total_steps": 6450, "loss": 0.0235, "lr": 8.167061407733016e-05, "epoch": 3.5348837209302326, "percentage": 35.35, "elapsed_time": "7:13:14", "remaining_time": "13:12:23"} -{"current_steps": 2290, "total_steps": 6450, "loss": 0.0181, "lr": 8.14607619948231e-05, "epoch": 3.550387596899225, "percentage": 35.5, "elapsed_time": "7:14:35", "remaining_time": "13:09:28"} -{"current_steps": 2300, "total_steps": 6450, "loss": 0.0216, "lr": 8.124998847992586e-05, "epoch": 3.565891472868217, "percentage": 35.66, "elapsed_time": "7:15:55", "remaining_time": "13:06:34"} -{"current_steps": 2300, "total_steps": 6450, "eval_loss": 0.041897304356098175, "epoch": 3.565891472868217, "percentage": 35.66, "elapsed_time": "7:18:40", "remaining_time": "13:11:30"} -{"current_steps": 2310, "total_steps": 6450, "loss": 0.0232, "lr": 8.103829970583742e-05, "epoch": 3.5813953488372094, "percentage": 35.81, "elapsed_time": "7:20:04", "remaining_time": "13:08:42"} -{"current_steps": 2320, "total_steps": 6450, "loss": 0.0204, "lr": 8.082570187256315e-05, "epoch": 3.5968992248062017, "percentage": 35.97, "elapsed_time": "7:21:25", "remaining_time": "13:05:48"} -{"current_steps": 2330, "total_steps": 6450, "loss": 0.0159, "lr": 8.061220120673323e-05, "epoch": 3.612403100775194, "percentage": 36.12, "elapsed_time": "7:22:46", "remaining_time": "13:02:55"} -{"current_steps": 2340, "total_steps": 6450, "loss": 0.0173, "lr": 8.039780396142022e-05, "epoch": 3.6279069767441863, "percentage": 36.28, "elapsed_time": "7:24:06", "remaining_time": "13:00:02"} -{"current_steps": 2350, "total_steps": 6450, "loss": 0.0152, "lr": 8.018251641595604e-05, "epoch": 3.6434108527131785, "percentage": 36.43, "elapsed_time": "7:25:27", "remaining_time": "12:57:10"} -{"current_steps": 2350, "total_steps": 6450, "eval_loss": 0.049069929867982864, "epoch": 3.6434108527131785, "percentage": 36.43, "elapsed_time": "7:28:11", "remaining_time": "13:01:56"} -{"current_steps": 2360, "total_steps": 6450, "loss": 0.0177, "lr": 7.9966344875748e-05, "epoch": 3.6589147286821704, "percentage": 36.59, "elapsed_time": "7:29:35", "remaining_time": "12:59:10"} -{"current_steps": 2370, "total_steps": 6450, "loss": 0.0177, "lr": 7.9749295672094e-05, "epoch": 3.6744186046511627, "percentage": 36.74, "elapsed_time": "7:30:56", "remaining_time": "12:56:18"} -{"current_steps": 2380, "total_steps": 6450, "loss": 0.0205, "lr": 7.953137516199736e-05, "epoch": 3.689922480620155, "percentage": 36.9, "elapsed_time": "7:32:16", "remaining_time": "12:53:26"} -{"current_steps": 2390, "total_steps": 6450, "loss": 0.0173, "lr": 7.93125897279804e-05, "epoch": 3.705426356589147, "percentage": 37.05, "elapsed_time": "7:33:37", "remaining_time": "12:50:35"} -{"current_steps": 2400, "total_steps": 6450, "loss": 0.0258, "lr": 7.909294577789766e-05, "epoch": 3.7209302325581395, "percentage": 37.21, "elapsed_time": "7:34:57", "remaining_time": "12:47:45"} -{"current_steps": 2400, "total_steps": 6450, "eval_loss": 0.0414716899394989, "epoch": 3.7209302325581395, "percentage": 37.21, "elapsed_time": "7:37:42", "remaining_time": "12:52:22"} -{"current_steps": 2410, "total_steps": 6450, "loss": 0.0176, "lr": 7.887244974474806e-05, "epoch": 3.7364341085271318, "percentage": 37.36, "elapsed_time": "7:39:08", "remaining_time": "12:49:40"} -{"current_steps": 2420, "total_steps": 6450, "loss": 0.0231, "lr": 7.865110808648672e-05, "epoch": 3.751937984496124, "percentage": 37.52, "elapsed_time": "7:40:29", "remaining_time": "12:46:50"} -{"current_steps": 2430, "total_steps": 6450, "loss": 0.0179, "lr": 7.842892728583558e-05, "epoch": 3.7674418604651163, "percentage": 37.67, "elapsed_time": "7:41:49", "remaining_time": "12:44:00"} -{"current_steps": 2440, "total_steps": 6450, "loss": 0.0183, "lr": 7.820591385009366e-05, "epoch": 3.7829457364341086, "percentage": 37.83, "elapsed_time": "7:43:10", "remaining_time": "12:41:12"} -{"current_steps": 2450, "total_steps": 6450, "loss": 0.0135, "lr": 7.79820743109465e-05, "epoch": 3.798449612403101, "percentage": 37.98, "elapsed_time": "7:44:30", "remaining_time": "12:38:23"} -{"current_steps": 2450, "total_steps": 6450, "eval_loss": 0.041855063289403915, "epoch": 3.798449612403101, "percentage": 37.98, "elapsed_time": "7:47:15", "remaining_time": "12:42:51"} -{"current_steps": 2460, "total_steps": 6450, "loss": 0.014, "lr": 7.775741522427477e-05, "epoch": 3.813953488372093, "percentage": 38.14, "elapsed_time": "7:48:39", "remaining_time": "12:40:08"} -{"current_steps": 2470, "total_steps": 6450, "loss": 0.0145, "lr": 7.75319431699623e-05, "epoch": 3.8294573643410854, "percentage": 38.29, "elapsed_time": "7:50:00", "remaining_time": "12:37:19"} -{"current_steps": 2480, "total_steps": 6450, "loss": 0.019, "lr": 7.730566475170333e-05, "epoch": 3.8449612403100772, "percentage": 38.45, "elapsed_time": "7:51:20", "remaining_time": "12:34:32"} -{"current_steps": 2490, "total_steps": 6450, "loss": 0.0213, "lr": 7.707858659680924e-05, "epoch": 3.8604651162790695, "percentage": 38.6, "elapsed_time": "7:52:41", "remaining_time": "12:31:44"} -{"current_steps": 2500, "total_steps": 6450, "loss": 0.0171, "lr": 7.68507153560142e-05, "epoch": 3.875968992248062, "percentage": 38.76, "elapsed_time": "7:54:01", "remaining_time": "12:28:58"} -{"current_steps": 2500, "total_steps": 6450, "eval_loss": 0.041576988995075226, "epoch": 3.875968992248062, "percentage": 38.76, "elapsed_time": "7:56:46", "remaining_time": "12:33:17"} -{"current_steps": 2510, "total_steps": 6450, "loss": 0.0135, "lr": 7.662205770328064e-05, "epoch": 3.891472868217054, "percentage": 38.91, "elapsed_time": "7:58:11", "remaining_time": "12:30:37"} -{"current_steps": 2520, "total_steps": 6450, "loss": 0.0292, "lr": 7.639262033560359e-05, "epoch": 3.9069767441860463, "percentage": 39.07, "elapsed_time": "7:59:31", "remaining_time": "12:27:50"} -{"current_steps": 2530, "total_steps": 6450, "loss": 0.0233, "lr": 7.616240997281466e-05, "epoch": 3.9224806201550386, "percentage": 39.22, "elapsed_time": "8:00:52", "remaining_time": "12:25:04"} -{"current_steps": 2540, "total_steps": 6450, "loss": 0.0124, "lr": 7.593143335738511e-05, "epoch": 3.937984496124031, "percentage": 39.38, "elapsed_time": "8:02:12", "remaining_time": "12:22:18"} -{"current_steps": 2550, "total_steps": 6450, "loss": 0.0162, "lr": 7.56996972542285e-05, "epoch": 3.953488372093023, "percentage": 39.53, "elapsed_time": "8:03:32", "remaining_time": "12:19:32"} -{"current_steps": 2550, "total_steps": 6450, "eval_loss": 0.0474853552877903, "epoch": 3.953488372093023, "percentage": 39.53, "elapsed_time": "8:06:17", "remaining_time": "12:23:43"} -{"current_steps": 2560, "total_steps": 6450, "loss": 0.0179, "lr": 7.546720845050247e-05, "epoch": 3.9689922480620154, "percentage": 39.69, "elapsed_time": "8:07:41", "remaining_time": "12:21:04"} -{"current_steps": 2570, "total_steps": 6450, "loss": 0.0245, "lr": 7.523397375541002e-05, "epoch": 3.9844961240310077, "percentage": 39.84, "elapsed_time": "8:09:02", "remaining_time": "12:18:18"} -{"current_steps": 2580, "total_steps": 6450, "loss": 0.0167, "lr": 7.500000000000001e-05, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "8:10:23", "remaining_time": "12:15:34"} -{"current_steps": 2590, "total_steps": 6450, "loss": 0.0122, "lr": 7.47652940369671e-05, "epoch": 4.015503875968992, "percentage": 40.16, "elapsed_time": "8:11:44", "remaining_time": "12:12:51"} -{"current_steps": 2600, "total_steps": 6450, "loss": 0.0111, "lr": 7.452986274045115e-05, "epoch": 4.0310077519379846, "percentage": 40.31, "elapsed_time": "8:13:04", "remaining_time": "12:10:07"} -{"current_steps": 2600, "total_steps": 6450, "eval_loss": 0.045642729848623276, "epoch": 4.0310077519379846, "percentage": 40.31, "elapsed_time": "8:15:48", "remaining_time": "12:14:10"} -{"current_steps": 2610, "total_steps": 6450, "loss": 0.0104, "lr": 7.42937130058357e-05, "epoch": 4.046511627906977, "percentage": 40.47, "elapsed_time": "8:17:13", "remaining_time": "12:11:32"} -{"current_steps": 2620, "total_steps": 6450, "loss": 0.0066, "lr": 7.405685174954623e-05, "epoch": 4.062015503875969, "percentage": 40.62, "elapsed_time": "8:18:33", "remaining_time": "12:08:48"} -{"current_steps": 2630, "total_steps": 6450, "loss": 0.0089, "lr": 7.381928590884741e-05, "epoch": 4.077519379844961, "percentage": 40.78, "elapsed_time": "8:19:54", "remaining_time": "12:06:05"} -{"current_steps": 2640, "total_steps": 6450, "loss": 0.0098, "lr": 7.358102244164003e-05, "epoch": 4.093023255813954, "percentage": 40.93, "elapsed_time": "8:21:14", "remaining_time": "12:03:23"} -{"current_steps": 2650, "total_steps": 6450, "loss": 0.0138, "lr": 7.334206832625719e-05, "epoch": 4.108527131782946, "percentage": 41.09, "elapsed_time": "8:22:34", "remaining_time": "12:00:41"} -{"current_steps": 2650, "total_steps": 6450, "eval_loss": 0.05424889177083969, "epoch": 4.108527131782946, "percentage": 41.09, "elapsed_time": "8:25:19", "remaining_time": "12:04:36"} -{"current_steps": 2660, "total_steps": 6450, "loss": 0.0075, "lr": 7.310243056125984e-05, "epoch": 4.124031007751938, "percentage": 41.24, "elapsed_time": "8:26:43", "remaining_time": "12:01:59"} -{"current_steps": 2670, "total_steps": 6450, "loss": 0.0085, "lr": 7.286211616523193e-05, "epoch": 4.1395348837209305, "percentage": 41.4, "elapsed_time": "8:28:04", "remaining_time": "11:59:17"} -{"current_steps": 2680, "total_steps": 6450, "loss": 0.0093, "lr": 7.262113217657477e-05, "epoch": 4.155038759689923, "percentage": 41.55, "elapsed_time": "8:29:24", "remaining_time": "11:56:36"} -{"current_steps": 2690, "total_steps": 6450, "loss": 0.0035, "lr": 7.23794856533009e-05, "epoch": 4.170542635658915, "percentage": 41.71, "elapsed_time": "8:30:44", "remaining_time": "11:53:54"} -{"current_steps": 2700, "total_steps": 6450, "loss": 0.0101, "lr": 7.213718367282737e-05, "epoch": 4.186046511627907, "percentage": 41.86, "elapsed_time": "8:32:05", "remaining_time": "11:51:14"} -{"current_steps": 2700, "total_steps": 6450, "eval_loss": 0.05315929278731346, "epoch": 4.186046511627907, "percentage": 41.86, "elapsed_time": "8:34:49", "remaining_time": "11:55:02"} -{"current_steps": 2710, "total_steps": 6450, "loss": 0.012, "lr": 7.189423333176847e-05, "epoch": 4.2015503875969, "percentage": 42.02, "elapsed_time": "8:36:15", "remaining_time": "11:52:27"} -{"current_steps": 2720, "total_steps": 6450, "loss": 0.0054, "lr": 7.165064174572787e-05, "epoch": 4.217054263565892, "percentage": 42.17, "elapsed_time": "8:37:35", "remaining_time": "11:49:47"} -{"current_steps": 2730, "total_steps": 6450, "loss": 0.0154, "lr": 7.14064160490902e-05, "epoch": 4.232558139534884, "percentage": 42.33, "elapsed_time": "8:38:56", "remaining_time": "11:47:07"} -{"current_steps": 2740, "total_steps": 6450, "loss": 0.0051, "lr": 7.116156339481215e-05, "epoch": 4.248062015503876, "percentage": 42.48, "elapsed_time": "8:40:16", "remaining_time": "11:44:28"} -{"current_steps": 2750, "total_steps": 6450, "loss": 0.0089, "lr": 7.09160909542129e-05, "epoch": 4.263565891472869, "percentage": 42.64, "elapsed_time": "8:41:37", "remaining_time": "11:41:49"} -{"current_steps": 2750, "total_steps": 6450, "eval_loss": 0.05112217739224434, "epoch": 4.263565891472869, "percentage": 42.64, "elapsed_time": "8:44:21", "remaining_time": "11:45:29"} -{"current_steps": 2760, "total_steps": 6450, "loss": 0.0073, "lr": 7.067000591676416e-05, "epoch": 4.27906976744186, "percentage": 42.79, "elapsed_time": "8:45:46", "remaining_time": "11:42:56"} -{"current_steps": 2770, "total_steps": 6450, "loss": 0.0138, "lr": 7.042331548987953e-05, "epoch": 4.294573643410852, "percentage": 42.95, "elapsed_time": "8:47:07", "remaining_time": "11:40:18"} -{"current_steps": 2780, "total_steps": 6450, "loss": 0.0114, "lr": 7.017602689870345e-05, "epoch": 4.310077519379845, "percentage": 43.1, "elapsed_time": "8:48:28", "remaining_time": "11:37:39"} -{"current_steps": 2790, "total_steps": 6450, "loss": 0.0097, "lr": 6.992814738589957e-05, "epoch": 4.325581395348837, "percentage": 43.26, "elapsed_time": "8:49:49", "remaining_time": "11:35:02"} -{"current_steps": 2800, "total_steps": 6450, "loss": 0.0096, "lr": 6.96796842114387e-05, "epoch": 4.341085271317829, "percentage": 43.41, "elapsed_time": "8:51:09", "remaining_time": "11:32:24"} -{"current_steps": 2800, "total_steps": 6450, "eval_loss": 0.054375067353248596, "epoch": 4.341085271317829, "percentage": 43.41, "elapsed_time": "8:53:54", "remaining_time": "11:35:58"} -{"current_steps": 2810, "total_steps": 6450, "loss": 0.0091, "lr": 6.943064465238597e-05, "epoch": 4.3565891472868215, "percentage": 43.57, "elapsed_time": "8:55:19", "remaining_time": "11:33:26"} -{"current_steps": 2820, "total_steps": 6450, "loss": 0.0083, "lr": 6.918103600268799e-05, "epoch": 4.372093023255814, "percentage": 43.72, "elapsed_time": "8:56:39", "remaining_time": "11:30:48"} -{"current_steps": 2830, "total_steps": 6450, "loss": 0.0104, "lr": 6.893086557295896e-05, "epoch": 4.387596899224806, "percentage": 43.88, "elapsed_time": "8:57:59", "remaining_time": "11:28:10"} -{"current_steps": 2840, "total_steps": 6450, "loss": 0.0114, "lr": 6.868014069026671e-05, "epoch": 4.403100775193798, "percentage": 44.03, "elapsed_time": "8:59:19", "remaining_time": "11:25:33"} -{"current_steps": 2850, "total_steps": 6450, "loss": 0.0102, "lr": 6.842886869791809e-05, "epoch": 4.4186046511627906, "percentage": 44.19, "elapsed_time": "9:00:40", "remaining_time": "11:22:57"} -{"current_steps": 2850, "total_steps": 6450, "eval_loss": 0.05103997886180878, "epoch": 4.4186046511627906, "percentage": 44.19, "elapsed_time": "9:03:24", "remaining_time": "11:26:24"} -{"current_steps": 2860, "total_steps": 6450, "loss": 0.0073, "lr": 6.817705695524379e-05, "epoch": 4.434108527131783, "percentage": 44.34, "elapsed_time": "9:04:50", "remaining_time": "11:23:54"} -{"current_steps": 2870, "total_steps": 6450, "loss": 0.0117, "lr": 6.792471283738293e-05, "epoch": 4.449612403100775, "percentage": 44.5, "elapsed_time": "9:06:11", "remaining_time": "11:21:18"} -{"current_steps": 2880, "total_steps": 6450, "loss": 0.0057, "lr": 6.767184373506697e-05, "epoch": 4.465116279069767, "percentage": 44.65, "elapsed_time": "9:07:31", "remaining_time": "11:18:42"} -{"current_steps": 2890, "total_steps": 6450, "loss": 0.0062, "lr": 6.741845705440329e-05, "epoch": 4.48062015503876, "percentage": 44.81, "elapsed_time": "9:08:52", "remaining_time": "11:16:07"} -{"current_steps": 2900, "total_steps": 6450, "loss": 0.0087, "lr": 6.716456021665824e-05, "epoch": 4.496124031007752, "percentage": 44.96, "elapsed_time": "9:10:12", "remaining_time": "11:13:32"} -{"current_steps": 2900, "total_steps": 6450, "eval_loss": 0.059884294867515564, "epoch": 4.496124031007752, "percentage": 44.96, "elapsed_time": "9:12:57", "remaining_time": "11:16:53"} -{"current_steps": 2910, "total_steps": 6450, "loss": 0.0104, "lr": 6.691016065803983e-05, "epoch": 4.511627906976744, "percentage": 45.12, "elapsed_time": "9:14:22", "remaining_time": "11:14:24"} -{"current_steps": 2920, "total_steps": 6450, "loss": 0.0101, "lr": 6.66552658294799e-05, "epoch": 4.5271317829457365, "percentage": 45.27, "elapsed_time": "9:15:43", "remaining_time": "11:11:48"} -{"current_steps": 2930, "total_steps": 6450, "loss": 0.0058, "lr": 6.639988319641593e-05, "epoch": 4.542635658914729, "percentage": 45.43, "elapsed_time": "9:17:03", "remaining_time": "11:09:14"} -{"current_steps": 2940, "total_steps": 6450, "loss": 0.0088, "lr": 6.614402023857232e-05, "epoch": 4.558139534883721, "percentage": 45.58, "elapsed_time": "9:18:24", "remaining_time": "11:06:40"} -{"current_steps": 2950, "total_steps": 6450, "loss": 0.0116, "lr": 6.58876844497414e-05, "epoch": 4.573643410852713, "percentage": 45.74, "elapsed_time": "9:19:45", "remaining_time": "11:04:06"} -{"current_steps": 2950, "total_steps": 6450, "eval_loss": 0.052180349826812744, "epoch": 4.573643410852713, "percentage": 45.74, "elapsed_time": "9:22:29", "remaining_time": "11:07:21"} -{"current_steps": 2960, "total_steps": 6450, "loss": 0.0038, "lr": 6.563088333756394e-05, "epoch": 4.589147286821706, "percentage": 45.89, "elapsed_time": "9:23:53", "remaining_time": "11:04:51"} -{"current_steps": 2970, "total_steps": 6450, "loss": 0.0053, "lr": 6.537362442330916e-05, "epoch": 4.604651162790698, "percentage": 46.05, "elapsed_time": "9:25:14", "remaining_time": "11:02:17"} -{"current_steps": 2980, "total_steps": 6450, "loss": 0.0098, "lr": 6.511591524165464e-05, "epoch": 4.62015503875969, "percentage": 46.2, "elapsed_time": "9:26:34", "remaining_time": "10:59:44"} -{"current_steps": 2990, "total_steps": 6450, "loss": 0.0081, "lr": 6.485776334046546e-05, "epoch": 4.635658914728682, "percentage": 46.36, "elapsed_time": "9:27:55", "remaining_time": "10:57:11"} -{"current_steps": 3000, "total_steps": 6450, "loss": 0.0098, "lr": 6.45991762805732e-05, "epoch": 4.651162790697675, "percentage": 46.51, "elapsed_time": "9:29:16", "remaining_time": "10:54:39"} -{"current_steps": 3000, "total_steps": 6450, "eval_loss": 0.05532576143741608, "epoch": 4.651162790697675, "percentage": 46.51, "elapsed_time": "9:31:59", "remaining_time": "10:57:47"} -{"current_steps": 3010, "total_steps": 6450, "loss": 0.0081, "lr": 6.434016163555452e-05, "epoch": 4.666666666666667, "percentage": 46.67, "elapsed_time": "9:33:25", "remaining_time": "10:55:20"} -{"current_steps": 3020, "total_steps": 6450, "loss": 0.0083, "lr": 6.408072699150932e-05, "epoch": 4.682170542635659, "percentage": 46.82, "elapsed_time": "9:34:45", "remaining_time": "10:52:47"} -{"current_steps": 3030, "total_steps": 6450, "loss": 0.0133, "lr": 6.382087994683859e-05, "epoch": 4.6976744186046515, "percentage": 46.98, "elapsed_time": "9:36:06", "remaining_time": "10:50:15"} -{"current_steps": 3040, "total_steps": 6450, "loss": 0.0102, "lr": 6.356062811202175e-05, "epoch": 4.713178294573644, "percentage": 47.13, "elapsed_time": "9:37:27", "remaining_time": "10:47:44"} -{"current_steps": 3050, "total_steps": 6450, "loss": 0.0092, "lr": 6.329997910939394e-05, "epoch": 4.728682170542635, "percentage": 47.29, "elapsed_time": "9:38:47", "remaining_time": "10:45:12"} -{"current_steps": 3050, "total_steps": 6450, "eval_loss": 0.05312963202595711, "epoch": 4.728682170542635, "percentage": 47.29, "elapsed_time": "9:41:31", "remaining_time": "10:48:15"} -{"current_steps": 3060, "total_steps": 6450, "loss": 0.0149, "lr": 6.303894057292261e-05, "epoch": 4.7441860465116275, "percentage": 47.44, "elapsed_time": "9:42:58", "remaining_time": "10:45:50"} -{"current_steps": 3070, "total_steps": 6450, "loss": 0.0116, "lr": 6.277752014798401e-05, "epoch": 4.75968992248062, "percentage": 47.6, "elapsed_time": "9:44:18", "remaining_time": "10:43:18"} -{"current_steps": 3080, "total_steps": 6450, "loss": 0.0127, "lr": 6.251572549113924e-05, "epoch": 4.775193798449612, "percentage": 47.75, "elapsed_time": "9:45:39", "remaining_time": "10:40:48"} -{"current_steps": 3090, "total_steps": 6450, "loss": 0.0107, "lr": 6.225356426991007e-05, "epoch": 4.790697674418604, "percentage": 47.91, "elapsed_time": "9:47:00", "remaining_time": "10:38:17"} -{"current_steps": 3100, "total_steps": 6450, "loss": 0.0158, "lr": 6.199104416255425e-05, "epoch": 4.8062015503875966, "percentage": 48.06, "elapsed_time": "9:48:20", "remaining_time": "10:35:46"} -{"current_steps": 3100, "total_steps": 6450, "eval_loss": 0.047908179461956024, "epoch": 4.8062015503875966, "percentage": 48.06, "elapsed_time": "9:51:04", "remaining_time": "10:38:44"} -{"current_steps": 3110, "total_steps": 6450, "loss": 0.0074, "lr": 6.172817285784076e-05, "epoch": 4.821705426356589, "percentage": 48.22, "elapsed_time": "9:52:29", "remaining_time": "10:36:18"} -{"current_steps": 3120, "total_steps": 6450, "loss": 0.0111, "lr": 6.146495805482451e-05, "epoch": 4.837209302325581, "percentage": 48.37, "elapsed_time": "9:53:50", "remaining_time": "10:33:48"} -{"current_steps": 3130, "total_steps": 6450, "loss": 0.0095, "lr": 6.120140746262091e-05, "epoch": 4.852713178294573, "percentage": 48.53, "elapsed_time": "9:55:10", "remaining_time": "10:31:18"} -{"current_steps": 3140, "total_steps": 6450, "loss": 0.0084, "lr": 6.093752880018005e-05, "epoch": 4.868217054263566, "percentage": 48.68, "elapsed_time": "9:56:30", "remaining_time": "10:28:48"} -{"current_steps": 3150, "total_steps": 6450, "loss": 0.0113, "lr": 6.0673329796060686e-05, "epoch": 4.883720930232558, "percentage": 48.84, "elapsed_time": "9:57:51", "remaining_time": "10:26:19"} -{"current_steps": 3150, "total_steps": 6450, "eval_loss": 0.04985112324357033, "epoch": 4.883720930232558, "percentage": 48.84, "elapsed_time": "10:00:35", "remaining_time": "10:29:11"} -{"current_steps": 3160, "total_steps": 6450, "loss": 0.0117, "lr": 6.0408818188203795e-05, "epoch": 4.89922480620155, "percentage": 48.99, "elapsed_time": "10:02:00", "remaining_time": "10:26:46"} -{"current_steps": 3170, "total_steps": 6450, "loss": 0.0116, "lr": 6.0144001723706e-05, "epoch": 4.9147286821705425, "percentage": 49.15, "elapsed_time": "10:03:21", "remaining_time": "10:24:17"} -{"current_steps": 3180, "total_steps": 6450, "loss": 0.0104, "lr": 5.987888815859266e-05, "epoch": 4.930232558139535, "percentage": 49.3, "elapsed_time": "10:04:42", "remaining_time": "10:21:49"} -{"current_steps": 3190, "total_steps": 6450, "loss": 0.0148, "lr": 5.9613485257590715e-05, "epoch": 4.945736434108527, "percentage": 49.46, "elapsed_time": "10:06:02", "remaining_time": "10:19:20"} -{"current_steps": 3200, "total_steps": 6450, "loss": 0.0115, "lr": 5.934780079390124e-05, "epoch": 4.961240310077519, "percentage": 49.61, "elapsed_time": "10:07:23", "remaining_time": "10:16:52"} -{"current_steps": 3200, "total_steps": 6450, "eval_loss": 0.04393929988145828, "epoch": 4.961240310077519, "percentage": 49.61, "elapsed_time": "10:10:07", "remaining_time": "10:19:39"} -{"current_steps": 3210, "total_steps": 6450, "loss": 0.0131, "lr": 5.908184254897182e-05, "epoch": 4.976744186046512, "percentage": 49.77, "elapsed_time": "10:11:33", "remaining_time": "10:17:16"} -{"current_steps": 3220, "total_steps": 6450, "loss": 0.0059, "lr": 5.881561831226865e-05, "epoch": 4.992248062015504, "percentage": 49.92, "elapsed_time": "10:12:53", "remaining_time": "10:14:48"} -{"current_steps": 3230, "total_steps": 6450, "loss": 0.0089, "lr": 5.854913588104832e-05, "epoch": 5.007751937984496, "percentage": 50.08, "elapsed_time": "10:14:14", "remaining_time": "10:12:20"} -{"current_steps": 3240, "total_steps": 6450, "loss": 0.0074, "lr": 5.8282403060129566e-05, "epoch": 5.023255813953488, "percentage": 50.23, "elapsed_time": "10:15:35", "remaining_time": "10:09:53"} -{"current_steps": 3250, "total_steps": 6450, "loss": 0.0021, "lr": 5.801542766166453e-05, "epoch": 5.038759689922481, "percentage": 50.39, "elapsed_time": "10:16:55", "remaining_time": "10:07:26"} -{"current_steps": 3250, "total_steps": 6450, "eval_loss": 0.0598391517996788, "epoch": 5.038759689922481, "percentage": 50.39, "elapsed_time": "10:19:39", "remaining_time": "10:10:07"} -{"current_steps": 3260, "total_steps": 6450, "loss": 0.0044, "lr": 5.774821750491014e-05, "epoch": 5.054263565891473, "percentage": 50.54, "elapsed_time": "10:21:05", "remaining_time": "10:07:45"} -{"current_steps": 3270, "total_steps": 6450, "loss": 0.007, "lr": 5.7480780415998906e-05, "epoch": 5.069767441860465, "percentage": 50.7, "elapsed_time": "10:22:25", "remaining_time": "10:05:17"} -{"current_steps": 3280, "total_steps": 6450, "loss": 0.0046, "lr": 5.7213124227709834e-05, "epoch": 5.0852713178294575, "percentage": 50.85, "elapsed_time": "10:23:45", "remaining_time": "10:02:50"} -{"current_steps": 3290, "total_steps": 6450, "loss": 0.0042, "lr": 5.6945256779238996e-05, "epoch": 5.10077519379845, "percentage": 51.01, "elapsed_time": "10:25:06", "remaining_time": "10:00:24"} -{"current_steps": 3300, "total_steps": 6450, "loss": 0.0061, "lr": 5.66771859159699e-05, "epoch": 5.116279069767442, "percentage": 51.16, "elapsed_time": "10:26:26", "remaining_time": "9:57:58"} -{"current_steps": 3300, "total_steps": 6450, "eval_loss": 0.06503809243440628, "epoch": 5.116279069767442, "percentage": 51.16, "elapsed_time": "10:29:10", "remaining_time": "10:00:34"} -{"current_steps": 3310, "total_steps": 6450, "loss": 0.0045, "lr": 5.640891948924373e-05, "epoch": 5.131782945736434, "percentage": 51.32, "elapsed_time": "10:30:36", "remaining_time": "9:58:13"} -{"current_steps": 3320, "total_steps": 6450, "loss": 0.0026, "lr": 5.614046535612936e-05, "epoch": 5.147286821705427, "percentage": 51.47, "elapsed_time": "10:31:56", "remaining_time": "9:55:47"} -{"current_steps": 3330, "total_steps": 6450, "loss": 0.0053, "lr": 5.587183137919332e-05, "epoch": 5.162790697674419, "percentage": 51.63, "elapsed_time": "10:33:17", "remaining_time": "9:53:21"} -{"current_steps": 3340, "total_steps": 6450, "loss": 0.0046, "lr": 5.5603025426269464e-05, "epoch": 5.178294573643411, "percentage": 51.78, "elapsed_time": "10:34:38", "remaining_time": "9:50:55"} -{"current_steps": 3350, "total_steps": 6450, "loss": 0.0038, "lr": 5.533405537022845e-05, "epoch": 5.1937984496124034, "percentage": 51.94, "elapsed_time": "10:35:58", "remaining_time": "9:48:30"} -{"current_steps": 3350, "total_steps": 6450, "eval_loss": 0.06426332890987396, "epoch": 5.1937984496124034, "percentage": 51.94, "elapsed_time": "10:38:42", "remaining_time": "9:51:02"} -{"current_steps": 3360, "total_steps": 6450, "loss": 0.0041, "lr": 5.5064929088747316e-05, "epoch": 5.209302325581396, "percentage": 52.09, "elapsed_time": "10:40:08", "remaining_time": "9:48:42"} -{"current_steps": 3370, "total_steps": 6450, "loss": 0.0037, "lr": 5.4795654464078674e-05, "epoch": 5.224806201550388, "percentage": 52.25, "elapsed_time": "10:41:29", "remaining_time": "9:46:16"} -{"current_steps": 3380, "total_steps": 6450, "loss": 0.0051, "lr": 5.452623938281982e-05, "epoch": 5.24031007751938, "percentage": 52.4, "elapsed_time": "10:42:49", "remaining_time": "9:43:52"} -{"current_steps": 3390, "total_steps": 6450, "loss": 0.002, "lr": 5.4256691735681786e-05, "epoch": 5.2558139534883725, "percentage": 52.56, "elapsed_time": "10:44:09", "remaining_time": "9:41:27"} -{"current_steps": 3400, "total_steps": 6450, "loss": 0.0052, "lr": 5.3987019417258264e-05, "epoch": 5.271317829457364, "percentage": 52.71, "elapsed_time": "10:45:30", "remaining_time": "9:39:03"} -{"current_steps": 3400, "total_steps": 6450, "eval_loss": 0.06585702300071716, "epoch": 5.271317829457364, "percentage": 52.71, "elapsed_time": "10:48:13", "remaining_time": "9:41:30"} -{"current_steps": 3410, "total_steps": 6450, "loss": 0.0019, "lr": 5.371723032579439e-05, "epoch": 5.286821705426356, "percentage": 52.87, "elapsed_time": "10:49:40", "remaining_time": "9:39:10"} -{"current_steps": 3420, "total_steps": 6450, "loss": 0.0046, "lr": 5.344733236295525e-05, "epoch": 5.3023255813953485, "percentage": 53.02, "elapsed_time": "10:51:00", "remaining_time": "9:36:46"} -{"current_steps": 3430, "total_steps": 6450, "loss": 0.0079, "lr": 5.3177333433594736e-05, "epoch": 5.317829457364341, "percentage": 53.18, "elapsed_time": "10:52:21", "remaining_time": "9:34:23"} -{"current_steps": 3440, "total_steps": 6450, "loss": 0.0047, "lr": 5.290724144552379e-05, "epoch": 5.333333333333333, "percentage": 53.33, "elapsed_time": "10:53:42", "remaining_time": "9:31:59"} -{"current_steps": 3450, "total_steps": 6450, "loss": 0.0058, "lr": 5.263706430927895e-05, "epoch": 5.348837209302325, "percentage": 53.49, "elapsed_time": "10:55:03", "remaining_time": "9:29:36"} -{"current_steps": 3450, "total_steps": 6450, "eval_loss": 0.059572022408246994, "epoch": 5.348837209302325, "percentage": 53.49, "elapsed_time": "10:57:46", "remaining_time": "9:31:58"} -{"current_steps": 3460, "total_steps": 6450, "loss": 0.0023, "lr": 5.236680993789052e-05, "epoch": 5.364341085271318, "percentage": 53.64, "elapsed_time": "10:59:11", "remaining_time": "9:29:39"} -{"current_steps": 3470, "total_steps": 6450, "loss": 0.0063, "lr": 5.2096486246650946e-05, "epoch": 5.37984496124031, "percentage": 53.8, "elapsed_time": "11:00:32", "remaining_time": "9:27:15"} -{"current_steps": 3480, "total_steps": 6450, "loss": 0.006, "lr": 5.182610115288295e-05, "epoch": 5.395348837209302, "percentage": 53.95, "elapsed_time": "11:01:53", "remaining_time": "9:24:53"} -{"current_steps": 3490, "total_steps": 6450, "loss": 0.006, "lr": 5.1555662575707574e-05, "epoch": 5.410852713178294, "percentage": 54.11, "elapsed_time": "11:03:13", "remaining_time": "9:22:30"} -{"current_steps": 3500, "total_steps": 6450, "loss": 0.0081, "lr": 5.128517843581233e-05, "epoch": 5.426356589147287, "percentage": 54.26, "elapsed_time": "11:04:33", "remaining_time": "9:20:07"} -{"current_steps": 3500, "total_steps": 6450, "eval_loss": 0.059476085007190704, "epoch": 5.426356589147287, "percentage": 54.26, "elapsed_time": "11:07:17", "remaining_time": "9:22:26"} -{"current_steps": 3510, "total_steps": 6450, "loss": 0.0059, "lr": 5.1014656655219197e-05, "epoch": 5.441860465116279, "percentage": 54.42, "elapsed_time": "11:08:43", "remaining_time": "9:20:07"} -{"current_steps": 3520, "total_steps": 6450, "loss": 0.0045, "lr": 5.0744105157052554e-05, "epoch": 5.457364341085271, "percentage": 54.57, "elapsed_time": "11:10:04", "remaining_time": "9:17:45"} -{"current_steps": 3530, "total_steps": 6450, "loss": 0.008, "lr": 5.047353186530718e-05, "epoch": 5.4728682170542635, "percentage": 54.73, "elapsed_time": "11:11:24", "remaining_time": "9:15:23"} -{"current_steps": 3540, "total_steps": 6450, "loss": 0.0159, "lr": 5.020294470461615e-05, "epoch": 5.488372093023256, "percentage": 54.88, "elapsed_time": "11:12:44", "remaining_time": "9:13:01"} -{"current_steps": 3550, "total_steps": 6450, "loss": 0.0051, "lr": 4.993235160001874e-05, "epoch": 5.503875968992248, "percentage": 55.04, "elapsed_time": "11:14:05", "remaining_time": "9:10:40"} -{"current_steps": 3550, "total_steps": 6450, "eval_loss": 0.06096334382891655, "epoch": 5.503875968992248, "percentage": 55.04, "elapsed_time": "11:16:49", "remaining_time": "9:12:53"} -{"current_steps": 3560, "total_steps": 6450, "loss": 0.0071, "lr": 4.966176047672829e-05, "epoch": 5.51937984496124, "percentage": 55.19, "elapsed_time": "11:18:16", "remaining_time": "9:10:37"} -{"current_steps": 3570, "total_steps": 6450, "loss": 0.0027, "lr": 4.9391179259900125e-05, "epoch": 5.534883720930233, "percentage": 55.35, "elapsed_time": "11:19:36", "remaining_time": "9:08:15"} -{"current_steps": 3580, "total_steps": 6450, "loss": 0.008, "lr": 4.912061587439944e-05, "epoch": 5.550387596899225, "percentage": 55.5, "elapsed_time": "11:20:57", "remaining_time": "9:05:54"} -{"current_steps": 3590, "total_steps": 6450, "loss": 0.0077, "lr": 4.8850078244569164e-05, "epoch": 5.565891472868217, "percentage": 55.66, "elapsed_time": "11:22:17", "remaining_time": "9:03:33"} -{"current_steps": 3600, "total_steps": 6450, "loss": 0.0036, "lr": 4.857957429399788e-05, "epoch": 5.5813953488372094, "percentage": 55.81, "elapsed_time": "11:23:38", "remaining_time": "9:01:12"} -{"current_steps": 3600, "total_steps": 6450, "eval_loss": 0.06083972007036209, "epoch": 5.5813953488372094, "percentage": 55.81, "elapsed_time": "11:26:21", "remaining_time": "9:03:22"} -{"current_steps": 3610, "total_steps": 6450, "loss": 0.0046, "lr": 4.830911194528781e-05, "epoch": 5.596899224806202, "percentage": 55.97, "elapsed_time": "11:27:48", "remaining_time": "9:01:05"} -{"current_steps": 3620, "total_steps": 6450, "loss": 0.0036, "lr": 4.803869911982264e-05, "epoch": 5.612403100775194, "percentage": 56.12, "elapsed_time": "11:29:08", "remaining_time": "8:58:44"} -{"current_steps": 3630, "total_steps": 6450, "loss": 0.0056, "lr": 4.776834373753569e-05, "epoch": 5.627906976744186, "percentage": 56.28, "elapsed_time": "11:30:28", "remaining_time": "8:56:24"} -{"current_steps": 3640, "total_steps": 6450, "loss": 0.0027, "lr": 4.749805371667781e-05, "epoch": 5.6434108527131785, "percentage": 56.43, "elapsed_time": "11:31:49", "remaining_time": "8:54:04"} -{"current_steps": 3650, "total_steps": 6450, "loss": 0.003, "lr": 4.722783697358555e-05, "epoch": 5.658914728682171, "percentage": 56.59, "elapsed_time": "11:33:09", "remaining_time": "8:51:44"} -{"current_steps": 3650, "total_steps": 6450, "eval_loss": 0.06872408092021942, "epoch": 5.658914728682171, "percentage": 56.59, "elapsed_time": "11:35:53", "remaining_time": "8:53:50"} -{"current_steps": 3660, "total_steps": 6450, "loss": 0.0049, "lr": 4.695770142244931e-05, "epoch": 5.674418604651163, "percentage": 56.74, "elapsed_time": "11:37:19", "remaining_time": "8:51:33"} -{"current_steps": 3670, "total_steps": 6450, "loss": 0.0045, "lr": 4.668765497508143e-05, "epoch": 5.689922480620155, "percentage": 56.9, "elapsed_time": "11:38:40", "remaining_time": "8:49:14"} -{"current_steps": 3680, "total_steps": 6450, "loss": 0.0082, "lr": 4.6417705540684645e-05, "epoch": 5.705426356589148, "percentage": 57.05, "elapsed_time": "11:40:00", "remaining_time": "8:46:54"} -{"current_steps": 3690, "total_steps": 6450, "loss": 0.0037, "lr": 4.614786102562026e-05, "epoch": 5.720930232558139, "percentage": 57.21, "elapsed_time": "11:41:21", "remaining_time": "8:44:35"} -{"current_steps": 3700, "total_steps": 6450, "loss": 0.0056, "lr": 4.587812933317675e-05, "epoch": 5.736434108527131, "percentage": 57.36, "elapsed_time": "11:42:41", "remaining_time": "8:42:16"} -{"current_steps": 3700, "total_steps": 6450, "eval_loss": 0.054513685405254364, "epoch": 5.736434108527131, "percentage": 57.36, "elapsed_time": "11:45:25", "remaining_time": "8:44:17"} -{"current_steps": 3710, "total_steps": 6450, "loss": 0.003, "lr": 4.560851836333813e-05, "epoch": 5.751937984496124, "percentage": 57.52, "elapsed_time": "11:46:51", "remaining_time": "8:42:02"} -{"current_steps": 3720, "total_steps": 6450, "loss": 0.0053, "lr": 4.5339036012552716e-05, "epoch": 5.767441860465116, "percentage": 57.67, "elapsed_time": "11:48:11", "remaining_time": "8:39:43"} -{"current_steps": 3730, "total_steps": 6450, "loss": 0.0078, "lr": 4.5069690173501776e-05, "epoch": 5.782945736434108, "percentage": 57.83, "elapsed_time": "11:49:31", "remaining_time": "8:37:24"} -{"current_steps": 3740, "total_steps": 6450, "loss": 0.011, "lr": 4.480048873486835e-05, "epoch": 5.7984496124031, "percentage": 57.98, "elapsed_time": "11:50:52", "remaining_time": "8:35:05"} -{"current_steps": 3750, "total_steps": 6450, "loss": 0.0039, "lr": 4.4531439581106295e-05, "epoch": 5.813953488372093, "percentage": 58.14, "elapsed_time": "11:52:12", "remaining_time": "8:32:47"} -{"current_steps": 3750, "total_steps": 6450, "eval_loss": 0.04962892085313797, "epoch": 5.813953488372093, "percentage": 58.14, "elapsed_time": "11:54:56", "remaining_time": "8:34:45"} -{"current_steps": 3760, "total_steps": 6450, "loss": 0.0066, "lr": 4.4262550592209206e-05, "epoch": 5.829457364341085, "percentage": 58.29, "elapsed_time": "11:56:21", "remaining_time": "8:32:30"} -{"current_steps": 3770, "total_steps": 6450, "loss": 0.0056, "lr": 4.399382964347982e-05, "epoch": 5.844961240310077, "percentage": 58.45, "elapsed_time": "11:57:42", "remaining_time": "8:30:11"} -{"current_steps": 3780, "total_steps": 6450, "loss": 0.0069, "lr": 4.37252846052992e-05, "epoch": 5.8604651162790695, "percentage": 58.6, "elapsed_time": "11:59:02", "remaining_time": "8:27:53"} -{"current_steps": 3790, "total_steps": 6450, "loss": 0.0065, "lr": 4.3456923342896315e-05, "epoch": 5.875968992248062, "percentage": 58.76, "elapsed_time": "12:00:22", "remaining_time": "8:25:35"} -{"current_steps": 3800, "total_steps": 6450, "loss": 0.0027, "lr": 4.3188753716117656e-05, "epoch": 5.891472868217054, "percentage": 58.91, "elapsed_time": "12:01:43", "remaining_time": "8:23:18"} -{"current_steps": 3800, "total_steps": 6450, "eval_loss": 0.062378574162721634, "epoch": 5.891472868217054, "percentage": 58.91, "elapsed_time": "12:04:26", "remaining_time": "8:25:12"} -{"current_steps": 3810, "total_steps": 6450, "loss": 0.0032, "lr": 4.292078357919701e-05, "epoch": 5.906976744186046, "percentage": 59.07, "elapsed_time": "12:05:52", "remaining_time": "8:22:58"} -{"current_steps": 3820, "total_steps": 6450, "loss": 0.0016, "lr": 4.2653020780525466e-05, "epoch": 5.922480620155039, "percentage": 59.22, "elapsed_time": "12:07:13", "remaining_time": "8:20:41"} -{"current_steps": 3830, "total_steps": 6450, "loss": 0.0041, "lr": 4.238547316242149e-05, "epoch": 5.937984496124031, "percentage": 59.38, "elapsed_time": "12:08:34", "remaining_time": "8:18:23"} -{"current_steps": 3840, "total_steps": 6450, "loss": 0.0062, "lr": 4.2118148560901325e-05, "epoch": 5.953488372093023, "percentage": 59.53, "elapsed_time": "12:09:54", "remaining_time": "8:16:06"} -{"current_steps": 3850, "total_steps": 6450, "loss": 0.0123, "lr": 4.1851054805449393e-05, "epoch": 5.9689922480620154, "percentage": 59.69, "elapsed_time": "12:11:14", "remaining_time": "8:13:49"} -{"current_steps": 3850, "total_steps": 6450, "eval_loss": 0.06262066215276718, "epoch": 5.9689922480620154, "percentage": 59.69, "elapsed_time": "12:13:58", "remaining_time": "8:15:40"} -{"current_steps": 3860, "total_steps": 6450, "loss": 0.003, "lr": 4.158419971878907e-05, "epoch": 5.984496124031008, "percentage": 59.84, "elapsed_time": "12:15:23", "remaining_time": "8:13:26"} -{"current_steps": 3870, "total_steps": 6450, "loss": 0.0043, "lr": 4.131759111665349e-05, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "12:16:44", "remaining_time": "8:11:09"} -{"current_steps": 3880, "total_steps": 6450, "loss": 0.0017, "lr": 4.105123680755667e-05, "epoch": 6.015503875968992, "percentage": 60.16, "elapsed_time": "12:18:04", "remaining_time": "8:08:52"} -{"current_steps": 3890, "total_steps": 6450, "loss": 0.0008, "lr": 4.078514459256485e-05, "epoch": 6.0310077519379846, "percentage": 60.31, "elapsed_time": "12:19:25", "remaining_time": "8:06:36"} -{"current_steps": 3900, "total_steps": 6450, "loss": 0.0015, "lr": 4.051932226506797e-05, "epoch": 6.046511627906977, "percentage": 60.47, "elapsed_time": "12:20:45", "remaining_time": "8:04:20"} -{"current_steps": 3900, "total_steps": 6450, "eval_loss": 0.07338041812181473, "epoch": 6.046511627906977, "percentage": 60.47, "elapsed_time": "12:23:29", "remaining_time": "8:06:07"} -{"current_steps": 3910, "total_steps": 6450, "loss": 0.0023, "lr": 4.025377761055138e-05, "epoch": 6.062015503875969, "percentage": 60.62, "elapsed_time": "12:24:54", "remaining_time": "8:03:54"} -{"current_steps": 3920, "total_steps": 6450, "loss": 0.0017, "lr": 3.998851840636789e-05, "epoch": 6.077519379844961, "percentage": 60.78, "elapsed_time": "12:26:14", "remaining_time": "8:01:37"} -{"current_steps": 3930, "total_steps": 6450, "loss": 0.0013, "lr": 3.972355242150998e-05, "epoch": 6.093023255813954, "percentage": 60.93, "elapsed_time": "12:27:34", "remaining_time": "7:59:21"} -{"current_steps": 3940, "total_steps": 6450, "loss": 0.0051, "lr": 3.9458887416382187e-05, "epoch": 6.108527131782946, "percentage": 61.09, "elapsed_time": "12:28:55", "remaining_time": "7:57:06"} -{"current_steps": 3950, "total_steps": 6450, "loss": 0.0008, "lr": 3.9194531142573884e-05, "epoch": 6.124031007751938, "percentage": 61.24, "elapsed_time": "12:30:15", "remaining_time": "7:54:51"} -{"current_steps": 3950, "total_steps": 6450, "eval_loss": 0.0713106244802475, "epoch": 6.124031007751938, "percentage": 61.24, "elapsed_time": "12:32:59", "remaining_time": "7:56:34"} -{"current_steps": 3960, "total_steps": 6450, "loss": 0.0033, "lr": 3.893049134263224e-05, "epoch": 6.1395348837209305, "percentage": 61.4, "elapsed_time": "12:34:24", "remaining_time": "7:54:21"} -{"current_steps": 3970, "total_steps": 6450, "loss": 0.0013, "lr": 3.866677574983542e-05, "epoch": 6.155038759689923, "percentage": 61.55, "elapsed_time": "12:35:44", "remaining_time": "7:52:06"} -{"current_steps": 3980, "total_steps": 6450, "loss": 0.0026, "lr": 3.84033920879661e-05, "epoch": 6.170542635658915, "percentage": 61.71, "elapsed_time": "12:37:05", "remaining_time": "7:49:51"} -{"current_steps": 3990, "total_steps": 6450, "loss": 0.0016, "lr": 3.814034807108529e-05, "epoch": 6.186046511627907, "percentage": 61.86, "elapsed_time": "12:38:26", "remaining_time": "7:47:36"} -{"current_steps": 4000, "total_steps": 6450, "loss": 0.0057, "lr": 3.787765140330636e-05, "epoch": 6.2015503875969, "percentage": 62.02, "elapsed_time": "12:39:46", "remaining_time": "7:45:21"} -{"current_steps": 4000, "total_steps": 6450, "eval_loss": 0.06868591904640198, "epoch": 6.2015503875969, "percentage": 62.02, "elapsed_time": "12:42:30", "remaining_time": "7:47:02"} -{"current_steps": 4010, "total_steps": 6450, "loss": 0.0037, "lr": 3.7615309778569426e-05, "epoch": 6.217054263565892, "percentage": 62.17, "elapsed_time": "12:43:53", "remaining_time": "7:44:48"} -{"current_steps": 4020, "total_steps": 6450, "loss": 0.0029, "lr": 3.735333088041596e-05, "epoch": 6.232558139534884, "percentage": 62.33, "elapsed_time": "12:45:13", "remaining_time": "7:42:33"} -{"current_steps": 4030, "total_steps": 6450, "loss": 0.0018, "lr": 3.709172238176384e-05, "epoch": 6.248062015503876, "percentage": 62.48, "elapsed_time": "12:46:33", "remaining_time": "7:40:19"} -{"current_steps": 4040, "total_steps": 6450, "loss": 0.004, "lr": 3.6830491944682545e-05, "epoch": 6.263565891472869, "percentage": 62.64, "elapsed_time": "12:47:54", "remaining_time": "7:38:04"} -{"current_steps": 4050, "total_steps": 6450, "loss": 0.0034, "lr": 3.656964722016875e-05, "epoch": 6.27906976744186, "percentage": 62.79, "elapsed_time": "12:49:14", "remaining_time": "7:35:50"} -{"current_steps": 4050, "total_steps": 6450, "eval_loss": 0.06980875879526138, "epoch": 6.27906976744186, "percentage": 62.79, "elapsed_time": "12:51:58", "remaining_time": "7:37:27"} -{"current_steps": 4060, "total_steps": 6450, "loss": 0.0033, "lr": 3.6309195847922285e-05, "epoch": 6.294573643410852, "percentage": 62.95, "elapsed_time": "12:53:22", "remaining_time": "7:35:15"} -{"current_steps": 4070, "total_steps": 6450, "loss": 0.002, "lr": 3.6049145456122346e-05, "epoch": 6.310077519379845, "percentage": 63.1, "elapsed_time": "12:54:42", "remaining_time": "7:33:01"} -{"current_steps": 4080, "total_steps": 6450, "loss": 0.0014, "lr": 3.578950366120414e-05, "epoch": 6.325581395348837, "percentage": 63.26, "elapsed_time": "12:56:02", "remaining_time": "7:30:47"} -{"current_steps": 4090, "total_steps": 6450, "loss": 0.0018, "lr": 3.553027806763568e-05, "epoch": 6.341085271317829, "percentage": 63.41, "elapsed_time": "12:57:23", "remaining_time": "7:28:33"} -{"current_steps": 4100, "total_steps": 6450, "loss": 0.003, "lr": 3.527147626769521e-05, "epoch": 6.3565891472868215, "percentage": 63.57, "elapsed_time": "12:58:43", "remaining_time": "7:26:20"} -{"current_steps": 4100, "total_steps": 6450, "eval_loss": 0.0693284347653389, "epoch": 6.3565891472868215, "percentage": 63.57, "elapsed_time": "13:01:27", "remaining_time": "7:27:54"} -{"current_steps": 4110, "total_steps": 6450, "loss": 0.0009, "lr": 3.5013105841248795e-05, "epoch": 6.372093023255814, "percentage": 63.72, "elapsed_time": "13:02:51", "remaining_time": "7:25:42"} -{"current_steps": 4120, "total_steps": 6450, "loss": 0.0026, "lr": 3.475517435552821e-05, "epoch": 6.387596899224806, "percentage": 63.88, "elapsed_time": "13:04:11", "remaining_time": "7:23:29"} -{"current_steps": 4130, "total_steps": 6450, "loss": 0.002, "lr": 3.449768936490948e-05, "epoch": 6.403100775193798, "percentage": 64.03, "elapsed_time": "13:05:31", "remaining_time": "7:21:15"} -{"current_steps": 4140, "total_steps": 6450, "loss": 0.0006, "lr": 3.424065841069152e-05, "epoch": 6.4186046511627906, "percentage": 64.19, "elapsed_time": "13:06:52", "remaining_time": "7:19:02"} -{"current_steps": 4150, "total_steps": 6450, "loss": 0.0008, "lr": 3.3984089020875285e-05, "epoch": 6.434108527131783, "percentage": 64.34, "elapsed_time": "13:08:12", "remaining_time": "7:16:50"} -{"current_steps": 4150, "total_steps": 6450, "eval_loss": 0.07465077191591263, "epoch": 6.434108527131783, "percentage": 64.34, "elapsed_time": "13:10:55", "remaining_time": "7:18:20"} -{"current_steps": 4160, "total_steps": 6450, "loss": 0.0031, "lr": 3.37279887099433e-05, "epoch": 6.449612403100775, "percentage": 64.5, "elapsed_time": "13:12:20", "remaining_time": "7:16:10"} -{"current_steps": 4170, "total_steps": 6450, "loss": 0.002, "lr": 3.347236497863957e-05, "epoch": 6.465116279069767, "percentage": 64.65, "elapsed_time": "13:13:40", "remaining_time": "7:13:57"} -{"current_steps": 4180, "total_steps": 6450, "loss": 0.0058, "lr": 3.321722531374988e-05, "epoch": 6.48062015503876, "percentage": 64.81, "elapsed_time": "13:15:01", "remaining_time": "7:11:44"} -{"current_steps": 4190, "total_steps": 6450, "loss": 0.0013, "lr": 3.296257718788252e-05, "epoch": 6.496124031007752, "percentage": 64.96, "elapsed_time": "13:16:21", "remaining_time": "7:09:32"} -{"current_steps": 4200, "total_steps": 6450, "loss": 0.0019, "lr": 3.2708428059249436e-05, "epoch": 6.511627906976744, "percentage": 65.12, "elapsed_time": "13:17:41", "remaining_time": "7:07:20"} -{"current_steps": 4200, "total_steps": 6450, "eval_loss": 0.0691356211900711, "epoch": 6.511627906976744, "percentage": 65.12, "elapsed_time": "13:20:25", "remaining_time": "7:08:47"} -{"current_steps": 4210, "total_steps": 6450, "loss": 0.0042, "lr": 3.245478537144782e-05, "epoch": 6.5271317829457365, "percentage": 65.27, "elapsed_time": "13:21:49", "remaining_time": "7:06:37"} -{"current_steps": 4220, "total_steps": 6450, "loss": 0.0018, "lr": 3.2201656553242056e-05, "epoch": 6.542635658914729, "percentage": 65.43, "elapsed_time": "13:23:10", "remaining_time": "7:04:25"} -{"current_steps": 4230, "total_steps": 6450, "loss": 0.0013, "lr": 3.1949049018346126e-05, "epoch": 6.558139534883721, "percentage": 65.58, "elapsed_time": "13:24:30", "remaining_time": "7:02:13"} -{"current_steps": 4240, "total_steps": 6450, "loss": 0.0042, "lr": 3.169697016520656e-05, "epoch": 6.573643410852713, "percentage": 65.74, "elapsed_time": "13:25:50", "remaining_time": "7:00:01"} -{"current_steps": 4250, "total_steps": 6450, "loss": 0.0049, "lr": 3.144542737678568e-05, "epoch": 6.589147286821706, "percentage": 65.89, "elapsed_time": "13:27:10", "remaining_time": "6:57:49"} -{"current_steps": 4250, "total_steps": 6450, "eval_loss": 0.06617286801338196, "epoch": 6.589147286821706, "percentage": 65.89, "elapsed_time": "13:29:53", "remaining_time": "6:59:14"} -{"current_steps": 4260, "total_steps": 6450, "loss": 0.0016, "lr": 3.1194428020345376e-05, "epoch": 6.604651162790698, "percentage": 66.05, "elapsed_time": "13:31:17", "remaining_time": "6:57:04"} -{"current_steps": 4270, "total_steps": 6450, "loss": 0.0074, "lr": 3.0943979447231285e-05, "epoch": 6.62015503875969, "percentage": 66.2, "elapsed_time": "13:32:38", "remaining_time": "6:54:53"} -{"current_steps": 4280, "total_steps": 6450, "loss": 0.0007, "lr": 3.069408899265762e-05, "epoch": 6.635658914728682, "percentage": 66.36, "elapsed_time": "13:33:58", "remaining_time": "6:52:41"} -{"current_steps": 4290, "total_steps": 6450, "loss": 0.0037, "lr": 3.0444763975492208e-05, "epoch": 6.651162790697675, "percentage": 66.51, "elapsed_time": "13:35:18", "remaining_time": "6:50:30"} -{"current_steps": 4300, "total_steps": 6450, "loss": 0.0021, "lr": 3.019601169804216e-05, "epoch": 6.666666666666667, "percentage": 66.67, "elapsed_time": "13:36:38", "remaining_time": "6:48:19"} -{"current_steps": 4300, "total_steps": 6450, "eval_loss": 0.06297656148672104, "epoch": 6.666666666666667, "percentage": 66.67, "elapsed_time": "13:39:22", "remaining_time": "6:49:41"} -{"current_steps": 4310, "total_steps": 6450, "loss": 0.0036, "lr": 2.9947839445840042e-05, "epoch": 6.682170542635659, "percentage": 66.82, "elapsed_time": "13:40:46", "remaining_time": "6:47:32"} -{"current_steps": 4320, "total_steps": 6450, "loss": 0.0038, "lr": 2.9700254487430444e-05, "epoch": 6.6976744186046515, "percentage": 66.98, "elapsed_time": "13:42:07", "remaining_time": "6:45:20"} -{"current_steps": 4330, "total_steps": 6450, "loss": 0.0024, "lr": 2.9453264074157134e-05, "epoch": 6.713178294573644, "percentage": 67.13, "elapsed_time": "13:43:27", "remaining_time": "6:43:10"} -{"current_steps": 4340, "total_steps": 6450, "loss": 0.0035, "lr": 2.920687543995061e-05, "epoch": 6.728682170542635, "percentage": 67.29, "elapsed_time": "13:44:47", "remaining_time": "6:40:59"} -{"current_steps": 4350, "total_steps": 6450, "loss": 0.0042, "lr": 2.896109580111634e-05, "epoch": 6.7441860465116275, "percentage": 67.44, "elapsed_time": "13:46:07", "remaining_time": "6:38:49"} -{"current_steps": 4350, "total_steps": 6450, "eval_loss": 0.06421022117137909, "epoch": 6.7441860465116275, "percentage": 67.44, "elapsed_time": "13:48:50", "remaining_time": "6:40:07"} -{"current_steps": 4360, "total_steps": 6450, "loss": 0.0019, "lr": 2.8715932356123332e-05, "epoch": 6.75968992248062, "percentage": 67.6, "elapsed_time": "13:50:15", "remaining_time": "6:37:59"} -{"current_steps": 4370, "total_steps": 6450, "loss": 0.0019, "lr": 2.8471392285393306e-05, "epoch": 6.775193798449612, "percentage": 67.75, "elapsed_time": "13:51:35", "remaining_time": "6:35:48"} -{"current_steps": 4380, "total_steps": 6450, "loss": 0.0031, "lr": 2.8227482751090445e-05, "epoch": 6.790697674418604, "percentage": 67.91, "elapsed_time": "13:52:55", "remaining_time": "6:33:38"} -{"current_steps": 4390, "total_steps": 6450, "loss": 0.0016, "lr": 2.7984210896911522e-05, "epoch": 6.8062015503875966, "percentage": 68.06, "elapsed_time": "13:54:15", "remaining_time": "6:31:28"} -{"current_steps": 4400, "total_steps": 6450, "loss": 0.0046, "lr": 2.7741583847876818e-05, "epoch": 6.821705426356589, "percentage": 68.22, "elapsed_time": "13:55:36", "remaining_time": "6:29:18"} -{"current_steps": 4400, "total_steps": 6450, "eval_loss": 0.06887716054916382, "epoch": 6.821705426356589, "percentage": 68.22, "elapsed_time": "13:58:19", "remaining_time": "6:30:34"} -{"current_steps": 4410, "total_steps": 6450, "loss": 0.0009, "lr": 2.7499608710121288e-05, "epoch": 6.837209302325581, "percentage": 68.37, "elapsed_time": "13:59:43", "remaining_time": "6:28:26"} -{"current_steps": 4420, "total_steps": 6450, "loss": 0.0022, "lr": 2.7258292570686565e-05, "epoch": 6.852713178294573, "percentage": 68.53, "elapsed_time": "14:01:04", "remaining_time": "6:26:17"} -{"current_steps": 4430, "total_steps": 6450, "loss": 0.0002, "lr": 2.7017642497313323e-05, "epoch": 6.868217054263566, "percentage": 68.68, "elapsed_time": "14:02:24", "remaining_time": "6:24:07"} -{"current_steps": 4440, "total_steps": 6450, "loss": 0.0042, "lr": 2.6777665538234293e-05, "epoch": 6.883720930232558, "percentage": 68.84, "elapsed_time": "14:03:44", "remaining_time": "6:21:58"} -{"current_steps": 4450, "total_steps": 6450, "loss": 0.0057, "lr": 2.6538368721967837e-05, "epoch": 6.89922480620155, "percentage": 68.99, "elapsed_time": "14:05:05", "remaining_time": "6:19:48"} -{"current_steps": 4450, "total_steps": 6450, "eval_loss": 0.0728408694267273, "epoch": 6.89922480620155, "percentage": 68.99, "elapsed_time": "14:07:49", "remaining_time": "6:21:02"} -{"current_steps": 4460, "total_steps": 6450, "loss": 0.0006, "lr": 2.629975905711204e-05, "epoch": 6.9147286821705425, "percentage": 69.15, "elapsed_time": "14:09:13", "remaining_time": "6:18:55"} -{"current_steps": 4470, "total_steps": 6450, "loss": 0.0035, "lr": 2.606184353213956e-05, "epoch": 6.930232558139535, "percentage": 69.3, "elapsed_time": "14:10:34", "remaining_time": "6:16:45"} -{"current_steps": 4480, "total_steps": 6450, "loss": 0.0029, "lr": 2.58246291151928e-05, "epoch": 6.945736434108527, "percentage": 69.46, "elapsed_time": "14:11:54", "remaining_time": "6:14:36"} -{"current_steps": 4490, "total_steps": 6450, "loss": 0.0026, "lr": 2.558812275387995e-05, "epoch": 6.961240310077519, "percentage": 69.61, "elapsed_time": "14:13:14", "remaining_time": "6:12:27"} -{"current_steps": 4500, "total_steps": 6450, "loss": 0.0015, "lr": 2.5352331375071437e-05, "epoch": 6.976744186046512, "percentage": 69.77, "elapsed_time": "14:14:34", "remaining_time": "6:10:19"} -{"current_steps": 4500, "total_steps": 6450, "eval_loss": 0.07535959035158157, "epoch": 6.976744186046512, "percentage": 69.77, "elapsed_time": "14:17:18", "remaining_time": "6:11:30"} -{"current_steps": 4510, "total_steps": 6450, "loss": 0.004, "lr": 2.5117261884697064e-05, "epoch": 6.992248062015504, "percentage": 69.92, "elapsed_time": "14:18:43", "remaining_time": "6:09:22"} -{"current_steps": 4520, "total_steps": 6450, "loss": 0.0018, "lr": 2.4882921167543743e-05, "epoch": 7.007751937984496, "percentage": 70.08, "elapsed_time": "14:20:03", "remaining_time": "6:07:14"} -{"current_steps": 4530, "total_steps": 6450, "loss": 0.0012, "lr": 2.4649316087053837e-05, "epoch": 7.023255813953488, "percentage": 70.23, "elapsed_time": "14:21:23", "remaining_time": "6:05:05"} -{"current_steps": 4540, "total_steps": 6450, "loss": 0.0005, "lr": 2.4416453485124196e-05, "epoch": 7.038759689922481, "percentage": 70.39, "elapsed_time": "14:22:43", "remaining_time": "6:02:57"} -{"current_steps": 4550, "total_steps": 6450, "loss": 0.0011, "lr": 2.4184340181905673e-05, "epoch": 7.054263565891473, "percentage": 70.54, "elapsed_time": "14:24:04", "remaining_time": "6:00:49"} -{"current_steps": 4550, "total_steps": 6450, "eval_loss": 0.08152835071086884, "epoch": 7.054263565891473, "percentage": 70.54, "elapsed_time": "14:26:47", "remaining_time": "6:01:57"} -{"current_steps": 4560, "total_steps": 6450, "loss": 0.0016, "lr": 2.3952982975603496e-05, "epoch": 7.069767441860465, "percentage": 70.7, "elapsed_time": "14:28:12", "remaining_time": "5:59:50"} -{"current_steps": 4570, "total_steps": 6450, "loss": 0.0007, "lr": 2.372238864227805e-05, "epoch": 7.0852713178294575, "percentage": 70.85, "elapsed_time": "14:29:32", "remaining_time": "5:57:42"} -{"current_steps": 4580, "total_steps": 6450, "loss": 0.0021, "lr": 2.3492563935646493e-05, "epoch": 7.10077519379845, "percentage": 71.01, "elapsed_time": "14:30:52", "remaining_time": "5:55:34"} -{"current_steps": 4590, "total_steps": 6450, "loss": 0.0002, "lr": 2.326351558688493e-05, "epoch": 7.116279069767442, "percentage": 71.16, "elapsed_time": "14:32:12", "remaining_time": "5:53:26"} -{"current_steps": 4600, "total_steps": 6450, "loss": 0.002, "lr": 2.3035250304431206e-05, "epoch": 7.131782945736434, "percentage": 71.32, "elapsed_time": "14:33:33", "remaining_time": "5:51:19"} -{"current_steps": 4600, "total_steps": 6450, "eval_loss": 0.08660873025655746, "epoch": 7.131782945736434, "percentage": 71.32, "elapsed_time": "14:36:16", "remaining_time": "5:52:25"} -{"current_steps": 4610, "total_steps": 6450, "loss": 0.0002, "lr": 2.2807774773788515e-05, "epoch": 7.147286821705427, "percentage": 71.47, "elapsed_time": "14:37:41", "remaining_time": "5:50:18"} -{"current_steps": 4620, "total_steps": 6450, "loss": 0.0002, "lr": 2.2581095657329598e-05, "epoch": 7.162790697674419, "percentage": 71.63, "elapsed_time": "14:39:01", "remaining_time": "5:48:11"} -{"current_steps": 4630, "total_steps": 6450, "loss": 0.0003, "lr": 2.2355219594101483e-05, "epoch": 7.178294573643411, "percentage": 71.78, "elapsed_time": "14:40:22", "remaining_time": "5:46:03"} -{"current_steps": 4640, "total_steps": 6450, "loss": 0.0002, "lr": 2.2130153199631214e-05, "epoch": 7.1937984496124034, "percentage": 71.94, "elapsed_time": "14:41:42", "remaining_time": "5:43:56"} -{"current_steps": 4650, "total_steps": 6450, "loss": 0.0006, "lr": 2.1905903065731974e-05, "epoch": 7.209302325581396, "percentage": 72.09, "elapsed_time": "14:43:02", "remaining_time": "5:41:49"} -{"current_steps": 4650, "total_steps": 6450, "eval_loss": 0.09439540654420853, "epoch": 7.209302325581396, "percentage": 72.09, "elapsed_time": "14:45:46", "remaining_time": "5:42:52"} -{"current_steps": 4660, "total_steps": 6450, "loss": 0.0002, "lr": 2.1682475760310078e-05, "epoch": 7.224806201550388, "percentage": 72.25, "elapsed_time": "14:47:11", "remaining_time": "5:40:47"} -{"current_steps": 4670, "total_steps": 6450, "loss": 0.001, "lr": 2.1459877827172537e-05, "epoch": 7.24031007751938, "percentage": 72.4, "elapsed_time": "14:48:31", "remaining_time": "5:38:39"} -{"current_steps": 4680, "total_steps": 6450, "loss": 0.0017, "lr": 2.123811578583551e-05, "epoch": 7.2558139534883725, "percentage": 72.56, "elapsed_time": "14:49:51", "remaining_time": "5:36:32"} -{"current_steps": 4690, "total_steps": 6450, "loss": 0.0019, "lr": 2.1017196131333304e-05, "epoch": 7.271317829457364, "percentage": 72.71, "elapsed_time": "14:51:12", "remaining_time": "5:34:26"} -{"current_steps": 4700, "total_steps": 6450, "loss": 0.0011, "lr": 2.079712533402808e-05, "epoch": 7.286821705426356, "percentage": 72.87, "elapsed_time": "14:52:32", "remaining_time": "5:32:19"} -{"current_steps": 4700, "total_steps": 6450, "eval_loss": 0.09016954898834229, "epoch": 7.286821705426356, "percentage": 72.87, "elapsed_time": "14:55:16", "remaining_time": "5:33:20"} -{"current_steps": 4710, "total_steps": 6450, "loss": 0.0004, "lr": 2.057790983942047e-05, "epoch": 7.3023255813953485, "percentage": 73.02, "elapsed_time": "14:56:40", "remaining_time": "5:31:15"} -{"current_steps": 4720, "total_steps": 6450, "loss": 0.0013, "lr": 2.0359556067960727e-05, "epoch": 7.317829457364341, "percentage": 73.18, "elapsed_time": "14:58:01", "remaining_time": "5:29:08"} -{"current_steps": 4730, "total_steps": 6450, "loss": 0.0087, "lr": 2.0142070414860704e-05, "epoch": 7.333333333333333, "percentage": 73.33, "elapsed_time": "14:59:21", "remaining_time": "5:27:02"} -{"current_steps": 4740, "total_steps": 6450, "loss": 0.0006, "lr": 1.9925459249906485e-05, "epoch": 7.348837209302325, "percentage": 73.49, "elapsed_time": "15:00:42", "remaining_time": "5:24:56"} -{"current_steps": 4750, "total_steps": 6450, "loss": 0.0013, "lr": 1.970972891727194e-05, "epoch": 7.364341085271318, "percentage": 73.64, "elapsed_time": "15:02:02", "remaining_time": "5:22:50"} -{"current_steps": 4750, "total_steps": 6450, "eval_loss": 0.08376794308423996, "epoch": 7.364341085271318, "percentage": 73.64, "elapsed_time": "15:04:46", "remaining_time": "5:23:48"} -{"current_steps": 4760, "total_steps": 6450, "loss": 0.0002, "lr": 1.9494885735332847e-05, "epoch": 7.37984496124031, "percentage": 73.8, "elapsed_time": "15:06:11", "remaining_time": "5:21:44"} -{"current_steps": 4770, "total_steps": 6450, "loss": 0.0003, "lr": 1.928093599648179e-05, "epoch": 7.395348837209302, "percentage": 73.95, "elapsed_time": "15:07:31", "remaining_time": "5:19:37"} -{"current_steps": 4780, "total_steps": 6450, "loss": 0.0004, "lr": 1.9067885966943983e-05, "epoch": 7.410852713178294, "percentage": 74.11, "elapsed_time": "15:08:51", "remaining_time": "5:17:31"} -{"current_steps": 4790, "total_steps": 6450, "loss": 0.0002, "lr": 1.8855741886593643e-05, "epoch": 7.426356589147287, "percentage": 74.26, "elapsed_time": "15:10:12", "remaining_time": "5:15:26"} -{"current_steps": 4800, "total_steps": 6450, "loss": 0.0002, "lr": 1.86445099687713e-05, "epoch": 7.441860465116279, "percentage": 74.42, "elapsed_time": "15:11:32", "remaining_time": "5:13:20"} -{"current_steps": 4800, "total_steps": 6450, "eval_loss": 0.08967275172472, "epoch": 7.441860465116279, "percentage": 74.42, "elapsed_time": "15:14:16", "remaining_time": "5:14:16"} -{"current_steps": 4810, "total_steps": 6450, "loss": 0.0032, "lr": 1.8434196400101745e-05, "epoch": 7.457364341085271, "percentage": 74.57, "elapsed_time": "15:15:45", "remaining_time": "5:12:13"} -{"current_steps": 4820, "total_steps": 6450, "loss": 0.0029, "lr": 1.822480734031291e-05, "epoch": 7.4728682170542635, "percentage": 74.73, "elapsed_time": "15:17:05", "remaining_time": "5:10:08"} -{"current_steps": 4830, "total_steps": 6450, "loss": 0.0014, "lr": 1.801634892205545e-05, "epoch": 7.488372093023256, "percentage": 74.88, "elapsed_time": "15:18:26", "remaining_time": "5:08:02"} -{"current_steps": 4840, "total_steps": 6450, "loss": 0.001, "lr": 1.7808827250723042e-05, "epoch": 7.503875968992248, "percentage": 75.04, "elapsed_time": "15:19:46", "remaining_time": "5:05:57"} -{"current_steps": 4850, "total_steps": 6450, "loss": 0.001, "lr": 1.760224840427369e-05, "epoch": 7.51937984496124, "percentage": 75.19, "elapsed_time": "15:21:07", "remaining_time": "5:03:52"} -{"current_steps": 4850, "total_steps": 6450, "eval_loss": 0.08261636644601822, "epoch": 7.51937984496124, "percentage": 75.19, "elapsed_time": "15:23:51", "remaining_time": "5:04:46"} -{"current_steps": 4860, "total_steps": 6450, "loss": 0.0011, "lr": 1.7396618433051647e-05, "epoch": 7.534883720930233, "percentage": 75.35, "elapsed_time": "15:25:15", "remaining_time": "5:02:42"} -{"current_steps": 4870, "total_steps": 6450, "loss": 0.0011, "lr": 1.7191943359610214e-05, "epoch": 7.550387596899225, "percentage": 75.5, "elapsed_time": "15:26:35", "remaining_time": "5:00:37"} -{"current_steps": 4880, "total_steps": 6450, "loss": 0.001, "lr": 1.698822917853532e-05, "epoch": 7.565891472868217, "percentage": 75.66, "elapsed_time": "15:27:55", "remaining_time": "4:58:32"} -{"current_steps": 4890, "total_steps": 6450, "loss": 0.0004, "lr": 1.678548185627004e-05, "epoch": 7.5813953488372094, "percentage": 75.81, "elapsed_time": "15:29:16", "remaining_time": "4:56:27"} -{"current_steps": 4900, "total_steps": 6450, "loss": 0.0031, "lr": 1.6583707330939775e-05, "epoch": 7.596899224806202, "percentage": 75.97, "elapsed_time": "15:30:36", "remaining_time": "4:54:22"} -{"current_steps": 4900, "total_steps": 6450, "eval_loss": 0.08551254123449326, "epoch": 7.596899224806202, "percentage": 75.97, "elapsed_time": "15:33:20", "remaining_time": "4:55:14"} -{"current_steps": 4910, "total_steps": 6450, "loss": 0.0013, "lr": 1.638291151217832e-05, "epoch": 7.612403100775194, "percentage": 76.12, "elapsed_time": "15:34:44", "remaining_time": "4:53:10"} -{"current_steps": 4920, "total_steps": 6450, "loss": 0.0009, "lr": 1.618310028095486e-05, "epoch": 7.627906976744186, "percentage": 76.28, "elapsed_time": "15:36:04", "remaining_time": "4:51:05"} -{"current_steps": 4930, "total_steps": 6450, "loss": 0.001, "lr": 1.5984279489401655e-05, "epoch": 7.6434108527131785, "percentage": 76.43, "elapsed_time": "15:37:24", "remaining_time": "4:49:01"} -{"current_steps": 4940, "total_steps": 6450, "loss": 0.0005, "lr": 1.5786454960642694e-05, "epoch": 7.658914728682171, "percentage": 76.59, "elapsed_time": "15:38:45", "remaining_time": "4:46:56"} -{"current_steps": 4950, "total_steps": 6450, "loss": 0.0005, "lr": 1.5589632488623053e-05, "epoch": 7.674418604651163, "percentage": 76.74, "elapsed_time": "15:40:05", "remaining_time": "4:44:52"} -{"current_steps": 4950, "total_steps": 6450, "eval_loss": 0.08510509133338928, "epoch": 7.674418604651163, "percentage": 76.74, "elapsed_time": "15:42:49", "remaining_time": "4:45:42"} -{"current_steps": 4960, "total_steps": 6450, "loss": 0.0002, "lr": 1.539381783793933e-05, "epoch": 7.689922480620155, "percentage": 76.9, "elapsed_time": "15:44:14", "remaining_time": "4:43:39"} -{"current_steps": 4970, "total_steps": 6450, "loss": 0.0009, "lr": 1.5199016743670718e-05, "epoch": 7.705426356589148, "percentage": 77.05, "elapsed_time": "15:45:34", "remaining_time": "4:41:34"} -{"current_steps": 4980, "total_steps": 6450, "loss": 0.0003, "lr": 1.500523491121108e-05, "epoch": 7.720930232558139, "percentage": 77.21, "elapsed_time": "15:46:54", "remaining_time": "4:39:30"} -{"current_steps": 4990, "total_steps": 6450, "loss": 0.0002, "lr": 1.4812478016101784e-05, "epoch": 7.736434108527131, "percentage": 77.36, "elapsed_time": "15:48:15", "remaining_time": "4:37:26"} -{"current_steps": 5000, "total_steps": 6450, "loss": 0.0002, "lr": 1.462075170386556e-05, "epoch": 7.751937984496124, "percentage": 77.52, "elapsed_time": "15:49:35", "remaining_time": "4:35:22"} -{"current_steps": 5000, "total_steps": 6450, "eval_loss": 0.0883769541978836, "epoch": 7.751937984496124, "percentage": 77.52, "elapsed_time": "15:52:19", "remaining_time": "4:36:10"} -{"current_steps": 5010, "total_steps": 6450, "loss": 0.0008, "lr": 1.4430061589841121e-05, "epoch": 7.767441860465116, "percentage": 77.67, "elapsed_time": "15:53:43", "remaining_time": "4:34:07"} -{"current_steps": 5020, "total_steps": 6450, "loss": 0.0019, "lr": 1.424041325901863e-05, "epoch": 7.782945736434108, "percentage": 77.83, "elapsed_time": "15:55:04", "remaining_time": "4:32:03"} -{"current_steps": 5030, "total_steps": 6450, "loss": 0.0002, "lr": 1.4051812265876257e-05, "epoch": 7.7984496124031, "percentage": 77.98, "elapsed_time": "15:56:24", "remaining_time": "4:30:00"} -{"current_steps": 5040, "total_steps": 6450, "loss": 0.0021, "lr": 1.386426413421738e-05, "epoch": 7.813953488372093, "percentage": 78.14, "elapsed_time": "15:57:44", "remaining_time": "4:27:56"} -{"current_steps": 5050, "total_steps": 6450, "loss": 0.0008, "lr": 1.3677774357008899e-05, "epoch": 7.829457364341085, "percentage": 78.29, "elapsed_time": "15:59:04", "remaining_time": "4:25:52"} -{"current_steps": 5050, "total_steps": 6450, "eval_loss": 0.0885603129863739, "epoch": 7.829457364341085, "percentage": 78.29, "elapsed_time": "16:01:48", "remaining_time": "4:26:38"} -{"current_steps": 5060, "total_steps": 6450, "loss": 0.0002, "lr": 1.3492348396220228e-05, "epoch": 7.844961240310077, "percentage": 78.45, "elapsed_time": "16:03:13", "remaining_time": "4:24:36"} -{"current_steps": 5070, "total_steps": 6450, "loss": 0.0017, "lr": 1.3307991682663462e-05, "epoch": 7.8604651162790695, "percentage": 78.6, "elapsed_time": "16:04:33", "remaining_time": "4:22:32"} -{"current_steps": 5080, "total_steps": 6450, "loss": 0.0005, "lr": 1.3124709615834264e-05, "epoch": 7.875968992248062, "percentage": 78.76, "elapsed_time": "16:05:54", "remaining_time": "4:20:29"} -{"current_steps": 5090, "total_steps": 6450, "loss": 0.0004, "lr": 1.2942507563753653e-05, "epoch": 7.891472868217054, "percentage": 78.91, "elapsed_time": "16:07:14", "remaining_time": "4:18:26"} -{"current_steps": 5100, "total_steps": 6450, "loss": 0.001, "lr": 1.2761390862810907e-05, "epoch": 7.906976744186046, "percentage": 79.07, "elapsed_time": "16:08:34", "remaining_time": "4:16:23"} -{"current_steps": 5100, "total_steps": 6450, "eval_loss": 0.09059925377368927, "epoch": 7.906976744186046, "percentage": 79.07, "elapsed_time": "16:11:18", "remaining_time": "4:17:06"} -{"current_steps": 5110, "total_steps": 6450, "loss": 0.0007, "lr": 1.2581364817607195e-05, "epoch": 7.922480620155039, "percentage": 79.22, "elapsed_time": "16:12:42", "remaining_time": "4:15:04"} -{"current_steps": 5120, "total_steps": 6450, "loss": 0.0017, "lr": 1.240243470080022e-05, "epoch": 7.937984496124031, "percentage": 79.38, "elapsed_time": "16:14:03", "remaining_time": "4:13:01"} -{"current_steps": 5130, "total_steps": 6450, "loss": 0.0007, "lr": 1.2224605752949786e-05, "epoch": 7.953488372093023, "percentage": 79.53, "elapsed_time": "16:15:23", "remaining_time": "4:10:58"} -{"current_steps": 5140, "total_steps": 6450, "loss": 0.0001, "lr": 1.2047883182364351e-05, "epoch": 7.9689922480620154, "percentage": 79.69, "elapsed_time": "16:16:43", "remaining_time": "4:08:55"} -{"current_steps": 5150, "total_steps": 6450, "loss": 0.0012, "lr": 1.1872272164948455e-05, "epoch": 7.984496124031008, "percentage": 79.84, "elapsed_time": "16:18:03", "remaining_time": "4:06:53"} -{"current_steps": 5150, "total_steps": 6450, "eval_loss": 0.09185978770256042, "epoch": 7.984496124031008, "percentage": 79.84, "elapsed_time": "16:20:47", "remaining_time": "4:07:34"} -{"current_steps": 5160, "total_steps": 6450, "loss": 0.0021, "lr": 1.1697777844051105e-05, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "16:22:12", "remaining_time": "4:05:33"} -{"current_steps": 5170, "total_steps": 6450, "loss": 0.0009, "lr": 1.1524405330315185e-05, "epoch": 8.015503875968992, "percentage": 80.16, "elapsed_time": "16:23:32", "remaining_time": "4:03:30"} -{"current_steps": 5180, "total_steps": 6450, "loss": 0.0001, "lr": 1.1352159701527743e-05, "epoch": 8.031007751937985, "percentage": 80.31, "elapsed_time": "16:24:53", "remaining_time": "4:01:28"} -{"current_steps": 5190, "total_steps": 6450, "loss": 0.0001, "lr": 1.118104600247129e-05, "epoch": 8.046511627906977, "percentage": 80.47, "elapsed_time": "16:26:13", "remaining_time": "3:59:25"} -{"current_steps": 5200, "total_steps": 6450, "loss": 0.0001, "lr": 1.1011069244775995e-05, "epoch": 8.062015503875969, "percentage": 80.62, "elapsed_time": "16:27:34", "remaining_time": "3:57:23"} -{"current_steps": 5200, "total_steps": 6450, "eval_loss": 0.09263475239276886, "epoch": 8.062015503875969, "percentage": 80.62, "elapsed_time": "16:30:18", "remaining_time": "3:58:03"} -{"current_steps": 5210, "total_steps": 6450, "loss": 0.0002, "lr": 1.0842234406772972e-05, "epoch": 8.077519379844961, "percentage": 80.78, "elapsed_time": "16:31:43", "remaining_time": "3:56:02"} -{"current_steps": 5220, "total_steps": 6450, "loss": 0.0001, "lr": 1.0674546433348454e-05, "epoch": 8.093023255813954, "percentage": 80.93, "elapsed_time": "16:33:03", "remaining_time": "3:53:59"} -{"current_steps": 5230, "total_steps": 6450, "loss": 0.0008, "lr": 1.0508010235798905e-05, "epoch": 8.108527131782946, "percentage": 81.09, "elapsed_time": "16:34:24", "remaining_time": "3:51:57"} -{"current_steps": 5240, "total_steps": 6450, "loss": 0.0002, "lr": 1.0342630691687283e-05, "epoch": 8.124031007751938, "percentage": 81.24, "elapsed_time": "16:35:45", "remaining_time": "3:49:56"} -{"current_steps": 5250, "total_steps": 6450, "loss": 0.0002, "lr": 1.0178412644700092e-05, "epoch": 8.13953488372093, "percentage": 81.4, "elapsed_time": "16:37:05", "remaining_time": "3:47:54"} -{"current_steps": 5250, "total_steps": 6450, "eval_loss": 0.09628988057374954, "epoch": 8.13953488372093, "percentage": 81.4, "elapsed_time": "16:39:49", "remaining_time": "3:48:31"} -{"current_steps": 5260, "total_steps": 6450, "loss": 0.0, "lr": 1.0015360904505572e-05, "epoch": 8.155038759689923, "percentage": 81.55, "elapsed_time": "16:41:14", "remaining_time": "3:46:30"} -{"current_steps": 5270, "total_steps": 6450, "loss": 0.0004, "lr": 9.853480246612813e-06, "epoch": 8.170542635658915, "percentage": 81.71, "elapsed_time": "16:42:34", "remaining_time": "3:44:29"} -{"current_steps": 5280, "total_steps": 6450, "loss": 0.0002, "lr": 9.692775412231863e-06, "epoch": 8.186046511627907, "percentage": 81.86, "elapsed_time": "16:43:55", "remaining_time": "3:42:27"} -{"current_steps": 5290, "total_steps": 6450, "loss": 0.0006, "lr": 9.533251108134921e-06, "epoch": 8.2015503875969, "percentage": 82.02, "elapsed_time": "16:45:16", "remaining_time": "3:40:26"} -{"current_steps": 5300, "total_steps": 6450, "loss": 0.0, "lr": 9.374912006518466e-06, "epoch": 8.217054263565892, "percentage": 82.17, "elapsed_time": "16:46:36", "remaining_time": "3:38:24"} -{"current_steps": 5300, "total_steps": 6450, "eval_loss": 0.0979791209101677, "epoch": 8.217054263565892, "percentage": 82.17, "elapsed_time": "16:49:20", "remaining_time": "3:39:00"} -{"current_steps": 5310, "total_steps": 6450, "loss": 0.0001, "lr": 9.21776274486636e-06, "epoch": 8.232558139534884, "percentage": 82.33, "elapsed_time": "16:50:45", "remaining_time": "3:36:59"} -{"current_steps": 5320, "total_steps": 6450, "loss": 0.0005, "lr": 9.061807925814097e-06, "epoch": 8.248062015503876, "percentage": 82.48, "elapsed_time": "16:52:05", "remaining_time": "3:34:58"} -{"current_steps": 5330, "total_steps": 6450, "loss": 0.0009, "lr": 8.907052117013982e-06, "epoch": 8.263565891472869, "percentage": 82.64, "elapsed_time": "16:53:26", "remaining_time": "3:32:57"} -{"current_steps": 5340, "total_steps": 6450, "loss": 0.0002, "lr": 8.75349985100134e-06, "epoch": 8.279069767441861, "percentage": 82.79, "elapsed_time": "16:54:46", "remaining_time": "3:30:56"} -{"current_steps": 5350, "total_steps": 6450, "loss": 0.0, "lr": 8.601155625061734e-06, "epoch": 8.294573643410853, "percentage": 82.95, "elapsed_time": "16:56:07", "remaining_time": "3:28:55"} -{"current_steps": 5350, "total_steps": 6450, "eval_loss": 0.09938393533229828, "epoch": 8.294573643410853, "percentage": 82.95, "elapsed_time": "16:58:51", "remaining_time": "3:29:29"} -{"current_steps": 5360, "total_steps": 6450, "loss": 0.0005, "lr": 8.450023901099313e-06, "epoch": 8.310077519379846, "percentage": 83.1, "elapsed_time": "17:00:16", "remaining_time": "3:27:28"} -{"current_steps": 5370, "total_steps": 6450, "loss": 0.0008, "lr": 8.30010910550611e-06, "epoch": 8.325581395348838, "percentage": 83.26, "elapsed_time": "17:01:36", "remaining_time": "3:25:27"} -{"current_steps": 5380, "total_steps": 6450, "loss": 0.0004, "lr": 8.151415629032339e-06, "epoch": 8.34108527131783, "percentage": 83.41, "elapsed_time": "17:02:57", "remaining_time": "3:23:27"} -{"current_steps": 5390, "total_steps": 6450, "loss": 0.0006, "lr": 8.003947826657898e-06, "epoch": 8.356589147286822, "percentage": 83.57, "elapsed_time": "17:04:17", "remaining_time": "3:21:26"} -{"current_steps": 5400, "total_steps": 6450, "loss": 0.0008, "lr": 7.857710017464737e-06, "epoch": 8.372093023255815, "percentage": 83.72, "elapsed_time": "17:05:38", "remaining_time": "3:19:25"} -{"current_steps": 5400, "total_steps": 6450, "eval_loss": 0.10101110488176346, "epoch": 8.372093023255815, "percentage": 83.72, "elapsed_time": "17:08:22", "remaining_time": "3:19:57"} -{"current_steps": 5410, "total_steps": 6450, "loss": 0.0008, "lr": 7.712706484510423e-06, "epoch": 8.387596899224807, "percentage": 83.88, "elapsed_time": "17:09:46", "remaining_time": "3:17:57"} -{"current_steps": 5420, "total_steps": 6450, "loss": 0.0007, "lr": 7.568941474702618e-06, "epoch": 8.4031007751938, "percentage": 84.03, "elapsed_time": "17:11:06", "remaining_time": "3:15:56"} -{"current_steps": 5430, "total_steps": 6450, "loss": 0.0002, "lr": 7.426419198674772e-06, "epoch": 8.418604651162791, "percentage": 84.19, "elapsed_time": "17:12:27", "remaining_time": "3:13:56"} -{"current_steps": 5440, "total_steps": 6450, "loss": 0.0022, "lr": 7.285143830662777e-06, "epoch": 8.434108527131784, "percentage": 84.34, "elapsed_time": "17:13:48", "remaining_time": "3:11:56"} -{"current_steps": 5450, "total_steps": 6450, "loss": 0.0002, "lr": 7.145119508382664e-06, "epoch": 8.449612403100776, "percentage": 84.5, "elapsed_time": "17:15:08", "remaining_time": "3:09:56"} -{"current_steps": 5450, "total_steps": 6450, "eval_loss": 0.10002466291189194, "epoch": 8.449612403100776, "percentage": 84.5, "elapsed_time": "17:17:52", "remaining_time": "3:10:26"} -{"current_steps": 5460, "total_steps": 6450, "loss": 0.0007, "lr": 7.006350332909495e-06, "epoch": 8.465116279069768, "percentage": 84.65, "elapsed_time": "17:19:17", "remaining_time": "3:08:26"} -{"current_steps": 5470, "total_steps": 6450, "loss": 0.0011, "lr": 6.8688403685571945e-06, "epoch": 8.48062015503876, "percentage": 84.81, "elapsed_time": "17:20:37", "remaining_time": "3:06:26"} -{"current_steps": 5480, "total_steps": 6450, "loss": 0.0001, "lr": 6.732593642759533e-06, "epoch": 8.496124031007753, "percentage": 84.96, "elapsed_time": "17:21:58", "remaining_time": "3:04:26"} -{"current_steps": 5490, "total_steps": 6450, "loss": 0.0008, "lr": 6.5976141459521355e-06, "epoch": 8.511627906976745, "percentage": 85.12, "elapsed_time": "17:23:18", "remaining_time": "3:02:26"} -{"current_steps": 5500, "total_steps": 6450, "loss": 0.0005, "lr": 6.463905831455686e-06, "epoch": 8.527131782945737, "percentage": 85.27, "elapsed_time": "17:24:39", "remaining_time": "3:00:26"} -{"current_steps": 5500, "total_steps": 6450, "eval_loss": 0.09973295032978058, "epoch": 8.527131782945737, "percentage": 85.27, "elapsed_time": "17:27:23", "remaining_time": "3:00:54"} -{"current_steps": 5510, "total_steps": 6450, "loss": 0.0001, "lr": 6.331472615360062e-06, "epoch": 8.542635658914728, "percentage": 85.43, "elapsed_time": "17:28:47", "remaining_time": "2:58:55"} -{"current_steps": 5520, "total_steps": 6450, "loss": 0.0004, "lr": 6.2003183764096695e-06, "epoch": 8.55813953488372, "percentage": 85.58, "elapsed_time": "17:30:08", "remaining_time": "2:56:55"} -{"current_steps": 5530, "total_steps": 6450, "loss": 0.001, "lr": 6.070446955889853e-06, "epoch": 8.573643410852712, "percentage": 85.74, "elapsed_time": "17:31:29", "remaining_time": "2:54:55"} -{"current_steps": 5540, "total_steps": 6450, "loss": 0.001, "lr": 5.941862157514383e-06, "epoch": 8.589147286821705, "percentage": 85.89, "elapsed_time": "17:32:49", "remaining_time": "2:52:56"} -{"current_steps": 5550, "total_steps": 6450, "loss": 0.0001, "lr": 5.814567747314048e-06, "epoch": 8.604651162790697, "percentage": 86.05, "elapsed_time": "17:34:10", "remaining_time": "2:50:56"} -{"current_steps": 5550, "total_steps": 6450, "eval_loss": 0.10008525848388672, "epoch": 8.604651162790697, "percentage": 86.05, "elapsed_time": "17:36:54", "remaining_time": "2:51:23"} -{"current_steps": 5560, "total_steps": 6450, "loss": 0.0006, "lr": 5.688567453526328e-06, "epoch": 8.62015503875969, "percentage": 86.2, "elapsed_time": "17:38:19", "remaining_time": "2:49:24"} -{"current_steps": 5570, "total_steps": 6450, "loss": 0.0001, "lr": 5.563864966486254e-06, "epoch": 8.635658914728682, "percentage": 86.36, "elapsed_time": "17:39:39", "remaining_time": "2:47:24"} -{"current_steps": 5580, "total_steps": 6450, "loss": 0.0001, "lr": 5.440463938518303e-06, "epoch": 8.651162790697674, "percentage": 86.51, "elapsed_time": "17:41:00", "remaining_time": "2:45:25"} -{"current_steps": 5590, "total_steps": 6450, "loss": 0.0012, "lr": 5.318367983829392e-06, "epoch": 8.666666666666666, "percentage": 86.67, "elapsed_time": "17:42:21", "remaining_time": "2:43:26"} -{"current_steps": 5600, "total_steps": 6450, "loss": 0.0001, "lr": 5.197580678403075e-06, "epoch": 8.682170542635658, "percentage": 86.82, "elapsed_time": "17:43:42", "remaining_time": "2:41:27"} -{"current_steps": 5600, "total_steps": 6450, "eval_loss": 0.10040813684463501, "epoch": 8.682170542635658, "percentage": 86.82, "elapsed_time": "17:46:26", "remaining_time": "2:41:52"} -{"current_steps": 5610, "total_steps": 6450, "loss": 0.0001, "lr": 5.078105559894791e-06, "epoch": 8.69767441860465, "percentage": 86.98, "elapsed_time": "17:47:51", "remaining_time": "2:39:53"} -{"current_steps": 5620, "total_steps": 6450, "loss": 0.001, "lr": 4.959946127528231e-06, "epoch": 8.713178294573643, "percentage": 87.13, "elapsed_time": "17:49:12", "remaining_time": "2:37:54"} -{"current_steps": 5630, "total_steps": 6450, "loss": 0.0001, "lr": 4.843105841992895e-06, "epoch": 8.728682170542635, "percentage": 87.29, "elapsed_time": "17:50:32", "remaining_time": "2:35:55"} -{"current_steps": 5640, "total_steps": 6450, "loss": 0.0002, "lr": 4.727588125342669e-06, "epoch": 8.744186046511627, "percentage": 87.44, "elapsed_time": "17:51:53", "remaining_time": "2:33:56"} -{"current_steps": 5650, "total_steps": 6450, "loss": 0.0013, "lr": 4.613396360895683e-06, "epoch": 8.75968992248062, "percentage": 87.6, "elapsed_time": "17:53:13", "remaining_time": "2:31:57"} -{"current_steps": 5650, "total_steps": 6450, "eval_loss": 0.10096357017755508, "epoch": 8.75968992248062, "percentage": 87.6, "elapsed_time": "17:55:57", "remaining_time": "2:32:20"} -{"current_steps": 5660, "total_steps": 6450, "loss": 0.0006, "lr": 4.5005338931351335e-06, "epoch": 8.775193798449612, "percentage": 87.75, "elapsed_time": "17:57:22", "remaining_time": "2:30:22"} -{"current_steps": 5670, "total_steps": 6450, "loss": 0.0001, "lr": 4.389004027611404e-06, "epoch": 8.790697674418604, "percentage": 87.91, "elapsed_time": "17:58:43", "remaining_time": "2:28:23"} -{"current_steps": 5680, "total_steps": 6450, "loss": 0.0008, "lr": 4.278810030845193e-06, "epoch": 8.806201550387597, "percentage": 88.06, "elapsed_time": "18:00:04", "remaining_time": "2:26:25"} -{"current_steps": 5690, "total_steps": 6450, "loss": 0.0006, "lr": 4.169955130231884e-06, "epoch": 8.821705426356589, "percentage": 88.22, "elapsed_time": "18:01:24", "remaining_time": "2:24:26"} -{"current_steps": 5700, "total_steps": 6450, "loss": 0.0003, "lr": 4.062442513947007e-06, "epoch": 8.837209302325581, "percentage": 88.37, "elapsed_time": "18:02:44", "remaining_time": "2:22:28"} -{"current_steps": 5700, "total_steps": 6450, "eval_loss": 0.10085734724998474, "epoch": 8.837209302325581, "percentage": 88.37, "elapsed_time": "18:05:29", "remaining_time": "2:22:49"} -{"current_steps": 5710, "total_steps": 6450, "loss": 0.0001, "lr": 3.9562753308528264e-06, "epoch": 8.852713178294573, "percentage": 88.53, "elapsed_time": "18:06:54", "remaining_time": "2:20:51"} -{"current_steps": 5720, "total_steps": 6450, "loss": 0.0001, "lr": 3.851456690406197e-06, "epoch": 8.868217054263566, "percentage": 88.68, "elapsed_time": "18:08:14", "remaining_time": "2:18:53"} -{"current_steps": 5730, "total_steps": 6450, "loss": 0.0029, "lr": 3.7479896625674027e-06, "epoch": 8.883720930232558, "percentage": 88.84, "elapsed_time": "18:09:35", "remaining_time": "2:16:54"} -{"current_steps": 5740, "total_steps": 6450, "loss": 0.0009, "lr": 3.645877277710308e-06, "epoch": 8.89922480620155, "percentage": 88.99, "elapsed_time": "18:10:55", "remaining_time": "2:14:56"} -{"current_steps": 5750, "total_steps": 6450, "loss": 0.0, "lr": 3.5451225265335786e-06, "epoch": 8.914728682170542, "percentage": 89.15, "elapsed_time": "18:12:16", "remaining_time": "2:12:58"} -{"current_steps": 5750, "total_steps": 6450, "eval_loss": 0.10091914236545563, "epoch": 8.914728682170542, "percentage": 89.15, "elapsed_time": "18:15:00", "remaining_time": "2:13:18"} -{"current_steps": 5760, "total_steps": 6450, "loss": 0.0003, "lr": 3.445728359973094e-06, "epoch": 8.930232558139535, "percentage": 89.3, "elapsed_time": "18:16:25", "remaining_time": "2:11:20"} -{"current_steps": 5770, "total_steps": 6450, "loss": 0.0009, "lr": 3.3476976891155087e-06, "epoch": 8.945736434108527, "percentage": 89.46, "elapsed_time": "18:17:46", "remaining_time": "2:09:22"} -{"current_steps": 5780, "total_steps": 6450, "loss": 0.001, "lr": 3.2510333851129893e-06, "epoch": 8.96124031007752, "percentage": 89.61, "elapsed_time": "18:19:06", "remaining_time": "2:07:24"} -{"current_steps": 5790, "total_steps": 6450, "loss": 0.0001, "lr": 3.1557382790991687e-06, "epoch": 8.976744186046512, "percentage": 89.77, "elapsed_time": "18:20:27", "remaining_time": "2:05:26"} -{"current_steps": 5800, "total_steps": 6450, "loss": 0.0003, "lr": 3.0618151621061466e-06, "epoch": 8.992248062015504, "percentage": 89.92, "elapsed_time": "18:21:47", "remaining_time": "2:03:28"} -{"current_steps": 5800, "total_steps": 6450, "eval_loss": 0.10091939568519592, "epoch": 8.992248062015504, "percentage": 89.92, "elapsed_time": "18:24:31", "remaining_time": "2:03:46"} -{"current_steps": 5810, "total_steps": 6450, "loss": 0.0, "lr": 2.9692667849828215e-06, "epoch": 9.007751937984496, "percentage": 90.08, "elapsed_time": "18:25:56", "remaining_time": "2:01:49"} -{"current_steps": 5820, "total_steps": 6450, "loss": 0.0006, "lr": 2.878095858314278e-06, "epoch": 9.023255813953488, "percentage": 90.23, "elapsed_time": "18:27:17", "remaining_time": "1:59:51"} -{"current_steps": 5830, "total_steps": 6450, "loss": 0.001, "lr": 2.7883050523424213e-06, "epoch": 9.03875968992248, "percentage": 90.39, "elapsed_time": "18:28:38", "remaining_time": "1:57:53"} -{"current_steps": 5840, "total_steps": 6450, "loss": 0.0005, "lr": 2.699896996887763e-06, "epoch": 9.054263565891473, "percentage": 90.54, "elapsed_time": "18:29:58", "remaining_time": "1:55:56"} -{"current_steps": 5850, "total_steps": 6450, "loss": 0.0001, "lr": 2.6128742812723704e-06, "epoch": 9.069767441860465, "percentage": 90.7, "elapsed_time": "18:31:19", "remaining_time": "1:53:58"} -{"current_steps": 5850, "total_steps": 6450, "eval_loss": 0.10133634507656097, "epoch": 9.069767441860465, "percentage": 90.7, "elapsed_time": "18:34:03", "remaining_time": "1:54:15"} -{"current_steps": 5860, "total_steps": 6450, "loss": 0.0, "lr": 2.5272394542440847e-06, "epoch": 9.085271317829458, "percentage": 90.85, "elapsed_time": "18:35:28", "remaining_time": "1:52:18"} -{"current_steps": 5870, "total_steps": 6450, "loss": 0.0005, "lr": 2.4429950239018284e-06, "epoch": 9.10077519379845, "percentage": 91.01, "elapsed_time": "18:36:49", "remaining_time": "1:50:21"} -{"current_steps": 5880, "total_steps": 6450, "loss": 0.0006, "lr": 2.3601434576221546e-06, "epoch": 9.116279069767442, "percentage": 91.16, "elapsed_time": "18:38:10", "remaining_time": "1:48:23"} -{"current_steps": 5890, "total_steps": 6450, "loss": 0.0006, "lr": 2.278687181987016e-06, "epoch": 9.131782945736434, "percentage": 91.32, "elapsed_time": "18:39:30", "remaining_time": "1:46:26"} -{"current_steps": 5900, "total_steps": 6450, "loss": 0.0004, "lr": 2.198628582712642e-06, "epoch": 9.147286821705427, "percentage": 91.47, "elapsed_time": "18:40:51", "remaining_time": "1:44:29"} -{"current_steps": 5900, "total_steps": 6450, "eval_loss": 0.10208235681056976, "epoch": 9.147286821705427, "percentage": 91.47, "elapsed_time": "18:43:35", "remaining_time": "1:44:44"} -{"current_steps": 5910, "total_steps": 6450, "loss": 0.0004, "lr": 2.1199700045797077e-06, "epoch": 9.162790697674419, "percentage": 91.63, "elapsed_time": "18:45:00", "remaining_time": "1:42:47"} -{"current_steps": 5920, "total_steps": 6450, "loss": 0.0004, "lr": 2.0427137513646167e-06, "epoch": 9.178294573643411, "percentage": 91.78, "elapsed_time": "18:46:20", "remaining_time": "1:40:50"} -{"current_steps": 5930, "total_steps": 6450, "loss": 0.0004, "lr": 1.9668620857720864e-06, "epoch": 9.193798449612403, "percentage": 91.94, "elapsed_time": "18:47:41", "remaining_time": "1:38:53"} -{"current_steps": 5940, "total_steps": 6450, "loss": 0.0006, "lr": 1.8924172293688147e-06, "epoch": 9.209302325581396, "percentage": 92.09, "elapsed_time": "18:49:01", "remaining_time": "1:36:56"} -{"current_steps": 5950, "total_steps": 6450, "loss": 0.0, "lr": 1.819381362518463e-06, "epoch": 9.224806201550388, "percentage": 92.25, "elapsed_time": "18:50:22", "remaining_time": "1:34:59"} -{"current_steps": 5950, "total_steps": 6450, "eval_loss": 0.10275321453809738, "epoch": 9.224806201550388, "percentage": 92.25, "elapsed_time": "18:53:06", "remaining_time": "1:35:13"} -{"current_steps": 5960, "total_steps": 6450, "loss": 0.0002, "lr": 1.7477566243177646e-06, "epoch": 9.24031007751938, "percentage": 92.4, "elapsed_time": "18:54:30", "remaining_time": "1:33:16"} -{"current_steps": 5970, "total_steps": 6450, "loss": 0.0003, "lr": 1.6775451125338959e-06, "epoch": 9.255813953488373, "percentage": 92.56, "elapsed_time": "18:55:51", "remaining_time": "1:31:19"} -{"current_steps": 5980, "total_steps": 6450, "loss": 0.0007, "lr": 1.6087488835430209e-06, "epoch": 9.271317829457365, "percentage": 92.71, "elapsed_time": "18:57:11", "remaining_time": "1:29:22"} -{"current_steps": 5990, "total_steps": 6450, "loss": 0.0001, "lr": 1.5413699522700775e-06, "epoch": 9.286821705426357, "percentage": 92.87, "elapsed_time": "18:58:32", "remaining_time": "1:27:26"} -{"current_steps": 6000, "total_steps": 6450, "loss": 0.0002, "lr": 1.4754102921297364e-06, "epoch": 9.30232558139535, "percentage": 93.02, "elapsed_time": "18:59:52", "remaining_time": "1:25:29"} -{"current_steps": 6000, "total_steps": 6450, "eval_loss": 0.10337940603494644, "epoch": 9.30232558139535, "percentage": 93.02, "elapsed_time": "19:02:36", "remaining_time": "1:25:41"} -{"current_steps": 6010, "total_steps": 6450, "loss": 0.0003, "lr": 1.4108718349686468e-06, "epoch": 9.317829457364342, "percentage": 93.18, "elapsed_time": "19:04:01", "remaining_time": "1:23:45"} -{"current_steps": 6020, "total_steps": 6450, "loss": 0.0009, "lr": 1.3477564710088098e-06, "epoch": 9.333333333333334, "percentage": 93.33, "elapsed_time": "19:05:21", "remaining_time": "1:21:48"} -{"current_steps": 6030, "total_steps": 6450, "loss": 0.0002, "lr": 1.2860660487922616e-06, "epoch": 9.348837209302326, "percentage": 93.49, "elapsed_time": "19:06:42", "remaining_time": "1:19:52"} -{"current_steps": 6040, "total_steps": 6450, "loss": 0.0003, "lr": 1.2258023751268887e-06, "epoch": 9.364341085271318, "percentage": 93.64, "elapsed_time": "19:08:02", "remaining_time": "1:17:55"} -{"current_steps": 6050, "total_steps": 6450, "loss": 0.0, "lr": 1.1669672150335486e-06, "epoch": 9.37984496124031, "percentage": 93.8, "elapsed_time": "19:09:22", "remaining_time": "1:15:59"} -{"current_steps": 6050, "total_steps": 6450, "eval_loss": 0.10398336499929428, "epoch": 9.37984496124031, "percentage": 93.8, "elapsed_time": "19:12:06", "remaining_time": "1:16:10"} -{"current_steps": 6060, "total_steps": 6450, "loss": 0.0001, "lr": 1.1095622916943494e-06, "epoch": 9.395348837209303, "percentage": 93.95, "elapsed_time": "19:13:31", "remaining_time": "1:14:14"} -{"current_steps": 6070, "total_steps": 6450, "loss": 0.0003, "lr": 1.0535892864021901e-06, "epoch": 9.410852713178295, "percentage": 94.11, "elapsed_time": "19:14:52", "remaining_time": "1:12:17"} -{"current_steps": 6080, "total_steps": 6450, "loss": 0.0006, "lr": 9.990498385115065e-07, "epoch": 9.426356589147288, "percentage": 94.26, "elapsed_time": "19:16:12", "remaining_time": "1:10:21"} -{"current_steps": 6090, "total_steps": 6450, "loss": 0.001, "lr": 9.459455453902866e-07, "epoch": 9.44186046511628, "percentage": 94.42, "elapsed_time": "19:17:32", "remaining_time": "1:08:25"} -{"current_steps": 6100, "total_steps": 6450, "loss": 0.0001, "lr": 8.942779623732578e-07, "epoch": 9.457364341085272, "percentage": 94.57, "elapsed_time": "19:18:52", "remaining_time": "1:06:29"} -{"current_steps": 6100, "total_steps": 6450, "eval_loss": 0.10399701446294785, "epoch": 9.457364341085272, "percentage": 94.57, "elapsed_time": "19:21:36", "remaining_time": "1:06:38"} -{"current_steps": 6110, "total_steps": 6450, "loss": 0.0004, "lr": 8.440486027163519e-07, "epoch": 9.472868217054264, "percentage": 94.73, "elapsed_time": "19:23:01", "remaining_time": "1:04:43"} -{"current_steps": 6120, "total_steps": 6450, "loss": 0.0001, "lr": 7.952589375523567e-07, "epoch": 9.488372093023255, "percentage": 94.88, "elapsed_time": "19:24:21", "remaining_time": "1:02:47"} -{"current_steps": 6130, "total_steps": 6450, "loss": 0.0005, "lr": 7.479103958478784e-07, "epoch": 9.503875968992247, "percentage": 95.04, "elapsed_time": "19:25:42", "remaining_time": "1:00:51"} -{"current_steps": 6140, "total_steps": 6450, "loss": 0.0004, "lr": 7.02004364361436e-07, "epoch": 9.51937984496124, "percentage": 95.19, "elapsed_time": "19:27:02", "remaining_time": "0:58:55"} -{"current_steps": 6150, "total_steps": 6450, "loss": 0.0, "lr": 6.57542187602872e-07, "epoch": 9.534883720930232, "percentage": 95.35, "elapsed_time": "19:28:23", "remaining_time": "0:56:59"} -{"current_steps": 6150, "total_steps": 6450, "eval_loss": 0.10399660468101501, "epoch": 9.534883720930232, "percentage": 95.35, "elapsed_time": "19:31:06", "remaining_time": "0:57:07"} -{"current_steps": 6160, "total_steps": 6450, "loss": 0.0, "lr": 6.145251677939778e-07, "epoch": 9.550387596899224, "percentage": 95.5, "elapsed_time": "19:32:32", "remaining_time": "0:55:12"} -{"current_steps": 6170, "total_steps": 6450, "loss": 0.0004, "lr": 5.729545648303525e-07, "epoch": 9.565891472868216, "percentage": 95.66, "elapsed_time": "19:33:52", "remaining_time": "0:53:16"} -{"current_steps": 6180, "total_steps": 6450, "loss": 0.0003, "lr": 5.328315962444874e-07, "epoch": 9.581395348837209, "percentage": 95.81, "elapsed_time": "19:35:12", "remaining_time": "0:51:20"} -{"current_steps": 6190, "total_steps": 6450, "loss": 0.0001, "lr": 4.94157437170123e-07, "epoch": 9.5968992248062, "percentage": 95.97, "elapsed_time": "19:36:32", "remaining_time": "0:49:25"} -{"current_steps": 6200, "total_steps": 6450, "loss": 0.0, "lr": 4.5693322030782584e-07, "epoch": 9.612403100775193, "percentage": 96.12, "elapsed_time": "19:37:53", "remaining_time": "0:47:29"} -{"current_steps": 6200, "total_steps": 6450, "eval_loss": 0.10415206849575043, "epoch": 9.612403100775193, "percentage": 96.12, "elapsed_time": "19:40:36", "remaining_time": "0:47:36"} -{"current_steps": 6210, "total_steps": 6450, "loss": 0.0003, "lr": 4.2116003589179887e-07, "epoch": 9.627906976744185, "percentage": 96.28, "elapsed_time": "19:42:01", "remaining_time": "0:45:40"} -{"current_steps": 6220, "total_steps": 6450, "loss": 0.0002, "lr": 3.868389316579846e-07, "epoch": 9.643410852713178, "percentage": 96.43, "elapsed_time": "19:43:22", "remaining_time": "0:43:45"} -{"current_steps": 6230, "total_steps": 6450, "loss": 0.0004, "lr": 3.5397091281333947e-07, "epoch": 9.65891472868217, "percentage": 96.59, "elapsed_time": "19:44:42", "remaining_time": "0:41:50"} -{"current_steps": 6240, "total_steps": 6450, "loss": 0.0001, "lr": 3.2255694200643006e-07, "epoch": 9.674418604651162, "percentage": 96.74, "elapsed_time": "19:46:02", "remaining_time": "0:39:54"} -{"current_steps": 6250, "total_steps": 6450, "loss": 0.0004, "lr": 2.9259793929921063e-07, "epoch": 9.689922480620154, "percentage": 96.9, "elapsed_time": "19:47:23", "remaining_time": "0:37:59"} -{"current_steps": 6250, "total_steps": 6450, "eval_loss": 0.10420067608356476, "epoch": 9.689922480620154, "percentage": 96.9, "elapsed_time": "19:50:06", "remaining_time": "0:38:05"} -{"current_steps": 6260, "total_steps": 6450, "loss": 0.0005, "lr": 2.640947821400841e-07, "epoch": 9.705426356589147, "percentage": 97.05, "elapsed_time": "19:51:33", "remaining_time": "0:36:09"} -{"current_steps": 6270, "total_steps": 6450, "loss": 0.0, "lr": 2.3704830533821108e-07, "epoch": 9.720930232558139, "percentage": 97.21, "elapsed_time": "19:52:53", "remaining_time": "0:34:14"} -{"current_steps": 6280, "total_steps": 6450, "loss": 0.0008, "lr": 2.1145930103904644e-07, "epoch": 9.736434108527131, "percentage": 97.36, "elapsed_time": "19:54:13", "remaining_time": "0:32:19"} -{"current_steps": 6290, "total_steps": 6450, "loss": 0.0015, "lr": 1.8732851870115754e-07, "epoch": 9.751937984496124, "percentage": 97.52, "elapsed_time": "19:55:34", "remaining_time": "0:30:24"} -{"current_steps": 6300, "total_steps": 6450, "loss": 0.0006, "lr": 1.6465666507425315e-07, "epoch": 9.767441860465116, "percentage": 97.67, "elapsed_time": "19:56:55", "remaining_time": "0:28:29"} -{"current_steps": 6300, "total_steps": 6450, "eval_loss": 0.10436151176691055, "epoch": 9.767441860465116, "percentage": 97.67, "elapsed_time": "19:59:38", "remaining_time": "0:28:33"} -{"current_steps": 6310, "total_steps": 6450, "loss": 0.0, "lr": 1.434444041784888e-07, "epoch": 9.782945736434108, "percentage": 97.83, "elapsed_time": "20:01:03", "remaining_time": "0:26:38"} -{"current_steps": 6320, "total_steps": 6450, "loss": 0.0, "lr": 1.236923572850379e-07, "epoch": 9.7984496124031, "percentage": 97.98, "elapsed_time": "20:02:23", "remaining_time": "0:24:43"} -{"current_steps": 6330, "total_steps": 6450, "loss": 0.0002, "lr": 1.0540110289786742e-07, "epoch": 9.813953488372093, "percentage": 98.14, "elapsed_time": "20:03:43", "remaining_time": "0:22:49"} -{"current_steps": 6340, "total_steps": 6450, "loss": 0.0003, "lr": 8.857117673681804e-08, "epoch": 9.829457364341085, "percentage": 98.29, "elapsed_time": "20:05:03", "remaining_time": "0:20:54"} -{"current_steps": 6350, "total_steps": 6450, "loss": 0.0006, "lr": 7.320307172190011e-08, "epoch": 9.844961240310077, "percentage": 98.45, "elapsed_time": "20:06:23", "remaining_time": "0:18:59"} -{"current_steps": 6350, "total_steps": 6450, "eval_loss": 0.10437916219234467, "epoch": 9.844961240310077, "percentage": 98.45, "elapsed_time": "20:09:07", "remaining_time": "0:19:02"} -{"current_steps": 6360, "total_steps": 6450, "loss": 0.0009, "lr": 5.929723795884967e-08, "epoch": 9.86046511627907, "percentage": 98.6, "elapsed_time": "20:10:31", "remaining_time": "0:17:07"} -{"current_steps": 6370, "total_steps": 6450, "loss": 0.0, "lr": 4.685408272597225e-08, "epoch": 9.875968992248062, "percentage": 98.76, "elapsed_time": "20:11:50", "remaining_time": "0:15:13"} -{"current_steps": 6380, "total_steps": 6450, "loss": 0.0, "lr": 3.587397046219132e-08, "epoch": 9.891472868217054, "percentage": 98.91, "elapsed_time": "20:13:10", "remaining_time": "0:13:18"} -{"current_steps": 6390, "total_steps": 6450, "loss": 0.0002, "lr": 2.6357222756384636e-08, "epoch": 9.906976744186046, "percentage": 99.07, "elapsed_time": "20:14:30", "remaining_time": "0:11:24"} -{"current_steps": 6400, "total_steps": 6450, "loss": 0.0003, "lr": 1.830411833795287e-08, "epoch": 9.922480620155039, "percentage": 99.22, "elapsed_time": "20:15:49", "remaining_time": "0:09:29"} -{"current_steps": 6400, "total_steps": 6450, "eval_loss": 0.10459784418344498, "epoch": 9.922480620155039, "percentage": 99.22, "elapsed_time": "20:18:30", "remaining_time": "0:09:31"} -{"current_steps": 6410, "total_steps": 6450, "loss": 0.0004, "lr": 1.1714893068687227e-08, "epoch": 9.937984496124031, "percentage": 99.38, "elapsed_time": "20:19:53", "remaining_time": "0:07:36"} -{"current_steps": 6420, "total_steps": 6450, "loss": 0.0, "lr": 6.589739935819461e-09, "epoch": 9.953488372093023, "percentage": 99.53, "elapsed_time": "20:21:12", "remaining_time": "0:05:42"} -{"current_steps": 6430, "total_steps": 6450, "loss": 0.0001, "lr": 2.928809046398584e-09, "epoch": 9.968992248062015, "percentage": 99.69, "elapsed_time": "20:22:30", "remaining_time": "0:03:48"} -{"current_steps": 6440, "total_steps": 6450, "loss": 0.0005, "lr": 7.322076228777341e-10, "epoch": 9.984496124031008, "percentage": 99.84, "elapsed_time": "20:23:49", "remaining_time": "0:01:54"} -{"current_steps": 6450, "total_steps": 6450, "loss": 0.0002, "lr": 0.0, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "20:25:08", "remaining_time": "0:00:00"} -{"current_steps": 6450, "total_steps": 6450, "eval_loss": 0.10437238216400146, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "20:27:48", "remaining_time": "0:00:00"} -{"current_steps": 6450, "total_steps": 6450, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "20:27:54", "remaining_time": "0:00:00"} +{"current_steps": 10, "total_steps": 3225, "loss": 1.585, "lr": 3.0959752321981426e-06, "epoch": 0.015503875968992248, "percentage": 0.31, "elapsed_time": "0:01:24", "remaining_time": "7:30:10"} +{"current_steps": 20, "total_steps": 3225, "loss": 1.523, "lr": 6.191950464396285e-06, "epoch": 0.031007751937984496, "percentage": 0.62, "elapsed_time": "0:02:48", "remaining_time": "7:29:51"} +{"current_steps": 30, "total_steps": 3225, "loss": 1.318, "lr": 9.287925696594429e-06, "epoch": 0.046511627906976744, "percentage": 0.93, "elapsed_time": "0:04:13", "remaining_time": "7:29:06"} +{"current_steps": 40, "total_steps": 3225, "loss": 0.8377, "lr": 1.238390092879257e-05, "epoch": 0.06201550387596899, "percentage": 1.24, "elapsed_time": "0:05:37", "remaining_time": "7:28:12"} +{"current_steps": 50, "total_steps": 3225, "loss": 0.5122, "lr": 1.5479876160990712e-05, "epoch": 0.07751937984496124, "percentage": 1.55, "elapsed_time": "0:07:02", "remaining_time": "7:27:01"} +{"current_steps": 50, "total_steps": 3225, "eval_loss": 0.41176876425743103, "epoch": 0.07751937984496124, "percentage": 1.55, "elapsed_time": "0:09:55", "remaining_time": "10:30:26"}