diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -1,791 +1,6 @@ -{"current_steps": 10, "total_steps": 6590, "loss": 1.5203, "lr": 1.5174506828528075e-06, "epoch": 0.015165876777251185, "percentage": 0.15, "elapsed_time": "0:01:18", "remaining_time": "14:18:47"} -{"current_steps": 20, "total_steps": 6590, "loss": 1.5103, "lr": 3.034901365705615e-06, "epoch": 0.03033175355450237, "percentage": 0.3, "elapsed_time": "0:02:36", "remaining_time": "14:15:22"} -{"current_steps": 30, "total_steps": 6590, "loss": 1.5543, "lr": 4.552352048558422e-06, "epoch": 0.04549763033175355, "percentage": 0.46, "elapsed_time": "0:03:53", "remaining_time": "14:11:35"} -{"current_steps": 40, "total_steps": 6590, "loss": 1.2872, "lr": 6.06980273141123e-06, "epoch": 0.06066350710900474, "percentage": 0.61, "elapsed_time": "0:05:11", "remaining_time": "14:09:19"} -{"current_steps": 50, "total_steps": 6590, "loss": 0.9962, "lr": 7.587253414264037e-06, "epoch": 0.07582938388625593, "percentage": 0.76, "elapsed_time": "0:06:28", "remaining_time": "14:07:36"} -{"current_steps": 50, "total_steps": 6590, "eval_loss": 0.7209104299545288, "epoch": 0.07582938388625593, "percentage": 0.76, "elapsed_time": "0:09:09", "remaining_time": "19:58:52"} -{"current_steps": 60, "total_steps": 6590, "loss": 0.8671, "lr": 9.104704097116844e-06, "epoch": 0.0909952606635071, "percentage": 0.91, "elapsed_time": "0:10:31", "remaining_time": "19:05:48"} -{"current_steps": 70, "total_steps": 6590, "loss": 0.5082, "lr": 1.0622154779969651e-05, "epoch": 0.1061611374407583, "percentage": 1.06, "elapsed_time": "0:11:49", "remaining_time": "18:21:27"} -{"current_steps": 80, "total_steps": 6590, "loss": 0.4098, "lr": 1.213960546282246e-05, "epoch": 0.12132701421800948, "percentage": 1.21, "elapsed_time": "0:13:07", "remaining_time": "17:47:33"} -{"current_steps": 90, "total_steps": 6590, "loss": 0.2307, "lr": 1.3657056145675265e-05, "epoch": 0.13649289099526066, "percentage": 1.37, "elapsed_time": "0:14:24", "remaining_time": "17:20:43"} -{"current_steps": 100, "total_steps": 6590, "loss": 0.1767, "lr": 1.5174506828528074e-05, "epoch": 0.15165876777251186, "percentage": 1.52, "elapsed_time": "0:15:42", "remaining_time": "16:59:22"} -{"current_steps": 100, "total_steps": 6590, "eval_loss": 0.15857024490833282, "epoch": 0.15165876777251186, "percentage": 1.52, "elapsed_time": "0:18:23", "remaining_time": "19:53:28"} -{"current_steps": 110, "total_steps": 6590, "loss": 0.164, "lr": 1.6691957511380883e-05, "epoch": 0.16682464454976303, "percentage": 1.67, "elapsed_time": "0:19:46", "remaining_time": "19:24:46"} -{"current_steps": 120, "total_steps": 6590, "loss": 0.1124, "lr": 1.8209408194233688e-05, "epoch": 0.1819905213270142, "percentage": 1.82, "elapsed_time": "0:21:03", "remaining_time": "18:55:45"} -{"current_steps": 130, "total_steps": 6590, "loss": 0.0971, "lr": 1.9726858877086497e-05, "epoch": 0.1971563981042654, "percentage": 1.97, "elapsed_time": "0:22:21", "remaining_time": "18:31:01"} -{"current_steps": 140, "total_steps": 6590, "loss": 0.0853, "lr": 2.1244309559939302e-05, "epoch": 0.2123222748815166, "percentage": 2.12, "elapsed_time": "0:23:39", "remaining_time": "18:09:41"} -{"current_steps": 150, "total_steps": 6590, "loss": 0.0837, "lr": 2.276176024279211e-05, "epoch": 0.22748815165876776, "percentage": 2.28, "elapsed_time": "0:24:56", "remaining_time": "17:51:05"} -{"current_steps": 150, "total_steps": 6590, "eval_loss": 0.07980982959270477, "epoch": 0.22748815165876776, "percentage": 2.28, "elapsed_time": "0:27:37", "remaining_time": "19:46:16"} -{"current_steps": 160, "total_steps": 6590, "loss": 0.0933, "lr": 2.427921092564492e-05, "epoch": 0.24265402843601896, "percentage": 2.43, "elapsed_time": "0:29:00", "remaining_time": "19:25:27"} -{"current_steps": 170, "total_steps": 6590, "loss": 0.0997, "lr": 2.5796661608497725e-05, "epoch": 0.25781990521327014, "percentage": 2.58, "elapsed_time": "0:30:17", "remaining_time": "19:04:06"} -{"current_steps": 180, "total_steps": 6590, "loss": 0.0668, "lr": 2.731411229135053e-05, "epoch": 0.2729857819905213, "percentage": 2.73, "elapsed_time": "0:31:35", "remaining_time": "18:45:09"} -{"current_steps": 190, "total_steps": 6590, "loss": 0.0623, "lr": 2.883156297420334e-05, "epoch": 0.2881516587677725, "percentage": 2.88, "elapsed_time": "0:32:53", "remaining_time": "18:27:39"} -{"current_steps": 200, "total_steps": 6590, "loss": 0.0672, "lr": 3.0349013657056148e-05, "epoch": 0.3033175355450237, "percentage": 3.03, "elapsed_time": "0:34:10", "remaining_time": "18:11:53"} -{"current_steps": 200, "total_steps": 6590, "eval_loss": 0.06620903313159943, "epoch": 0.3033175355450237, "percentage": 3.03, "elapsed_time": "0:36:51", "remaining_time": "19:37:39"} -{"current_steps": 210, "total_steps": 6590, "loss": 0.0675, "lr": 3.1866464339908954e-05, "epoch": 0.3184834123222749, "percentage": 3.19, "elapsed_time": "0:38:14", "remaining_time": "19:21:43"} -{"current_steps": 220, "total_steps": 6590, "loss": 0.083, "lr": 3.3383915022761766e-05, "epoch": 0.33364928909952607, "percentage": 3.34, "elapsed_time": "0:39:32", "remaining_time": "19:04:44"} -{"current_steps": 230, "total_steps": 6590, "loss": 0.051, "lr": 3.490136570561457e-05, "epoch": 0.34881516587677724, "percentage": 3.49, "elapsed_time": "0:40:49", "remaining_time": "18:49:00"} -{"current_steps": 240, "total_steps": 6590, "loss": 0.0484, "lr": 3.6418816388467377e-05, "epoch": 0.3639810426540284, "percentage": 3.64, "elapsed_time": "0:42:06", "remaining_time": "18:34:18"} -{"current_steps": 250, "total_steps": 6590, "loss": 0.0585, "lr": 3.793626707132019e-05, "epoch": 0.3791469194312796, "percentage": 3.79, "elapsed_time": "0:43:24", "remaining_time": "18:20:54"} -{"current_steps": 250, "total_steps": 6590, "eval_loss": 0.05650362744927406, "epoch": 0.3791469194312796, "percentage": 3.79, "elapsed_time": "0:46:05", "remaining_time": "19:28:57"} -{"current_steps": 260, "total_steps": 6590, "loss": 0.0587, "lr": 3.9453717754172994e-05, "epoch": 0.3943127962085308, "percentage": 3.95, "elapsed_time": "0:47:27", "remaining_time": "19:15:24"} -{"current_steps": 270, "total_steps": 6590, "loss": 0.049, "lr": 4.09711684370258e-05, "epoch": 0.409478672985782, "percentage": 4.1, "elapsed_time": "0:48:45", "remaining_time": "19:01:13"} -{"current_steps": 280, "total_steps": 6590, "loss": 0.0536, "lr": 4.2488619119878605e-05, "epoch": 0.4246445497630332, "percentage": 4.25, "elapsed_time": "0:50:02", "remaining_time": "18:47:51"} -{"current_steps": 290, "total_steps": 6590, "loss": 0.0684, "lr": 4.400606980273142e-05, "epoch": 0.43981042654028435, "percentage": 4.4, "elapsed_time": "0:51:20", "remaining_time": "18:35:24"} -{"current_steps": 300, "total_steps": 6590, "loss": 0.0501, "lr": 4.552352048558422e-05, "epoch": 0.4549763033175355, "percentage": 4.55, "elapsed_time": "0:52:38", "remaining_time": "18:23:42"} -{"current_steps": 300, "total_steps": 6590, "eval_loss": 0.050522029399871826, "epoch": 0.4549763033175355, "percentage": 4.55, "elapsed_time": "0:55:19", "remaining_time": "19:19:59"} -{"current_steps": 310, "total_steps": 6590, "loss": 0.0586, "lr": 4.704097116843703e-05, "epoch": 0.47014218009478675, "percentage": 4.7, "elapsed_time": "0:56:41", "remaining_time": "19:08:32"} -{"current_steps": 320, "total_steps": 6590, "loss": 0.0456, "lr": 4.855842185128984e-05, "epoch": 0.48530805687203793, "percentage": 4.86, "elapsed_time": "0:57:59", "remaining_time": "18:56:17"} -{"current_steps": 330, "total_steps": 6590, "loss": 0.0612, "lr": 5.0075872534142645e-05, "epoch": 0.500473933649289, "percentage": 5.01, "elapsed_time": "0:59:17", "remaining_time": "18:44:40"} -{"current_steps": 340, "total_steps": 6590, "loss": 0.0573, "lr": 5.159332321699545e-05, "epoch": 0.5156398104265403, "percentage": 5.16, "elapsed_time": "1:00:34", "remaining_time": "18:33:34"} -{"current_steps": 350, "total_steps": 6590, "loss": 0.0571, "lr": 5.3110773899848256e-05, "epoch": 0.5308056872037915, "percentage": 5.31, "elapsed_time": "1:01:52", "remaining_time": "18:23:09"} -{"current_steps": 350, "total_steps": 6590, "eval_loss": 0.048958808183670044, "epoch": 0.5308056872037915, "percentage": 5.31, "elapsed_time": "1:04:33", "remaining_time": "19:11:01"} -{"current_steps": 360, "total_steps": 6590, "loss": 0.0538, "lr": 5.462822458270106e-05, "epoch": 0.5459715639810426, "percentage": 5.46, "elapsed_time": "1:05:55", "remaining_time": "19:00:52"} -{"current_steps": 370, "total_steps": 6590, "loss": 0.033, "lr": 5.6145675265553874e-05, "epoch": 0.5611374407582939, "percentage": 5.61, "elapsed_time": "1:07:13", "remaining_time": "18:50:01"} -{"current_steps": 380, "total_steps": 6590, "loss": 0.0678, "lr": 5.766312594840668e-05, "epoch": 0.576303317535545, "percentage": 5.77, "elapsed_time": "1:08:31", "remaining_time": "18:39:43"} -{"current_steps": 390, "total_steps": 6590, "loss": 0.0715, "lr": 5.9180576631259484e-05, "epoch": 0.5914691943127962, "percentage": 5.92, "elapsed_time": "1:09:48", "remaining_time": "18:29:51"} -{"current_steps": 400, "total_steps": 6590, "loss": 0.0694, "lr": 6.0698027314112297e-05, "epoch": 0.6066350710900474, "percentage": 6.07, "elapsed_time": "1:11:06", "remaining_time": "18:20:23"} -{"current_steps": 400, "total_steps": 6590, "eval_loss": 0.04914228990674019, "epoch": 0.6066350710900474, "percentage": 6.07, "elapsed_time": "1:13:47", "remaining_time": "19:01:55"} -{"current_steps": 410, "total_steps": 6590, "loss": 0.0445, "lr": 6.22154779969651e-05, "epoch": 0.6218009478672986, "percentage": 6.22, "elapsed_time": "1:15:09", "remaining_time": "18:52:55"} -{"current_steps": 420, "total_steps": 6590, "loss": 0.0381, "lr": 6.373292867981791e-05, "epoch": 0.6369668246445498, "percentage": 6.37, "elapsed_time": "1:16:27", "remaining_time": "18:43:05"} -{"current_steps": 430, "total_steps": 6590, "loss": 0.0671, "lr": 6.525037936267073e-05, "epoch": 0.6521327014218009, "percentage": 6.53, "elapsed_time": "1:17:45", "remaining_time": "18:33:50"} -{"current_steps": 440, "total_steps": 6590, "loss": 0.0485, "lr": 6.676783004552353e-05, "epoch": 0.6672985781990521, "percentage": 6.68, "elapsed_time": "1:19:02", "remaining_time": "18:24:51"} -{"current_steps": 450, "total_steps": 6590, "loss": 0.0582, "lr": 6.828528072837634e-05, "epoch": 0.6824644549763034, "percentage": 6.83, "elapsed_time": "1:20:20", "remaining_time": "18:16:08"} -{"current_steps": 450, "total_steps": 6590, "eval_loss": 0.04864715039730072, "epoch": 0.6824644549763034, "percentage": 6.83, "elapsed_time": "1:23:01", "remaining_time": "18:52:46"} -{"current_steps": 460, "total_steps": 6590, "loss": 0.0492, "lr": 6.980273141122914e-05, "epoch": 0.6976303317535545, "percentage": 6.98, "elapsed_time": "1:24:23", "remaining_time": "18:44:32"} -{"current_steps": 470, "total_steps": 6590, "loss": 0.051, "lr": 7.132018209408195e-05, "epoch": 0.7127962085308057, "percentage": 7.13, "elapsed_time": "1:25:40", "remaining_time": "18:35:42"} -{"current_steps": 480, "total_steps": 6590, "loss": 0.0411, "lr": 7.283763277693475e-05, "epoch": 0.7279620853080568, "percentage": 7.28, "elapsed_time": "1:26:58", "remaining_time": "18:27:10"} -{"current_steps": 490, "total_steps": 6590, "loss": 0.061, "lr": 7.435508345978756e-05, "epoch": 0.7431279620853081, "percentage": 7.44, "elapsed_time": "1:28:16", "remaining_time": "18:18:56"} -{"current_steps": 500, "total_steps": 6590, "loss": 0.0363, "lr": 7.587253414264038e-05, "epoch": 0.7582938388625592, "percentage": 7.59, "elapsed_time": "1:29:34", "remaining_time": "18:10:55"} -{"current_steps": 500, "total_steps": 6590, "eval_loss": 0.043231334537267685, "epoch": 0.7582938388625592, "percentage": 7.59, "elapsed_time": "1:32:15", "remaining_time": "18:43:37"} -{"current_steps": 510, "total_steps": 6590, "loss": 0.0536, "lr": 7.738998482549318e-05, "epoch": 0.7734597156398104, "percentage": 7.74, "elapsed_time": "1:33:37", "remaining_time": "18:36:05"} -{"current_steps": 520, "total_steps": 6590, "loss": 0.0417, "lr": 7.890743550834599e-05, "epoch": 0.7886255924170616, "percentage": 7.89, "elapsed_time": "1:34:54", "remaining_time": "18:27:54"} -{"current_steps": 530, "total_steps": 6590, "loss": 0.0563, "lr": 8.04248861911988e-05, "epoch": 0.8037914691943128, "percentage": 8.04, "elapsed_time": "1:36:12", "remaining_time": "18:19:58"} -{"current_steps": 540, "total_steps": 6590, "loss": 0.0445, "lr": 8.19423368740516e-05, "epoch": 0.818957345971564, "percentage": 8.19, "elapsed_time": "1:37:30", "remaining_time": "18:12:26"} -{"current_steps": 550, "total_steps": 6590, "loss": 0.0349, "lr": 8.34597875569044e-05, "epoch": 0.8341232227488151, "percentage": 8.35, "elapsed_time": "1:38:48", "remaining_time": "18:05:00"} -{"current_steps": 550, "total_steps": 6590, "eval_loss": 0.04664945974946022, "epoch": 0.8341232227488151, "percentage": 8.35, "elapsed_time": "1:41:29", "remaining_time": "18:34:28"} -{"current_steps": 560, "total_steps": 6590, "loss": 0.0444, "lr": 8.497723823975721e-05, "epoch": 0.8492890995260663, "percentage": 8.5, "elapsed_time": "1:42:50", "remaining_time": "18:27:26"} -{"current_steps": 570, "total_steps": 6590, "loss": 0.0515, "lr": 8.649468892261003e-05, "epoch": 0.8644549763033176, "percentage": 8.65, "elapsed_time": "1:44:08", "remaining_time": "18:19:52"} -{"current_steps": 580, "total_steps": 6590, "loss": 0.0543, "lr": 8.801213960546283e-05, "epoch": 0.8796208530805687, "percentage": 8.8, "elapsed_time": "1:45:25", "remaining_time": "18:12:28"} -{"current_steps": 590, "total_steps": 6590, "loss": 0.0602, "lr": 8.952959028831564e-05, "epoch": 0.8947867298578199, "percentage": 8.95, "elapsed_time": "1:46:43", "remaining_time": "18:05:18"} -{"current_steps": 600, "total_steps": 6590, "loss": 0.0473, "lr": 9.104704097116844e-05, "epoch": 0.909952606635071, "percentage": 9.1, "elapsed_time": "1:48:01", "remaining_time": "17:58:24"} -{"current_steps": 600, "total_steps": 6590, "eval_loss": 0.04575315862894058, "epoch": 0.909952606635071, "percentage": 9.1, "elapsed_time": "1:50:42", "remaining_time": "18:25:12"} -{"current_steps": 610, "total_steps": 6590, "loss": 0.038, "lr": 9.256449165402125e-05, "epoch": 0.9251184834123223, "percentage": 9.26, "elapsed_time": "1:52:05", "remaining_time": "18:18:48"} -{"current_steps": 620, "total_steps": 6590, "loss": 0.0343, "lr": 9.408194233687406e-05, "epoch": 0.9402843601895735, "percentage": 9.41, "elapsed_time": "1:53:22", "remaining_time": "18:11:45"} -{"current_steps": 630, "total_steps": 6590, "loss": 0.0532, "lr": 9.559939301972687e-05, "epoch": 0.9554502369668246, "percentage": 9.56, "elapsed_time": "1:54:40", "remaining_time": "18:04:51"} -{"current_steps": 640, "total_steps": 6590, "loss": 0.0407, "lr": 9.711684370257968e-05, "epoch": 0.9706161137440759, "percentage": 9.71, "elapsed_time": "1:55:58", "remaining_time": "17:58:08"} -{"current_steps": 650, "total_steps": 6590, "loss": 0.0493, "lr": 9.863429438543249e-05, "epoch": 0.985781990521327, "percentage": 9.86, "elapsed_time": "1:57:15", "remaining_time": "17:51:37"} -{"current_steps": 650, "total_steps": 6590, "eval_loss": 0.04452311992645264, "epoch": 0.985781990521327, "percentage": 9.86, "elapsed_time": "1:59:57", "remaining_time": "18:16:10"} -{"current_steps": 660, "total_steps": 6590, "loss": 0.0454, "lr": 9.999999298570713e-05, "epoch": 1.000947867298578, "percentage": 10.02, "elapsed_time": "2:01:19", "remaining_time": "18:10:04"} -{"current_steps": 670, "total_steps": 6590, "loss": 0.04, "lr": 9.99991512729427e-05, "epoch": 1.0161137440758294, "percentage": 10.17, "elapsed_time": "2:02:36", "remaining_time": "18:03:24"} -{"current_steps": 680, "total_steps": 6590, "loss": 0.0448, "lr": 9.999690672866212e-05, "epoch": 1.0312796208530806, "percentage": 10.32, "elapsed_time": "2:03:54", "remaining_time": "17:56:57"} -{"current_steps": 690, "total_steps": 6590, "loss": 0.0442, "lr": 9.999325941584081e-05, "epoch": 1.0464454976303317, "percentage": 10.47, "elapsed_time": "2:05:12", "remaining_time": "17:50:38"} -{"current_steps": 700, "total_steps": 6590, "loss": 0.0371, "lr": 9.99882094368118e-05, "epoch": 1.061611374407583, "percentage": 10.62, "elapsed_time": "2:06:30", "remaining_time": "17:44:30"} -{"current_steps": 700, "total_steps": 6590, "eval_loss": 0.0471104234457016, "epoch": 1.061611374407583, "percentage": 10.62, "elapsed_time": "2:09:11", "remaining_time": "18:07:05"} -{"current_steps": 710, "total_steps": 6590, "loss": 0.0341, "lr": 9.99817569332629e-05, "epoch": 1.0767772511848341, "percentage": 10.77, "elapsed_time": "2:10:33", "remaining_time": "18:01:16"} -{"current_steps": 720, "total_steps": 6590, "loss": 0.0509, "lr": 9.99739020862327e-05, "epoch": 1.0919431279620853, "percentage": 10.93, "elapsed_time": "2:11:51", "remaining_time": "17:55:01"} -{"current_steps": 730, "total_steps": 6590, "loss": 0.0432, "lr": 9.996464511610545e-05, "epoch": 1.1071090047393364, "percentage": 11.08, "elapsed_time": "2:13:09", "remaining_time": "17:48:54"} -{"current_steps": 740, "total_steps": 6590, "loss": 0.0485, "lr": 9.9953986282605e-05, "epoch": 1.1222748815165877, "percentage": 11.23, "elapsed_time": "2:14:27", "remaining_time": "17:42:54"} -{"current_steps": 750, "total_steps": 6590, "loss": 0.0413, "lr": 9.994192588478732e-05, "epoch": 1.1374407582938388, "percentage": 11.38, "elapsed_time": "2:15:45", "remaining_time": "17:37:03"} -{"current_steps": 750, "total_steps": 6590, "eval_loss": 0.04678098484873772, "epoch": 1.1374407582938388, "percentage": 11.38, "elapsed_time": "2:18:26", "remaining_time": "17:57:57"} -{"current_steps": 760, "total_steps": 6590, "loss": 0.0334, "lr": 9.992846426103231e-05, "epoch": 1.15260663507109, "percentage": 11.53, "elapsed_time": "2:19:48", "remaining_time": "17:52:26"} -{"current_steps": 770, "total_steps": 6590, "loss": 0.0436, "lr": 9.991360178903418e-05, "epoch": 1.1677725118483413, "percentage": 11.68, "elapsed_time": "2:21:05", "remaining_time": "17:46:28"} -{"current_steps": 780, "total_steps": 6590, "loss": 0.0471, "lr": 9.989733888579087e-05, "epoch": 1.1829383886255924, "percentage": 11.84, "elapsed_time": "2:22:23", "remaining_time": "17:40:37"} -{"current_steps": 790, "total_steps": 6590, "loss": 0.0403, "lr": 9.98796760075924e-05, "epoch": 1.1981042654028435, "percentage": 11.99, "elapsed_time": "2:23:41", "remaining_time": "17:34:55"} -{"current_steps": 800, "total_steps": 6590, "loss": 0.0379, "lr": 9.986061365000804e-05, "epoch": 1.2132701421800949, "percentage": 12.14, "elapsed_time": "2:24:58", "remaining_time": "17:29:18"} -{"current_steps": 800, "total_steps": 6590, "eval_loss": 0.039671480655670166, "epoch": 1.2132701421800949, "percentage": 12.14, "elapsed_time": "2:27:40", "remaining_time": "17:48:44"} -{"current_steps": 810, "total_steps": 6590, "loss": 0.0384, "lr": 9.984015234787239e-05, "epoch": 1.228436018957346, "percentage": 12.29, "elapsed_time": "2:29:01", "remaining_time": "17:43:26"} -{"current_steps": 820, "total_steps": 6590, "loss": 0.0425, "lr": 9.981829267527036e-05, "epoch": 1.2436018957345971, "percentage": 12.44, "elapsed_time": "2:30:19", "remaining_time": "17:37:46"} -{"current_steps": 830, "total_steps": 6590, "loss": 0.033, "lr": 9.979503524552112e-05, "epoch": 1.2587677725118485, "percentage": 12.59, "elapsed_time": "2:31:37", "remaining_time": "17:32:12"} -{"current_steps": 840, "total_steps": 6590, "loss": 0.0329, "lr": 9.977038071116087e-05, "epoch": 1.2739336492890996, "percentage": 12.75, "elapsed_time": "2:32:55", "remaining_time": "17:26:45"} -{"current_steps": 850, "total_steps": 6590, "loss": 0.0351, "lr": 9.974432976392451e-05, "epoch": 1.2890995260663507, "percentage": 12.9, "elapsed_time": "2:34:12", "remaining_time": "17:21:22"} -{"current_steps": 850, "total_steps": 6590, "eval_loss": 0.041223689913749695, "epoch": 1.2890995260663507, "percentage": 12.9, "elapsed_time": "2:36:53", "remaining_time": "17:39:31"} -{"current_steps": 860, "total_steps": 6590, "loss": 0.057, "lr": 9.971688313472623e-05, "epoch": 1.3042654028436018, "percentage": 13.05, "elapsed_time": "2:38:18", "remaining_time": "17:34:43"} -{"current_steps": 870, "total_steps": 6590, "loss": 0.0448, "lr": 9.968804159363903e-05, "epoch": 1.3194312796208532, "percentage": 13.2, "elapsed_time": "2:39:35", "remaining_time": "17:29:17"} -{"current_steps": 880, "total_steps": 6590, "loss": 0.0363, "lr": 9.965780594987311e-05, "epoch": 1.3345971563981043, "percentage": 13.35, "elapsed_time": "2:40:53", "remaining_time": "17:23:56"} -{"current_steps": 890, "total_steps": 6590, "loss": 0.0306, "lr": 9.962617705175314e-05, "epoch": 1.3497630331753554, "percentage": 13.51, "elapsed_time": "2:42:10", "remaining_time": "17:18:41"} -{"current_steps": 900, "total_steps": 6590, "loss": 0.03, "lr": 9.95931557866945e-05, "epoch": 1.3649289099526065, "percentage": 13.66, "elapsed_time": "2:43:28", "remaining_time": "17:13:30"} -{"current_steps": 900, "total_steps": 6590, "eval_loss": 0.04190010949969292, "epoch": 1.3649289099526065, "percentage": 13.66, "elapsed_time": "2:46:09", "remaining_time": "17:30:29"} -{"current_steps": 910, "total_steps": 6590, "loss": 0.0396, "lr": 9.955874308117835e-05, "epoch": 1.3800947867298579, "percentage": 13.81, "elapsed_time": "2:47:31", "remaining_time": "17:25:38"} -{"current_steps": 920, "total_steps": 6590, "loss": 0.0453, "lr": 9.952293990072558e-05, "epoch": 1.395260663507109, "percentage": 13.96, "elapsed_time": "2:48:49", "remaining_time": "17:20:26"} -{"current_steps": 930, "total_steps": 6590, "loss": 0.0359, "lr": 9.948574724986992e-05, "epoch": 1.41042654028436, "percentage": 14.11, "elapsed_time": "2:50:06", "remaining_time": "17:15:19"} -{"current_steps": 940, "total_steps": 6590, "loss": 0.0399, "lr": 9.944716617212948e-05, "epoch": 1.4255924170616114, "percentage": 14.26, "elapsed_time": "2:51:24", "remaining_time": "17:10:17"} -{"current_steps": 950, "total_steps": 6590, "loss": 0.0321, "lr": 9.94071977499777e-05, "epoch": 1.4407582938388626, "percentage": 14.42, "elapsed_time": "2:52:42", "remaining_time": "17:05:17"} -{"current_steps": 950, "total_steps": 6590, "eval_loss": 0.04309966787695885, "epoch": 1.4407582938388626, "percentage": 14.42, "elapsed_time": "2:55:23", "remaining_time": "17:21:13"} -{"current_steps": 960, "total_steps": 6590, "loss": 0.0406, "lr": 9.936584310481285e-05, "epoch": 1.4559241706161137, "percentage": 14.57, "elapsed_time": "2:56:45", "remaining_time": "17:16:35"} -{"current_steps": 970, "total_steps": 6590, "loss": 0.0328, "lr": 9.932310339692661e-05, "epoch": 1.471090047393365, "percentage": 14.72, "elapsed_time": "2:58:03", "remaining_time": "17:11:35"} -{"current_steps": 980, "total_steps": 6590, "loss": 0.0339, "lr": 9.927897982547154e-05, "epoch": 1.4862559241706161, "percentage": 14.87, "elapsed_time": "2:59:20", "remaining_time": "17:06:40"} -{"current_steps": 990, "total_steps": 6590, "loss": 0.0371, "lr": 9.923347362842736e-05, "epoch": 1.5014218009478673, "percentage": 15.02, "elapsed_time": "3:00:38", "remaining_time": "17:01:47"} -{"current_steps": 1000, "total_steps": 6590, "loss": 0.0448, "lr": 9.918658608256633e-05, "epoch": 1.5165876777251186, "percentage": 15.17, "elapsed_time": "3:01:56", "remaining_time": "16:57:00"} -{"current_steps": 1000, "total_steps": 6590, "eval_loss": 0.038589827716350555, "epoch": 1.5165876777251186, "percentage": 15.17, "elapsed_time": "3:04:37", "remaining_time": "17:12:01"} -{"current_steps": 1010, "total_steps": 6590, "loss": 0.0325, "lr": 9.913831850341726e-05, "epoch": 1.5317535545023697, "percentage": 15.33, "elapsed_time": "3:05:59", "remaining_time": "17:07:33"} -{"current_steps": 1020, "total_steps": 6590, "loss": 0.0259, "lr": 9.908867224522881e-05, "epoch": 1.5469194312796208, "percentage": 15.48, "elapsed_time": "3:07:17", "remaining_time": "17:02:44"} -{"current_steps": 1030, "total_steps": 6590, "loss": 0.029, "lr": 9.903764870093136e-05, "epoch": 1.5620853080568722, "percentage": 15.63, "elapsed_time": "3:08:35", "remaining_time": "16:57:59"} -{"current_steps": 1040, "total_steps": 6590, "loss": 0.0453, "lr": 9.898524930209786e-05, "epoch": 1.577251184834123, "percentage": 15.78, "elapsed_time": "3:09:53", "remaining_time": "16:53:20"} -{"current_steps": 1050, "total_steps": 6590, "loss": 0.0301, "lr": 9.893147551890387e-05, "epoch": 1.5924170616113744, "percentage": 15.93, "elapsed_time": "3:11:10", "remaining_time": "16:48:41"} -{"current_steps": 1050, "total_steps": 6590, "eval_loss": 0.03665034472942352, "epoch": 1.5924170616113744, "percentage": 15.93, "elapsed_time": "3:13:51", "remaining_time": "17:02:51"} -{"current_steps": 1060, "total_steps": 6590, "loss": 0.0391, "lr": 9.887632886008616e-05, "epoch": 1.6075829383886255, "percentage": 16.08, "elapsed_time": "3:15:14", "remaining_time": "16:58:32"} -{"current_steps": 1070, "total_steps": 6590, "loss": 0.0389, "lr": 9.88198108729004e-05, "epoch": 1.6227488151658767, "percentage": 16.24, "elapsed_time": "3:16:31", "remaining_time": "16:53:51"} -{"current_steps": 1080, "total_steps": 6590, "loss": 0.0356, "lr": 9.876192314307777e-05, "epoch": 1.637914691943128, "percentage": 16.39, "elapsed_time": "3:17:49", "remaining_time": "16:49:15"} -{"current_steps": 1090, "total_steps": 6590, "loss": 0.0366, "lr": 9.87026672947805e-05, "epoch": 1.6530805687203791, "percentage": 16.54, "elapsed_time": "3:19:06", "remaining_time": "16:44:41"} -{"current_steps": 1100, "total_steps": 6590, "loss": 0.0248, "lr": 9.864204499055624e-05, "epoch": 1.6682464454976302, "percentage": 16.69, "elapsed_time": "3:20:24", "remaining_time": "16:40:12"} -{"current_steps": 1100, "total_steps": 6590, "eval_loss": 0.03758285939693451, "epoch": 1.6682464454976302, "percentage": 16.69, "elapsed_time": "3:23:05", "remaining_time": "16:53:36"} -{"current_steps": 1110, "total_steps": 6590, "loss": 0.044, "lr": 9.858005793129143e-05, "epoch": 1.6834123222748816, "percentage": 16.84, "elapsed_time": "3:24:27", "remaining_time": "16:49:25"} -{"current_steps": 1120, "total_steps": 6590, "loss": 0.0308, "lr": 9.851670785616358e-05, "epoch": 1.6985781990521327, "percentage": 17.0, "elapsed_time": "3:25:45", "remaining_time": "16:44:54"} -{"current_steps": 1130, "total_steps": 6590, "loss": 0.0334, "lr": 9.845199654259254e-05, "epoch": 1.7137440758293838, "percentage": 17.15, "elapsed_time": "3:27:03", "remaining_time": "16:40:27"} -{"current_steps": 1140, "total_steps": 6590, "loss": 0.0316, "lr": 9.83859258061905e-05, "epoch": 1.7289099526066352, "percentage": 17.3, "elapsed_time": "3:28:21", "remaining_time": "16:36:04"} -{"current_steps": 1150, "total_steps": 6590, "loss": 0.0315, "lr": 9.831849750071118e-05, "epoch": 1.7440758293838863, "percentage": 17.45, "elapsed_time": "3:29:38", "remaining_time": "16:31:43"} -{"current_steps": 1150, "total_steps": 6590, "eval_loss": 0.038996778428554535, "epoch": 1.7440758293838863, "percentage": 17.45, "elapsed_time": "3:32:20", "remaining_time": "16:44:25"} -{"current_steps": 1160, "total_steps": 6590, "loss": 0.0422, "lr": 9.82497135179977e-05, "epoch": 1.7592417061611374, "percentage": 17.6, "elapsed_time": "3:33:42", "remaining_time": "16:40:21"} -{"current_steps": 1170, "total_steps": 6590, "loss": 0.032, "lr": 9.817957578792962e-05, "epoch": 1.7744075829383887, "percentage": 17.75, "elapsed_time": "3:34:59", "remaining_time": "16:35:58"} -{"current_steps": 1180, "total_steps": 6590, "loss": 0.0243, "lr": 9.810808627836869e-05, "epoch": 1.7895734597156399, "percentage": 17.91, "elapsed_time": "3:36:17", "remaining_time": "16:31:40"} -{"current_steps": 1190, "total_steps": 6590, "loss": 0.0444, "lr": 9.803524699510374e-05, "epoch": 1.804739336492891, "percentage": 18.06, "elapsed_time": "3:37:35", "remaining_time": "16:27:22"} -{"current_steps": 1200, "total_steps": 6590, "loss": 0.0357, "lr": 9.796105998179424e-05, "epoch": 1.8199052132701423, "percentage": 18.21, "elapsed_time": "3:38:53", "remaining_time": "16:23:09"} -{"current_steps": 1200, "total_steps": 6590, "eval_loss": 0.036896735429763794, "epoch": 1.8199052132701423, "percentage": 18.21, "elapsed_time": "3:41:34", "remaining_time": "16:35:13"} -{"current_steps": 1210, "total_steps": 6590, "loss": 0.0317, "lr": 9.788552731991316e-05, "epoch": 1.8350710900473932, "percentage": 18.36, "elapsed_time": "3:42:56", "remaining_time": "16:31:15"} -{"current_steps": 1220, "total_steps": 6590, "loss": 0.0296, "lr": 9.780865112868847e-05, "epoch": 1.8502369668246446, "percentage": 18.51, "elapsed_time": "3:44:14", "remaining_time": "16:27:00"} -{"current_steps": 1230, "total_steps": 6590, "loss": 0.0315, "lr": 9.773043356504362e-05, "epoch": 1.865402843601896, "percentage": 18.66, "elapsed_time": "3:45:31", "remaining_time": "16:22:47"} -{"current_steps": 1240, "total_steps": 6590, "loss": 0.0479, "lr": 9.765087682353715e-05, "epoch": 1.8805687203791468, "percentage": 18.82, "elapsed_time": "3:46:49", "remaining_time": "16:18:39"} -{"current_steps": 1250, "total_steps": 6590, "loss": 0.0357, "lr": 9.756998313630103e-05, "epoch": 1.8957345971563981, "percentage": 18.97, "elapsed_time": "3:48:07", "remaining_time": "16:14:32"} -{"current_steps": 1250, "total_steps": 6590, "eval_loss": 0.03444758057594299, "epoch": 1.8957345971563981, "percentage": 18.97, "elapsed_time": "3:50:48", "remaining_time": "16:26:00"} -{"current_steps": 1260, "total_steps": 6590, "loss": 0.0418, "lr": 9.748775477297807e-05, "epoch": 1.9109004739336493, "percentage": 19.12, "elapsed_time": "3:52:10", "remaining_time": "16:22:09"} -{"current_steps": 1270, "total_steps": 6590, "loss": 0.0402, "lr": 9.740419404065822e-05, "epoch": 1.9260663507109004, "percentage": 19.27, "elapsed_time": "3:53:28", "remaining_time": "16:18:00"} -{"current_steps": 1280, "total_steps": 6590, "loss": 0.0276, "lr": 9.731930328381384e-05, "epoch": 1.9412322274881517, "percentage": 19.42, "elapsed_time": "3:54:45", "remaining_time": "16:13:54"} -{"current_steps": 1290, "total_steps": 6590, "loss": 0.0478, "lr": 9.723308488423397e-05, "epoch": 1.9563981042654028, "percentage": 19.58, "elapsed_time": "3:56:03", "remaining_time": "16:09:51"} -{"current_steps": 1300, "total_steps": 6590, "loss": 0.0434, "lr": 9.714554126095742e-05, "epoch": 1.971563981042654, "percentage": 19.73, "elapsed_time": "3:57:21", "remaining_time": "16:05:50"} -{"current_steps": 1300, "total_steps": 6590, "eval_loss": 0.038428451865911484, "epoch": 1.971563981042654, "percentage": 19.73, "elapsed_time": "4:00:02", "remaining_time": "16:16:46"} -{"current_steps": 1310, "total_steps": 6590, "loss": 0.0367, "lr": 9.705667487020495e-05, "epoch": 1.9867298578199053, "percentage": 19.88, "elapsed_time": "4:01:24", "remaining_time": "16:12:59"} -{"current_steps": 1320, "total_steps": 6590, "loss": 0.045, "lr": 9.696648820531039e-05, "epoch": 2.001895734597156, "percentage": 20.03, "elapsed_time": "4:02:41", "remaining_time": "16:08:57"} -{"current_steps": 1330, "total_steps": 6590, "loss": 0.028, "lr": 9.687498379665056e-05, "epoch": 2.0170616113744075, "percentage": 20.18, "elapsed_time": "4:03:59", "remaining_time": "16:04:56"} -{"current_steps": 1340, "total_steps": 6590, "loss": 0.0252, "lr": 9.678216421157443e-05, "epoch": 2.032227488151659, "percentage": 20.33, "elapsed_time": "4:05:16", "remaining_time": "16:00:59"} -{"current_steps": 1350, "total_steps": 6590, "loss": 0.0275, "lr": 9.668803205433101e-05, "epoch": 2.0473933649289098, "percentage": 20.49, "elapsed_time": "4:06:34", "remaining_time": "15:57:04"} -{"current_steps": 1350, "total_steps": 6590, "eval_loss": 0.03524172678589821, "epoch": 2.0473933649289098, "percentage": 20.49, "elapsed_time": "4:09:15", "remaining_time": "16:07:30"} -{"current_steps": 1360, "total_steps": 6590, "loss": 0.0208, "lr": 9.659258996599624e-05, "epoch": 2.062559241706161, "percentage": 20.64, "elapsed_time": "4:10:37", "remaining_time": "16:03:47"} -{"current_steps": 1370, "total_steps": 6590, "loss": 0.0253, "lr": 9.649584062439898e-05, "epoch": 2.0777251184834125, "percentage": 20.79, "elapsed_time": "4:11:55", "remaining_time": "15:59:52"} -{"current_steps": 1380, "total_steps": 6590, "loss": 0.0213, "lr": 9.639778674404581e-05, "epoch": 2.0928909952606634, "percentage": 20.94, "elapsed_time": "4:13:12", "remaining_time": "15:55:58"} -{"current_steps": 1390, "total_steps": 6590, "loss": 0.0295, "lr": 9.629843107604491e-05, "epoch": 2.1080568720379147, "percentage": 21.09, "elapsed_time": "4:14:30", "remaining_time": "15:52:06"} -{"current_steps": 1400, "total_steps": 6590, "loss": 0.0204, "lr": 9.619777640802885e-05, "epoch": 2.123222748815166, "percentage": 21.24, "elapsed_time": "4:15:48", "remaining_time": "15:48:18"} -{"current_steps": 1400, "total_steps": 6590, "eval_loss": 0.03469180688261986, "epoch": 2.123222748815166, "percentage": 21.24, "elapsed_time": "4:18:29", "remaining_time": "15:58:15"} -{"current_steps": 1410, "total_steps": 6590, "loss": 0.0237, "lr": 9.609582556407635e-05, "epoch": 2.138388625592417, "percentage": 21.4, "elapsed_time": "4:19:52", "remaining_time": "15:54:41"} -{"current_steps": 1420, "total_steps": 6590, "loss": 0.0276, "lr": 9.599258140463314e-05, "epoch": 2.1535545023696683, "percentage": 21.55, "elapsed_time": "4:21:09", "remaining_time": "15:50:51"} -{"current_steps": 1430, "total_steps": 6590, "loss": 0.0288, "lr": 9.588804682643158e-05, "epoch": 2.1687203791469196, "percentage": 21.7, "elapsed_time": "4:22:27", "remaining_time": "15:47:03"} -{"current_steps": 1440, "total_steps": 6590, "loss": 0.0258, "lr": 9.57822247624095e-05, "epoch": 2.1838862559241705, "percentage": 21.85, "elapsed_time": "4:23:45", "remaining_time": "15:43:19"} -{"current_steps": 1450, "total_steps": 6590, "loss": 0.022, "lr": 9.56751181816278e-05, "epoch": 2.199052132701422, "percentage": 22.0, "elapsed_time": "4:25:03", "remaining_time": "15:39:35"} -{"current_steps": 1450, "total_steps": 6590, "eval_loss": 0.037667639553546906, "epoch": 2.199052132701422, "percentage": 22.0, "elapsed_time": "4:27:44", "remaining_time": "15:49:06"} -{"current_steps": 1460, "total_steps": 6590, "loss": 0.0201, "lr": 9.556673008918725e-05, "epoch": 2.2142180094786728, "percentage": 22.15, "elapsed_time": "4:29:07", "remaining_time": "15:45:37"} -{"current_steps": 1470, "total_steps": 6590, "loss": 0.0301, "lr": 9.54570635261441e-05, "epoch": 2.229383886255924, "percentage": 22.31, "elapsed_time": "4:30:25", "remaining_time": "15:41:52"} -{"current_steps": 1480, "total_steps": 6590, "loss": 0.0232, "lr": 9.534612156942479e-05, "epoch": 2.2445497630331754, "percentage": 22.46, "elapsed_time": "4:31:42", "remaining_time": "15:38:08"} -{"current_steps": 1490, "total_steps": 6590, "loss": 0.024, "lr": 9.523390733173966e-05, "epoch": 2.259715639810427, "percentage": 22.61, "elapsed_time": "4:33:00", "remaining_time": "15:34:27"} -{"current_steps": 1500, "total_steps": 6590, "loss": 0.0157, "lr": 9.512042396149549e-05, "epoch": 2.2748815165876777, "percentage": 22.76, "elapsed_time": "4:34:18", "remaining_time": "15:30:48"} -{"current_steps": 1500, "total_steps": 6590, "eval_loss": 0.03750366345047951, "epoch": 2.2748815165876777, "percentage": 22.76, "elapsed_time": "4:36:59", "remaining_time": "15:39:55"} -{"current_steps": 1510, "total_steps": 6590, "loss": 0.0412, "lr": 9.500567464270734e-05, "epoch": 2.290047393364929, "percentage": 22.91, "elapsed_time": "4:38:22", "remaining_time": "15:36:30"} -{"current_steps": 1520, "total_steps": 6590, "loss": 0.0254, "lr": 9.488966259490904e-05, "epoch": 2.30521327014218, "percentage": 23.07, "elapsed_time": "4:39:39", "remaining_time": "15:32:50"} -{"current_steps": 1530, "total_steps": 6590, "loss": 0.0349, "lr": 9.477239107306299e-05, "epoch": 2.3203791469194313, "percentage": 23.22, "elapsed_time": "4:40:57", "remaining_time": "15:29:10"} -{"current_steps": 1540, "total_steps": 6590, "loss": 0.0241, "lr": 9.46538633674688e-05, "epoch": 2.3355450236966826, "percentage": 23.37, "elapsed_time": "4:42:15", "remaining_time": "15:25:34"} -{"current_steps": 1550, "total_steps": 6590, "loss": 0.0287, "lr": 9.453408280367092e-05, "epoch": 2.3507109004739335, "percentage": 23.52, "elapsed_time": "4:43:32", "remaining_time": "15:21:58"} -{"current_steps": 1550, "total_steps": 6590, "eval_loss": 0.03478175774216652, "epoch": 2.3507109004739335, "percentage": 23.52, "elapsed_time": "4:46:13", "remaining_time": "15:30:41"} -{"current_steps": 1560, "total_steps": 6590, "loss": 0.0244, "lr": 9.441305274236536e-05, "epoch": 2.365876777251185, "percentage": 23.67, "elapsed_time": "4:47:38", "remaining_time": "15:27:28"} -{"current_steps": 1570, "total_steps": 6590, "loss": 0.0263, "lr": 9.429077657930551e-05, "epoch": 2.381042654028436, "percentage": 23.82, "elapsed_time": "4:48:56", "remaining_time": "15:23:53"} -{"current_steps": 1580, "total_steps": 6590, "loss": 0.0216, "lr": 9.416725774520667e-05, "epoch": 2.396208530805687, "percentage": 23.98, "elapsed_time": "4:50:14", "remaining_time": "15:20:19"} -{"current_steps": 1590, "total_steps": 6590, "loss": 0.0317, "lr": 9.404249970564995e-05, "epoch": 2.4113744075829384, "percentage": 24.13, "elapsed_time": "4:51:32", "remaining_time": "15:16:47"} -{"current_steps": 1600, "total_steps": 6590, "loss": 0.0279, "lr": 9.391650596098496e-05, "epoch": 2.4265402843601898, "percentage": 24.28, "elapsed_time": "4:52:49", "remaining_time": "15:13:16"} -{"current_steps": 1600, "total_steps": 6590, "eval_loss": 0.03584934026002884, "epoch": 2.4265402843601898, "percentage": 24.28, "elapsed_time": "4:55:30", "remaining_time": "15:21:37"} -{"current_steps": 1610, "total_steps": 6590, "loss": 0.0236, "lr": 9.378928004623163e-05, "epoch": 2.4417061611374407, "percentage": 24.43, "elapsed_time": "4:57:02", "remaining_time": "15:18:47"} -{"current_steps": 1620, "total_steps": 6590, "loss": 0.0313, "lr": 9.366082553098097e-05, "epoch": 2.456872037914692, "percentage": 24.58, "elapsed_time": "4:58:20", "remaining_time": "15:15:15"} -{"current_steps": 1630, "total_steps": 6590, "loss": 0.0257, "lr": 9.353114601929505e-05, "epoch": 2.472037914691943, "percentage": 24.73, "elapsed_time": "4:59:37", "remaining_time": "15:11:45"} -{"current_steps": 1640, "total_steps": 6590, "loss": 0.0277, "lr": 9.340024514960574e-05, "epoch": 2.4872037914691942, "percentage": 24.89, "elapsed_time": "5:00:55", "remaining_time": "15:08:17"} -{"current_steps": 1650, "total_steps": 6590, "loss": 0.0164, "lr": 9.32681265946127e-05, "epoch": 2.5023696682464456, "percentage": 25.04, "elapsed_time": "5:02:13", "remaining_time": "15:04:51"} -{"current_steps": 1650, "total_steps": 6590, "eval_loss": 0.038353804498910904, "epoch": 2.5023696682464456, "percentage": 25.04, "elapsed_time": "5:04:54", "remaining_time": "15:12:53"} -{"current_steps": 1660, "total_steps": 6590, "loss": 0.0284, "lr": 9.313479406118029e-05, "epoch": 2.517535545023697, "percentage": 25.19, "elapsed_time": "5:06:16", "remaining_time": "15:09:37"} -{"current_steps": 1670, "total_steps": 6590, "loss": 0.0208, "lr": 9.30002512902336e-05, "epoch": 2.532701421800948, "percentage": 25.34, "elapsed_time": "5:07:34", "remaining_time": "15:06:08"} -{"current_steps": 1680, "total_steps": 6590, "loss": 0.0374, "lr": 9.286450205665353e-05, "epoch": 2.547867298578199, "percentage": 25.49, "elapsed_time": "5:08:51", "remaining_time": "15:02:41"} -{"current_steps": 1690, "total_steps": 6590, "loss": 0.0355, "lr": 9.272755016917077e-05, "epoch": 2.56303317535545, "percentage": 25.64, "elapsed_time": "5:10:08", "remaining_time": "14:59:14"} -{"current_steps": 1700, "total_steps": 6590, "loss": 0.03, "lr": 9.258939947025901e-05, "epoch": 2.5781990521327014, "percentage": 25.8, "elapsed_time": "5:11:26", "remaining_time": "14:55:51"} -{"current_steps": 1700, "total_steps": 6590, "eval_loss": 0.03666139766573906, "epoch": 2.5781990521327014, "percentage": 25.8, "elapsed_time": "5:14:07", "remaining_time": "15:03:34"} -{"current_steps": 1710, "total_steps": 6590, "loss": 0.0366, "lr": 9.245005383602719e-05, "epoch": 2.5933649289099527, "percentage": 25.95, "elapsed_time": "5:15:29", "remaining_time": "15:00:21"} -{"current_steps": 1720, "total_steps": 6590, "loss": 0.0267, "lr": 9.230951717611056e-05, "epoch": 2.6085308056872036, "percentage": 26.1, "elapsed_time": "5:16:47", "remaining_time": "14:56:56"} -{"current_steps": 1730, "total_steps": 6590, "loss": 0.0301, "lr": 9.21677934335612e-05, "epoch": 2.623696682464455, "percentage": 26.25, "elapsed_time": "5:18:04", "remaining_time": "14:53:33"} -{"current_steps": 1740, "total_steps": 6590, "loss": 0.0243, "lr": 9.202488658473725e-05, "epoch": 2.6388625592417063, "percentage": 26.4, "elapsed_time": "5:19:22", "remaining_time": "14:50:11"} -{"current_steps": 1750, "total_steps": 6590, "loss": 0.0278, "lr": 9.188080063919137e-05, "epoch": 2.654028436018957, "percentage": 26.56, "elapsed_time": "5:20:40", "remaining_time": "14:46:52"} -{"current_steps": 1750, "total_steps": 6590, "eval_loss": 0.03990183770656586, "epoch": 2.654028436018957, "percentage": 26.56, "elapsed_time": "5:23:21", "remaining_time": "14:54:17"} -{"current_steps": 1760, "total_steps": 6590, "loss": 0.029, "lr": 9.173553963955836e-05, "epoch": 2.6691943127962086, "percentage": 26.71, "elapsed_time": "5:24:43", "remaining_time": "14:51:08"} -{"current_steps": 1770, "total_steps": 6590, "loss": 0.0234, "lr": 9.15891076614415e-05, "epoch": 2.68436018957346, "percentage": 26.86, "elapsed_time": "5:26:00", "remaining_time": "14:47:47"} -{"current_steps": 1780, "total_steps": 6590, "loss": 0.0208, "lr": 9.144150881329845e-05, "epoch": 2.699526066350711, "percentage": 27.01, "elapsed_time": "5:27:19", "remaining_time": "14:44:29"} -{"current_steps": 1790, "total_steps": 6590, "loss": 0.0342, "lr": 9.129274723632579e-05, "epoch": 2.714691943127962, "percentage": 27.16, "elapsed_time": "5:28:36", "remaining_time": "14:41:11"} -{"current_steps": 1800, "total_steps": 6590, "loss": 0.0305, "lr": 9.114282710434297e-05, "epoch": 2.729857819905213, "percentage": 27.31, "elapsed_time": "5:29:54", "remaining_time": "14:37:55"} -{"current_steps": 1800, "total_steps": 6590, "eval_loss": 0.035470809787511826, "epoch": 2.729857819905213, "percentage": 27.31, "elapsed_time": "5:32:35", "remaining_time": "14:45:03"} -{"current_steps": 1810, "total_steps": 6590, "loss": 0.0264, "lr": 9.099175262367509e-05, "epoch": 2.7450236966824644, "percentage": 27.47, "elapsed_time": "5:33:57", "remaining_time": "14:41:56"} -{"current_steps": 1820, "total_steps": 6590, "loss": 0.0303, "lr": 9.083952803303497e-05, "epoch": 2.7601895734597157, "percentage": 27.62, "elapsed_time": "5:35:14", "remaining_time": "14:38:38"} -{"current_steps": 1830, "total_steps": 6590, "loss": 0.0218, "lr": 9.068615760340416e-05, "epoch": 2.775355450236967, "percentage": 27.77, "elapsed_time": "5:36:32", "remaining_time": "14:35:23"} -{"current_steps": 1840, "total_steps": 6590, "loss": 0.0164, "lr": 9.053164563791316e-05, "epoch": 2.790521327014218, "percentage": 27.92, "elapsed_time": "5:37:50", "remaining_time": "14:32:09"} -{"current_steps": 1850, "total_steps": 6590, "loss": 0.0329, "lr": 9.037599647172066e-05, "epoch": 2.8056872037914693, "percentage": 28.07, "elapsed_time": "5:39:08", "remaining_time": "14:28:55"} -{"current_steps": 1850, "total_steps": 6590, "eval_loss": 0.037568479776382446, "epoch": 2.8056872037914693, "percentage": 28.07, "elapsed_time": "5:41:49", "remaining_time": "14:35:47"} -{"current_steps": 1860, "total_steps": 6590, "loss": 0.0276, "lr": 9.021921447189188e-05, "epoch": 2.82085308056872, "percentage": 28.22, "elapsed_time": "5:43:10", "remaining_time": "14:32:42"} -{"current_steps": 1870, "total_steps": 6590, "loss": 0.0221, "lr": 9.006130403727613e-05, "epoch": 2.8360189573459715, "percentage": 28.38, "elapsed_time": "5:44:28", "remaining_time": "14:29:28"} -{"current_steps": 1880, "total_steps": 6590, "loss": 0.0159, "lr": 8.990226959838328e-05, "epoch": 2.851184834123223, "percentage": 28.53, "elapsed_time": "5:45:46", "remaining_time": "14:26:15"} -{"current_steps": 1890, "total_steps": 6590, "loss": 0.0202, "lr": 8.974211561725956e-05, "epoch": 2.8663507109004738, "percentage": 28.68, "elapsed_time": "5:47:03", "remaining_time": "14:23:03"} -{"current_steps": 1900, "total_steps": 6590, "loss": 0.0248, "lr": 8.958084658736226e-05, "epoch": 2.881516587677725, "percentage": 28.83, "elapsed_time": "5:48:21", "remaining_time": "14:19:53"} -{"current_steps": 1900, "total_steps": 6590, "eval_loss": 0.03597626835107803, "epoch": 2.881516587677725, "percentage": 28.83, "elapsed_time": "5:51:02", "remaining_time": "14:26:30"} -{"current_steps": 1910, "total_steps": 6590, "loss": 0.0286, "lr": 8.941846703343373e-05, "epoch": 2.8966824644549765, "percentage": 28.98, "elapsed_time": "5:52:24", "remaining_time": "14:23:30"} -{"current_steps": 1920, "total_steps": 6590, "loss": 0.0272, "lr": 8.925498151137446e-05, "epoch": 2.9118483412322274, "percentage": 29.14, "elapsed_time": "5:53:42", "remaining_time": "14:20:19"} -{"current_steps": 1930, "total_steps": 6590, "loss": 0.025, "lr": 8.909039460811515e-05, "epoch": 2.9270142180094787, "percentage": 29.29, "elapsed_time": "5:54:59", "remaining_time": "14:17:08"} -{"current_steps": 1940, "total_steps": 6590, "loss": 0.033, "lr": 8.892471094148807e-05, "epoch": 2.94218009478673, "percentage": 29.44, "elapsed_time": "5:56:17", "remaining_time": "14:13:59"} -{"current_steps": 1950, "total_steps": 6590, "loss": 0.0329, "lr": 8.875793516009752e-05, "epoch": 2.957345971563981, "percentage": 29.59, "elapsed_time": "5:57:34", "remaining_time": "14:10:51"} -{"current_steps": 1950, "total_steps": 6590, "eval_loss": 0.03343908488750458, "epoch": 2.957345971563981, "percentage": 29.59, "elapsed_time": "6:00:15", "remaining_time": "14:17:14"} -{"current_steps": 1960, "total_steps": 6590, "loss": 0.0334, "lr": 8.859007194318939e-05, "epoch": 2.9725118483412323, "percentage": 29.74, "elapsed_time": "6:01:38", "remaining_time": "14:14:16"} -{"current_steps": 1970, "total_steps": 6590, "loss": 0.0341, "lr": 8.842112600051983e-05, "epoch": 2.987677725118483, "percentage": 29.89, "elapsed_time": "6:02:56", "remaining_time": "14:11:09"} -{"current_steps": 1980, "total_steps": 6590, "loss": 0.0309, "lr": 8.825110207222318e-05, "epoch": 3.0028436018957345, "percentage": 30.05, "elapsed_time": "6:04:14", "remaining_time": "14:08:03"} -{"current_steps": 1990, "total_steps": 6590, "loss": 0.0195, "lr": 8.808000492867888e-05, "epoch": 3.018009478672986, "percentage": 30.2, "elapsed_time": "6:05:32", "remaining_time": "14:04:57"} -{"current_steps": 2000, "total_steps": 6590, "loss": 0.0129, "lr": 8.790783937037777e-05, "epoch": 3.0331753554502368, "percentage": 30.35, "elapsed_time": "6:06:49", "remaining_time": "14:01:52"} -{"current_steps": 2000, "total_steps": 6590, "eval_loss": 0.03923666104674339, "epoch": 3.0331753554502368, "percentage": 30.35, "elapsed_time": "6:09:30", "remaining_time": "14:08:01"} -{"current_steps": 2010, "total_steps": 6590, "loss": 0.0297, "lr": 8.773461022778722e-05, "epoch": 3.048341232227488, "percentage": 30.5, "elapsed_time": "6:10:53", "remaining_time": "14:05:06"} -{"current_steps": 2020, "total_steps": 6590, "loss": 0.021, "lr": 8.756032236121579e-05, "epoch": 3.0635071090047394, "percentage": 30.65, "elapsed_time": "6:12:10", "remaining_time": "14:02:00"} -{"current_steps": 2030, "total_steps": 6590, "loss": 0.0157, "lr": 8.73849806606767e-05, "epoch": 3.0786729857819903, "percentage": 30.8, "elapsed_time": "6:13:28", "remaining_time": "13:58:56"} -{"current_steps": 2040, "total_steps": 6590, "loss": 0.0157, "lr": 8.720859004575074e-05, "epoch": 3.0938388625592417, "percentage": 30.96, "elapsed_time": "6:14:46", "remaining_time": "13:55:53"} -{"current_steps": 2050, "total_steps": 6590, "loss": 0.01, "lr": 8.703115546544819e-05, "epoch": 3.109004739336493, "percentage": 31.11, "elapsed_time": "6:16:03", "remaining_time": "13:52:50"} -{"current_steps": 2050, "total_steps": 6590, "eval_loss": 0.039759017527103424, "epoch": 3.109004739336493, "percentage": 31.11, "elapsed_time": "6:18:44", "remaining_time": "13:58:46"} -{"current_steps": 2060, "total_steps": 6590, "loss": 0.0217, "lr": 8.685268189807e-05, "epoch": 3.124170616113744, "percentage": 31.26, "elapsed_time": "6:20:22", "remaining_time": "13:56:27"} -{"current_steps": 2070, "total_steps": 6590, "loss": 0.0157, "lr": 8.667317435106801e-05, "epoch": 3.1393364928909953, "percentage": 31.41, "elapsed_time": "6:21:39", "remaining_time": "13:53:23"} -{"current_steps": 2080, "total_steps": 6590, "loss": 0.0242, "lr": 8.649263786090466e-05, "epoch": 3.1545023696682466, "percentage": 31.56, "elapsed_time": "6:22:57", "remaining_time": "13:50:20"} -{"current_steps": 2090, "total_steps": 6590, "loss": 0.0188, "lr": 8.63110774929115e-05, "epoch": 3.1696682464454975, "percentage": 31.71, "elapsed_time": "6:24:14", "remaining_time": "13:47:19"} -{"current_steps": 2100, "total_steps": 6590, "loss": 0.0156, "lr": 8.612849834114706e-05, "epoch": 3.184834123222749, "percentage": 31.87, "elapsed_time": "6:25:31", "remaining_time": "13:44:18"} -{"current_steps": 2100, "total_steps": 6590, "eval_loss": 0.03947887197136879, "epoch": 3.184834123222749, "percentage": 31.87, "elapsed_time": "6:28:12", "remaining_time": "13:50:02"} -{"current_steps": 2110, "total_steps": 6590, "loss": 0.0202, "lr": 8.594490552825414e-05, "epoch": 3.2, "percentage": 32.02, "elapsed_time": "6:29:40", "remaining_time": "13:47:21"} -{"current_steps": 2120, "total_steps": 6590, "loss": 0.0159, "lr": 8.576030420531581e-05, "epoch": 3.215165876777251, "percentage": 32.17, "elapsed_time": "6:30:57", "remaining_time": "13:44:19"} -{"current_steps": 2130, "total_steps": 6590, "loss": 0.0148, "lr": 8.557469955171106e-05, "epoch": 3.2303317535545024, "percentage": 32.32, "elapsed_time": "6:32:15", "remaining_time": "13:41:20"} -{"current_steps": 2140, "total_steps": 6590, "loss": 0.0196, "lr": 8.538809677496948e-05, "epoch": 3.2454976303317538, "percentage": 32.47, "elapsed_time": "6:33:32", "remaining_time": "13:38:21"} -{"current_steps": 2150, "total_steps": 6590, "loss": 0.0151, "lr": 8.520050111062501e-05, "epoch": 3.2606635071090047, "percentage": 32.63, "elapsed_time": "6:34:50", "remaining_time": "13:35:23"} -{"current_steps": 2150, "total_steps": 6590, "eval_loss": 0.0445675328373909, "epoch": 3.2606635071090047, "percentage": 32.63, "elapsed_time": "6:37:31", "remaining_time": "13:40:55"} -{"current_steps": 2160, "total_steps": 6590, "loss": 0.0168, "lr": 8.501191782206923e-05, "epoch": 3.275829383886256, "percentage": 32.78, "elapsed_time": "6:38:53", "remaining_time": "13:38:04"} -{"current_steps": 2170, "total_steps": 6590, "loss": 0.0141, "lr": 8.482235220040358e-05, "epoch": 3.2909952606635073, "percentage": 32.93, "elapsed_time": "6:40:10", "remaining_time": "13:35:06"} -{"current_steps": 2180, "total_steps": 6590, "loss": 0.0122, "lr": 8.463180956429086e-05, "epoch": 3.3061611374407582, "percentage": 33.08, "elapsed_time": "6:41:28", "remaining_time": "13:32:08"} -{"current_steps": 2190, "total_steps": 6590, "loss": 0.0259, "lr": 8.444029525980617e-05, "epoch": 3.3213270142180096, "percentage": 33.23, "elapsed_time": "6:42:45", "remaining_time": "13:29:12"} -{"current_steps": 2200, "total_steps": 6590, "loss": 0.0181, "lr": 8.424781466028675e-05, "epoch": 3.3364928909952605, "percentage": 33.38, "elapsed_time": "6:44:03", "remaining_time": "13:26:16"} -{"current_steps": 2200, "total_steps": 6590, "eval_loss": 0.036237068474292755, "epoch": 3.3364928909952605, "percentage": 33.38, "elapsed_time": "6:46:44", "remaining_time": "13:31:37"} -{"current_steps": 2210, "total_steps": 6590, "loss": 0.0227, "lr": 8.405437316618128e-05, "epoch": 3.351658767772512, "percentage": 33.54, "elapsed_time": "6:48:06", "remaining_time": "13:28:49"} -{"current_steps": 2220, "total_steps": 6590, "loss": 0.0157, "lr": 8.385997620489838e-05, "epoch": 3.366824644549763, "percentage": 33.69, "elapsed_time": "6:49:24", "remaining_time": "13:25:53"} -{"current_steps": 2230, "total_steps": 6590, "loss": 0.0227, "lr": 8.366462923065432e-05, "epoch": 3.381990521327014, "percentage": 33.84, "elapsed_time": "6:50:41", "remaining_time": "13:22:58"} -{"current_steps": 2240, "total_steps": 6590, "loss": 0.0212, "lr": 8.346833772432e-05, "epoch": 3.3971563981042654, "percentage": 33.99, "elapsed_time": "6:51:59", "remaining_time": "13:20:03"} -{"current_steps": 2250, "total_steps": 6590, "loss": 0.0114, "lr": 8.327110719326708e-05, "epoch": 3.4123222748815167, "percentage": 34.14, "elapsed_time": "6:53:16", "remaining_time": "13:17:09"} -{"current_steps": 2250, "total_steps": 6590, "eval_loss": 0.037667613476514816, "epoch": 3.4123222748815167, "percentage": 34.14, "elapsed_time": "6:55:57", "remaining_time": "13:22:20"} -{"current_steps": 2260, "total_steps": 6590, "loss": 0.0227, "lr": 8.307294317121361e-05, "epoch": 3.4274881516587676, "percentage": 34.29, "elapsed_time": "6:57:19", "remaining_time": "13:19:34"} -{"current_steps": 2270, "total_steps": 6590, "loss": 0.0171, "lr": 8.287385121806869e-05, "epoch": 3.442654028436019, "percentage": 34.45, "elapsed_time": "6:58:37", "remaining_time": "13:16:40"} -{"current_steps": 2280, "total_steps": 6590, "loss": 0.0158, "lr": 8.267383691977648e-05, "epoch": 3.4578199052132703, "percentage": 34.6, "elapsed_time": "6:59:54", "remaining_time": "13:13:46"} -{"current_steps": 2290, "total_steps": 6590, "loss": 0.0201, "lr": 8.247290588815944e-05, "epoch": 3.472985781990521, "percentage": 34.75, "elapsed_time": "7:01:12", "remaining_time": "13:10:53"} -{"current_steps": 2300, "total_steps": 6590, "loss": 0.0178, "lr": 8.227106376076095e-05, "epoch": 3.4881516587677726, "percentage": 34.9, "elapsed_time": "7:02:29", "remaining_time": "13:08:03"} -{"current_steps": 2300, "total_steps": 6590, "eval_loss": 0.03822999820113182, "epoch": 3.4881516587677726, "percentage": 34.9, "elapsed_time": "7:05:10", "remaining_time": "13:13:03"} -{"current_steps": 2310, "total_steps": 6590, "loss": 0.0256, "lr": 8.20683162006871e-05, "epoch": 3.5033175355450235, "percentage": 35.05, "elapsed_time": "7:06:33", "remaining_time": "13:10:19"} -{"current_steps": 2320, "total_steps": 6590, "loss": 0.0159, "lr": 8.186466889644775e-05, "epoch": 3.518483412322275, "percentage": 35.2, "elapsed_time": "7:07:50", "remaining_time": "13:07:26"} -{"current_steps": 2330, "total_steps": 6590, "loss": 0.0125, "lr": 8.166012756179706e-05, "epoch": 3.533649289099526, "percentage": 35.36, "elapsed_time": "7:09:08", "remaining_time": "13:04:36"} -{"current_steps": 2340, "total_steps": 6590, "loss": 0.021, "lr": 8.145469793557306e-05, "epoch": 3.5488151658767775, "percentage": 35.51, "elapsed_time": "7:10:26", "remaining_time": "13:01:46"} -{"current_steps": 2350, "total_steps": 6590, "loss": 0.0131, "lr": 8.124838578153664e-05, "epoch": 3.5639810426540284, "percentage": 35.66, "elapsed_time": "7:11:43", "remaining_time": "12:58:57"} -{"current_steps": 2350, "total_steps": 6590, "eval_loss": 0.038201410323381424, "epoch": 3.5639810426540284, "percentage": 35.66, "elapsed_time": "7:14:24", "remaining_time": "13:03:47"} -{"current_steps": 2360, "total_steps": 6590, "loss": 0.0164, "lr": 8.10411968882099e-05, "epoch": 3.5791469194312797, "percentage": 35.81, "elapsed_time": "7:15:46", "remaining_time": "13:01:05"} -{"current_steps": 2370, "total_steps": 6590, "loss": 0.0152, "lr": 8.083313706871372e-05, "epoch": 3.5943127962085306, "percentage": 35.96, "elapsed_time": "7:17:04", "remaining_time": "12:58:15"} -{"current_steps": 2380, "total_steps": 6590, "loss": 0.0213, "lr": 8.062421216060463e-05, "epoch": 3.609478672985782, "percentage": 36.12, "elapsed_time": "7:18:22", "remaining_time": "12:55:26"} -{"current_steps": 2390, "total_steps": 6590, "loss": 0.0241, "lr": 8.041442802571103e-05, "epoch": 3.6246445497630333, "percentage": 36.27, "elapsed_time": "7:19:40", "remaining_time": "12:52:38"} -{"current_steps": 2400, "total_steps": 6590, "loss": 0.0207, "lr": 8.020379054996874e-05, "epoch": 3.639810426540284, "percentage": 36.42, "elapsed_time": "7:20:57", "remaining_time": "12:49:50"} -{"current_steps": 2400, "total_steps": 6590, "eval_loss": 0.03543415665626526, "epoch": 3.639810426540284, "percentage": 36.42, "elapsed_time": "7:23:38", "remaining_time": "12:54:31"} -{"current_steps": 2410, "total_steps": 6590, "loss": 0.0183, "lr": 7.99923056432559e-05, "epoch": 3.6549763033175355, "percentage": 36.57, "elapsed_time": "7:25:00", "remaining_time": "12:51:50"} -{"current_steps": 2420, "total_steps": 6590, "loss": 0.0111, "lr": 7.977997923922707e-05, "epoch": 3.670142180094787, "percentage": 36.72, "elapsed_time": "7:26:18", "remaining_time": "12:49:03"} -{"current_steps": 2430, "total_steps": 6590, "loss": 0.0094, "lr": 7.956681729514677e-05, "epoch": 3.6853080568720378, "percentage": 36.87, "elapsed_time": "7:27:36", "remaining_time": "12:46:16"} -{"current_steps": 2440, "total_steps": 6590, "loss": 0.0119, "lr": 7.935282579172239e-05, "epoch": 3.700473933649289, "percentage": 37.03, "elapsed_time": "7:28:54", "remaining_time": "12:43:30"} -{"current_steps": 2450, "total_steps": 6590, "loss": 0.0211, "lr": 7.913801073293639e-05, "epoch": 3.7156398104265405, "percentage": 37.18, "elapsed_time": "7:30:11", "remaining_time": "12:40:44"} -{"current_steps": 2450, "total_steps": 6590, "eval_loss": 0.03907341510057449, "epoch": 3.7156398104265405, "percentage": 37.18, "elapsed_time": "7:32:52", "remaining_time": "12:45:16"} -{"current_steps": 2460, "total_steps": 6590, "loss": 0.0216, "lr": 7.89223781458777e-05, "epoch": 3.7308056872037914, "percentage": 37.33, "elapsed_time": "7:34:15", "remaining_time": "12:42:37"} -{"current_steps": 2470, "total_steps": 6590, "loss": 0.0164, "lr": 7.870593408057287e-05, "epoch": 3.7459715639810427, "percentage": 37.48, "elapsed_time": "7:35:32", "remaining_time": "12:39:51"} -{"current_steps": 2480, "total_steps": 6590, "loss": 0.0177, "lr": 7.848868460981606e-05, "epoch": 3.7611374407582936, "percentage": 37.63, "elapsed_time": "7:36:50", "remaining_time": "12:37:06"} -{"current_steps": 2490, "total_steps": 6590, "loss": 0.025, "lr": 7.827063582899885e-05, "epoch": 3.776303317535545, "percentage": 37.78, "elapsed_time": "7:38:08", "remaining_time": "12:34:22"} -{"current_steps": 2500, "total_steps": 6590, "loss": 0.0254, "lr": 7.805179385593912e-05, "epoch": 3.7914691943127963, "percentage": 37.94, "elapsed_time": "7:39:26", "remaining_time": "12:31:38"} -{"current_steps": 2500, "total_steps": 6590, "eval_loss": 0.040060922503471375, "epoch": 3.7914691943127963, "percentage": 37.94, "elapsed_time": "7:42:07", "remaining_time": "12:36:02"} -{"current_steps": 2510, "total_steps": 6590, "loss": 0.0228, "lr": 7.783216483070941e-05, "epoch": 3.8066350710900476, "percentage": 38.09, "elapsed_time": "7:43:29", "remaining_time": "12:33:23"} -{"current_steps": 2520, "total_steps": 6590, "loss": 0.0133, "lr": 7.761175491546471e-05, "epoch": 3.8218009478672985, "percentage": 38.24, "elapsed_time": "7:44:47", "remaining_time": "12:30:39"} -{"current_steps": 2530, "total_steps": 6590, "loss": 0.0173, "lr": 7.73905702942695e-05, "epoch": 3.83696682464455, "percentage": 38.39, "elapsed_time": "7:46:04", "remaining_time": "12:27:56"} -{"current_steps": 2540, "total_steps": 6590, "loss": 0.0125, "lr": 7.716861717292425e-05, "epoch": 3.8521327014218008, "percentage": 38.54, "elapsed_time": "7:47:22", "remaining_time": "12:25:13"} -{"current_steps": 2550, "total_steps": 6590, "loss": 0.0171, "lr": 7.694590177879137e-05, "epoch": 3.867298578199052, "percentage": 38.69, "elapsed_time": "7:48:40", "remaining_time": "12:22:31"} -{"current_steps": 2550, "total_steps": 6590, "eval_loss": 0.03894200548529625, "epoch": 3.867298578199052, "percentage": 38.69, "elapsed_time": "7:51:21", "remaining_time": "12:26:46"} -{"current_steps": 2560, "total_steps": 6590, "loss": 0.0112, "lr": 7.67224303606204e-05, "epoch": 3.8824644549763034, "percentage": 38.85, "elapsed_time": "7:52:43", "remaining_time": "12:24:10"} -{"current_steps": 2570, "total_steps": 6590, "loss": 0.0159, "lr": 7.649820918837276e-05, "epoch": 3.8976303317535548, "percentage": 39.0, "elapsed_time": "7:54:01", "remaining_time": "12:21:28"} -{"current_steps": 2580, "total_steps": 6590, "loss": 0.0254, "lr": 7.627324455304575e-05, "epoch": 3.9127962085308057, "percentage": 39.15, "elapsed_time": "7:55:19", "remaining_time": "12:18:46"} -{"current_steps": 2590, "total_steps": 6590, "loss": 0.0253, "lr": 7.604754276649608e-05, "epoch": 3.927962085308057, "percentage": 39.3, "elapsed_time": "7:56:37", "remaining_time": "12:16:05"} -{"current_steps": 2600, "total_steps": 6590, "loss": 0.0203, "lr": 7.582111016126292e-05, "epoch": 3.943127962085308, "percentage": 39.45, "elapsed_time": "7:57:54", "remaining_time": "12:13:25"} -{"current_steps": 2600, "total_steps": 6590, "eval_loss": 0.03857457637786865, "epoch": 3.943127962085308, "percentage": 39.45, "elapsed_time": "8:00:35", "remaining_time": "12:17:31"} -{"current_steps": 2610, "total_steps": 6590, "loss": 0.0164, "lr": 7.559395309038994e-05, "epoch": 3.9582938388625593, "percentage": 39.61, "elapsed_time": "8:01:58", "remaining_time": "12:14:57"} -{"current_steps": 2620, "total_steps": 6590, "loss": 0.0188, "lr": 7.536607792724732e-05, "epoch": 3.9734597156398106, "percentage": 39.76, "elapsed_time": "8:03:15", "remaining_time": "12:12:16"} -{"current_steps": 2630, "total_steps": 6590, "loss": 0.0161, "lr": 7.513749106535278e-05, "epoch": 3.9886255924170615, "percentage": 39.91, "elapsed_time": "8:04:33", "remaining_time": "12:09:35"} -{"current_steps": 2640, "total_steps": 6590, "loss": 0.0258, "lr": 7.490819891819228e-05, "epoch": 4.003791469194312, "percentage": 40.06, "elapsed_time": "8:05:51", "remaining_time": "12:06:56"} -{"current_steps": 2650, "total_steps": 6590, "loss": 0.0128, "lr": 7.467820791904004e-05, "epoch": 4.018957345971564, "percentage": 40.21, "elapsed_time": "8:07:09", "remaining_time": "12:04:17"} -{"current_steps": 2650, "total_steps": 6590, "eval_loss": 0.03858537971973419, "epoch": 4.018957345971564, "percentage": 40.21, "elapsed_time": "8:09:49", "remaining_time": "12:08:16"} -{"current_steps": 2660, "total_steps": 6590, "loss": 0.007, "lr": 7.444752452077801e-05, "epoch": 4.034123222748815, "percentage": 40.36, "elapsed_time": "8:11:12", "remaining_time": "12:05:43"} -{"current_steps": 2670, "total_steps": 6590, "loss": 0.0065, "lr": 7.421615519571489e-05, "epoch": 4.049289099526066, "percentage": 40.52, "elapsed_time": "8:12:30", "remaining_time": "12:03:04"} -{"current_steps": 2680, "total_steps": 6590, "loss": 0.0047, "lr": 7.39841064354045e-05, "epoch": 4.064454976303318, "percentage": 40.67, "elapsed_time": "8:13:48", "remaining_time": "12:00:26"} -{"current_steps": 2690, "total_steps": 6590, "loss": 0.0125, "lr": 7.375138475046363e-05, "epoch": 4.079620853080569, "percentage": 40.82, "elapsed_time": "8:15:05", "remaining_time": "11:57:48"} -{"current_steps": 2700, "total_steps": 6590, "loss": 0.0072, "lr": 7.351799667038942e-05, "epoch": 4.0947867298578196, "percentage": 40.97, "elapsed_time": "8:16:23", "remaining_time": "11:55:10"} -{"current_steps": 2700, "total_steps": 6590, "eval_loss": 0.04654594510793686, "epoch": 4.0947867298578196, "percentage": 40.97, "elapsed_time": "8:19:04", "remaining_time": "11:59:02"} -{"current_steps": 2710, "total_steps": 6590, "loss": 0.0084, "lr": 7.32839487433761e-05, "epoch": 4.109952606635071, "percentage": 41.12, "elapsed_time": "8:20:27", "remaining_time": "11:56:31"} -{"current_steps": 2720, "total_steps": 6590, "loss": 0.0078, "lr": 7.304924753613127e-05, "epoch": 4.125118483412322, "percentage": 41.27, "elapsed_time": "8:21:44", "remaining_time": "11:53:53"} -{"current_steps": 2730, "total_steps": 6590, "loss": 0.0092, "lr": 7.281389963369174e-05, "epoch": 4.140284360189574, "percentage": 41.43, "elapsed_time": "8:23:02", "remaining_time": "11:51:15"} -{"current_steps": 2740, "total_steps": 6590, "loss": 0.0055, "lr": 7.257791163923869e-05, "epoch": 4.155450236966825, "percentage": 41.58, "elapsed_time": "8:24:20", "remaining_time": "11:48:39"} -{"current_steps": 2750, "total_steps": 6590, "loss": 0.01, "lr": 7.234129017391245e-05, "epoch": 4.170616113744076, "percentage": 41.73, "elapsed_time": "8:25:38", "remaining_time": "11:46:03"} -{"current_steps": 2750, "total_steps": 6590, "eval_loss": 0.052549898624420166, "epoch": 4.170616113744076, "percentage": 41.73, "elapsed_time": "8:28:19", "remaining_time": "11:49:48"} -{"current_steps": 2760, "total_steps": 6590, "loss": 0.0066, "lr": 7.210404187662668e-05, "epoch": 4.185781990521327, "percentage": 41.88, "elapsed_time": "8:29:51", "remaining_time": "11:47:31"} -{"current_steps": 2770, "total_steps": 6590, "loss": 0.0123, "lr": 7.186617340388211e-05, "epoch": 4.200947867298578, "percentage": 42.03, "elapsed_time": "8:31:09", "remaining_time": "11:44:54"} -{"current_steps": 2780, "total_steps": 6590, "loss": 0.011, "lr": 7.162769142957987e-05, "epoch": 4.216113744075829, "percentage": 42.19, "elapsed_time": "8:32:26", "remaining_time": "11:42:18"} -{"current_steps": 2790, "total_steps": 6590, "loss": 0.0164, "lr": 7.138860264483413e-05, "epoch": 4.231279620853081, "percentage": 42.34, "elapsed_time": "8:33:44", "remaining_time": "11:39:42"} -{"current_steps": 2800, "total_steps": 6590, "loss": 0.015, "lr": 7.114891375778438e-05, "epoch": 4.246445497630332, "percentage": 42.49, "elapsed_time": "8:35:02", "remaining_time": "11:37:08"} -{"current_steps": 2800, "total_steps": 6590, "eval_loss": 0.041996706277132034, "epoch": 4.246445497630332, "percentage": 42.49, "elapsed_time": "8:37:42", "remaining_time": "11:40:45"} -{"current_steps": 2810, "total_steps": 6590, "loss": 0.0093, "lr": 7.090863149340731e-05, "epoch": 4.2616113744075825, "percentage": 42.64, "elapsed_time": "8:39:04", "remaining_time": "11:38:15"} -{"current_steps": 2820, "total_steps": 6590, "loss": 0.0132, "lr": 7.066776259332797e-05, "epoch": 4.276777251184834, "percentage": 42.79, "elapsed_time": "8:40:22", "remaining_time": "11:35:40"} -{"current_steps": 2830, "total_steps": 6590, "loss": 0.0075, "lr": 7.042631381563081e-05, "epoch": 4.291943127962085, "percentage": 42.94, "elapsed_time": "8:41:40", "remaining_time": "11:33:05"} -{"current_steps": 2840, "total_steps": 6590, "loss": 0.0105, "lr": 7.018429193466988e-05, "epoch": 4.3071090047393366, "percentage": 43.1, "elapsed_time": "8:42:57", "remaining_time": "11:30:31"} -{"current_steps": 2850, "total_steps": 6590, "loss": 0.0122, "lr": 6.994170374087893e-05, "epoch": 4.322274881516588, "percentage": 43.25, "elapsed_time": "8:44:15", "remaining_time": "11:27:58"} -{"current_steps": 2850, "total_steps": 6590, "eval_loss": 0.04366535320878029, "epoch": 4.322274881516588, "percentage": 43.25, "elapsed_time": "8:46:56", "remaining_time": "11:31:29"} -{"current_steps": 2860, "total_steps": 6590, "loss": 0.0183, "lr": 6.969855604058072e-05, "epoch": 4.337440758293839, "percentage": 43.4, "elapsed_time": "8:48:18", "remaining_time": "11:29:01"} -{"current_steps": 2870, "total_steps": 6590, "loss": 0.016, "lr": 6.945485565579622e-05, "epoch": 4.35260663507109, "percentage": 43.55, "elapsed_time": "8:49:36", "remaining_time": "11:26:27"} -{"current_steps": 2880, "total_steps": 6590, "loss": 0.0095, "lr": 6.92106094240531e-05, "epoch": 4.367772511848341, "percentage": 43.7, "elapsed_time": "8:50:54", "remaining_time": "11:23:54"} -{"current_steps": 2890, "total_steps": 6590, "loss": 0.0125, "lr": 6.896582419819392e-05, "epoch": 4.382938388625592, "percentage": 43.85, "elapsed_time": "8:52:12", "remaining_time": "11:21:22"} -{"current_steps": 2900, "total_steps": 6590, "loss": 0.0147, "lr": 6.872050684618382e-05, "epoch": 4.398104265402844, "percentage": 44.01, "elapsed_time": "8:53:29", "remaining_time": "11:18:49"} -{"current_steps": 2900, "total_steps": 6590, "eval_loss": 0.04488484561443329, "epoch": 4.398104265402844, "percentage": 44.01, "elapsed_time": "8:56:10", "remaining_time": "11:22:14"} -{"current_steps": 2910, "total_steps": 6590, "loss": 0.0067, "lr": 6.847466425091792e-05, "epoch": 4.413270142180095, "percentage": 44.16, "elapsed_time": "8:57:33", "remaining_time": "11:19:47"} -{"current_steps": 2920, "total_steps": 6590, "loss": 0.0154, "lr": 6.822830331002812e-05, "epoch": 4.4284360189573455, "percentage": 44.31, "elapsed_time": "8:58:50", "remaining_time": "11:17:14"} -{"current_steps": 2930, "total_steps": 6590, "loss": 0.0145, "lr": 6.798143093568958e-05, "epoch": 4.443601895734597, "percentage": 44.46, "elapsed_time": "9:00:08", "remaining_time": "11:14:42"} -{"current_steps": 2940, "total_steps": 6590, "loss": 0.0104, "lr": 6.773405405442683e-05, "epoch": 4.458767772511848, "percentage": 44.61, "elapsed_time": "9:01:25", "remaining_time": "11:12:11"} -{"current_steps": 2950, "total_steps": 6590, "loss": 0.0139, "lr": 6.748617960691937e-05, "epoch": 4.4739336492890995, "percentage": 44.76, "elapsed_time": "9:02:43", "remaining_time": "11:09:40"} -{"current_steps": 2950, "total_steps": 6590, "eval_loss": 0.04246136173605919, "epoch": 4.4739336492890995, "percentage": 44.76, "elapsed_time": "9:05:24", "remaining_time": "11:12:58"} -{"current_steps": 2960, "total_steps": 6590, "loss": 0.012, "lr": 6.723781454780702e-05, "epoch": 4.489099526066351, "percentage": 44.92, "elapsed_time": "9:06:47", "remaining_time": "11:10:33"} -{"current_steps": 2970, "total_steps": 6590, "loss": 0.016, "lr": 6.69889658454947e-05, "epoch": 4.504265402843602, "percentage": 45.07, "elapsed_time": "9:08:05", "remaining_time": "11:08:02"} -{"current_steps": 2980, "total_steps": 6590, "loss": 0.0105, "lr": 6.6739640481957e-05, "epoch": 4.519431279620854, "percentage": 45.22, "elapsed_time": "9:09:22", "remaining_time": "11:05:31"} -{"current_steps": 2990, "total_steps": 6590, "loss": 0.0128, "lr": 6.648984545254217e-05, "epoch": 4.534597156398104, "percentage": 45.37, "elapsed_time": "9:10:40", "remaining_time": "11:03:01"} -{"current_steps": 3000, "total_steps": 6590, "loss": 0.011, "lr": 6.623958776577599e-05, "epoch": 4.549763033175355, "percentage": 45.52, "elapsed_time": "9:11:58", "remaining_time": "11:00:31"} -{"current_steps": 3000, "total_steps": 6590, "eval_loss": 0.044334445148706436, "epoch": 4.549763033175355, "percentage": 45.52, "elapsed_time": "9:14:38", "remaining_time": "11:03:43"} -{"current_steps": 3010, "total_steps": 6590, "loss": 0.0136, "lr": 6.598887444316506e-05, "epoch": 4.564928909952607, "percentage": 45.68, "elapsed_time": "9:16:01", "remaining_time": "11:01:19"} -{"current_steps": 3020, "total_steps": 6590, "loss": 0.0101, "lr": 6.573771251899981e-05, "epoch": 4.580094786729858, "percentage": 45.83, "elapsed_time": "9:17:19", "remaining_time": "10:58:49"} -{"current_steps": 3030, "total_steps": 6590, "loss": 0.0119, "lr": 6.548610904015709e-05, "epoch": 4.595260663507109, "percentage": 45.98, "elapsed_time": "9:18:37", "remaining_time": "10:56:20"} -{"current_steps": 3040, "total_steps": 6590, "loss": 0.0112, "lr": 6.523407106590252e-05, "epoch": 4.61042654028436, "percentage": 46.13, "elapsed_time": "9:19:55", "remaining_time": "10:53:51"} -{"current_steps": 3050, "total_steps": 6590, "loss": 0.0061, "lr": 6.49816056676924e-05, "epoch": 4.625592417061611, "percentage": 46.28, "elapsed_time": "9:21:12", "remaining_time": "10:51:22"} -{"current_steps": 3050, "total_steps": 6590, "eval_loss": 0.04450962319970131, "epoch": 4.625592417061611, "percentage": 46.28, "elapsed_time": "9:23:53", "remaining_time": "10:54:28"} -{"current_steps": 3060, "total_steps": 6590, "loss": 0.0076, "lr": 6.472871992897536e-05, "epoch": 4.6407582938388625, "percentage": 46.43, "elapsed_time": "9:25:17", "remaining_time": "10:52:06"} -{"current_steps": 3070, "total_steps": 6590, "loss": 0.0087, "lr": 6.447542094499347e-05, "epoch": 4.655924170616114, "percentage": 46.59, "elapsed_time": "9:26:34", "remaining_time": "10:49:37"} -{"current_steps": 3080, "total_steps": 6590, "loss": 0.0083, "lr": 6.422171582258334e-05, "epoch": 4.671090047393365, "percentage": 46.74, "elapsed_time": "9:27:52", "remaining_time": "10:47:09"} -{"current_steps": 3090, "total_steps": 6590, "loss": 0.0108, "lr": 6.396761167997664e-05, "epoch": 4.6862559241706165, "percentage": 46.89, "elapsed_time": "9:29:09", "remaining_time": "10:44:40"} -{"current_steps": 3100, "total_steps": 6590, "loss": 0.0159, "lr": 6.371311564660039e-05, "epoch": 4.701421800947867, "percentage": 47.04, "elapsed_time": "9:30:27", "remaining_time": "10:42:13"} -{"current_steps": 3100, "total_steps": 6590, "eval_loss": 0.04513256624341011, "epoch": 4.701421800947867, "percentage": 47.04, "elapsed_time": "9:33:07", "remaining_time": "10:45:14"} -{"current_steps": 3110, "total_steps": 6590, "loss": 0.0096, "lr": 6.345823486287687e-05, "epoch": 4.716587677725118, "percentage": 47.19, "elapsed_time": "9:34:31", "remaining_time": "10:42:52"} -{"current_steps": 3120, "total_steps": 6590, "loss": 0.0155, "lr": 6.320297648002346e-05, "epoch": 4.73175355450237, "percentage": 47.34, "elapsed_time": "9:35:48", "remaining_time": "10:40:24"} -{"current_steps": 3130, "total_steps": 6590, "loss": 0.0168, "lr": 6.294734765985176e-05, "epoch": 4.746919431279621, "percentage": 47.5, "elapsed_time": "9:37:06", "remaining_time": "10:37:57"} -{"current_steps": 3140, "total_steps": 6590, "loss": 0.0081, "lr": 6.269135557456686e-05, "epoch": 4.762085308056872, "percentage": 47.65, "elapsed_time": "9:38:24", "remaining_time": "10:35:30"} -{"current_steps": 3150, "total_steps": 6590, "loss": 0.0111, "lr": 6.243500740656594e-05, "epoch": 4.777251184834123, "percentage": 47.8, "elapsed_time": "9:39:41", "remaining_time": "10:33:03"} -{"current_steps": 3150, "total_steps": 6590, "eval_loss": 0.040830329060554504, "epoch": 4.777251184834123, "percentage": 47.8, "elapsed_time": "9:42:22", "remaining_time": "10:35:59"} -{"current_steps": 3160, "total_steps": 6590, "loss": 0.0091, "lr": 6.217831034823694e-05, "epoch": 4.792417061611374, "percentage": 47.95, "elapsed_time": "9:43:45", "remaining_time": "10:33:37"} -{"current_steps": 3170, "total_steps": 6590, "loss": 0.0119, "lr": 6.19212716017565e-05, "epoch": 4.8075829383886255, "percentage": 48.1, "elapsed_time": "9:45:02", "remaining_time": "10:31:10"} -{"current_steps": 3180, "total_steps": 6590, "loss": 0.0145, "lr": 6.166389837888819e-05, "epoch": 4.822748815165877, "percentage": 48.25, "elapsed_time": "9:46:19", "remaining_time": "10:28:44"} -{"current_steps": 3190, "total_steps": 6590, "loss": 0.0109, "lr": 6.140619790077991e-05, "epoch": 4.837914691943128, "percentage": 48.41, "elapsed_time": "9:47:37", "remaining_time": "10:26:18"} -{"current_steps": 3200, "total_steps": 6590, "loss": 0.0058, "lr": 6.114817739776147e-05, "epoch": 4.8530805687203795, "percentage": 48.56, "elapsed_time": "9:48:54", "remaining_time": "10:23:52"} -{"current_steps": 3200, "total_steps": 6590, "eval_loss": 0.04339787736535072, "epoch": 4.8530805687203795, "percentage": 48.56, "elapsed_time": "9:51:35", "remaining_time": "10:26:42"} -{"current_steps": 3210, "total_steps": 6590, "loss": 0.0065, "lr": 6.0889844109141626e-05, "epoch": 4.86824644549763, "percentage": 48.71, "elapsed_time": "9:52:59", "remaining_time": "10:24:23"} -{"current_steps": 3220, "total_steps": 6590, "loss": 0.007, "lr": 6.0631205283004967e-05, "epoch": 4.883412322274881, "percentage": 48.86, "elapsed_time": "9:54:16", "remaining_time": "10:21:57"} -{"current_steps": 3230, "total_steps": 6590, "loss": 0.0132, "lr": 6.0372268176008605e-05, "epoch": 4.898578199052133, "percentage": 49.01, "elapsed_time": "9:55:34", "remaining_time": "10:19:33"} -{"current_steps": 3240, "total_steps": 6590, "loss": 0.0118, "lr": 6.011304005317856e-05, "epoch": 4.913744075829384, "percentage": 49.17, "elapsed_time": "9:56:52", "remaining_time": "10:17:08"} -{"current_steps": 3250, "total_steps": 6590, "loss": 0.0106, "lr": 5.985352818770591e-05, "epoch": 4.928909952606635, "percentage": 49.32, "elapsed_time": "9:58:09", "remaining_time": "10:14:43"} -{"current_steps": 3250, "total_steps": 6590, "eval_loss": 0.04381377622485161, "epoch": 4.928909952606635, "percentage": 49.32, "elapsed_time": "10:00:50", "remaining_time": "10:17:28"} -{"current_steps": 3260, "total_steps": 6590, "loss": 0.0091, "lr": 5.95937398607427e-05, "epoch": 4.944075829383886, "percentage": 49.47, "elapsed_time": "10:02:14", "remaining_time": "10:15:10"} -{"current_steps": 3270, "total_steps": 6590, "loss": 0.0091, "lr": 5.933368236119773e-05, "epoch": 4.959241706161137, "percentage": 49.62, "elapsed_time": "10:03:32", "remaining_time": "10:12:45"} -{"current_steps": 3280, "total_steps": 6590, "loss": 0.0168, "lr": 5.907336298553197e-05, "epoch": 4.9744075829383885, "percentage": 49.77, "elapsed_time": "10:04:49", "remaining_time": "10:10:21"} -{"current_steps": 3290, "total_steps": 6590, "loss": 0.012, "lr": 5.8812789037553894e-05, "epoch": 4.98957345971564, "percentage": 49.92, "elapsed_time": "10:06:07", "remaining_time": "10:07:57"} -{"current_steps": 3300, "total_steps": 6590, "loss": 0.0123, "lr": 5.855196782821452e-05, "epoch": 5.004739336492891, "percentage": 50.08, "elapsed_time": "10:07:24", "remaining_time": "10:05:34"} -{"current_steps": 3300, "total_steps": 6590, "eval_loss": 0.04007617011666298, "epoch": 5.004739336492891, "percentage": 50.08, "elapsed_time": "10:10:05", "remaining_time": "10:08:14"} -{"current_steps": 3310, "total_steps": 6590, "loss": 0.0062, "lr": 5.829090667540231e-05, "epoch": 5.0199052132701425, "percentage": 50.23, "elapsed_time": "10:11:28", "remaining_time": "10:05:56"} -{"current_steps": 3320, "total_steps": 6590, "loss": 0.0074, "lr": 5.802961290373788e-05, "epoch": 5.035071090047393, "percentage": 50.38, "elapsed_time": "10:12:46", "remaining_time": "10:03:33"} -{"current_steps": 3330, "total_steps": 6590, "loss": 0.0045, "lr": 5.776809384436843e-05, "epoch": 5.050236966824644, "percentage": 50.53, "elapsed_time": "10:14:03", "remaining_time": "10:01:09"} -{"current_steps": 3340, "total_steps": 6590, "loss": 0.0071, "lr": 5.7506356834762064e-05, "epoch": 5.065402843601896, "percentage": 50.68, "elapsed_time": "10:15:21", "remaining_time": "9:58:46"} -{"current_steps": 3350, "total_steps": 6590, "loss": 0.0043, "lr": 5.724440921850196e-05, "epoch": 5.080568720379147, "percentage": 50.83, "elapsed_time": "10:16:38", "remaining_time": "9:56:23"} -{"current_steps": 3350, "total_steps": 6590, "eval_loss": 0.0507822260260582, "epoch": 5.080568720379147, "percentage": 50.83, "elapsed_time": "10:19:19", "remaining_time": "9:58:59"} -{"current_steps": 3360, "total_steps": 6590, "loss": 0.0044, "lr": 5.6982258345080284e-05, "epoch": 5.095734597156398, "percentage": 50.99, "elapsed_time": "10:20:43", "remaining_time": "9:56:42"} -{"current_steps": 3370, "total_steps": 6590, "loss": 0.007, "lr": 5.671991156969209e-05, "epoch": 5.11090047393365, "percentage": 51.14, "elapsed_time": "10:22:01", "remaining_time": "9:54:19"} -{"current_steps": 3380, "total_steps": 6590, "loss": 0.0042, "lr": 5.645737625302875e-05, "epoch": 5.1260663507109, "percentage": 51.29, "elapsed_time": "10:23:18", "remaining_time": "9:51:57"} -{"current_steps": 3390, "total_steps": 6590, "loss": 0.0059, "lr": 5.619465976107168e-05, "epoch": 5.1412322274881515, "percentage": 51.44, "elapsed_time": "10:24:36", "remaining_time": "9:49:36"} -{"current_steps": 3400, "total_steps": 6590, "loss": 0.0051, "lr": 5.5931769464885455e-05, "epoch": 5.156398104265403, "percentage": 51.59, "elapsed_time": "10:25:54", "remaining_time": "9:47:14"} -{"current_steps": 3400, "total_steps": 6590, "eval_loss": 0.052639201283454895, "epoch": 5.156398104265403, "percentage": 51.59, "elapsed_time": "10:28:34", "remaining_time": "9:49:45"} -{"current_steps": 3410, "total_steps": 6590, "loss": 0.0117, "lr": 5.566871274041114e-05, "epoch": 5.171563981042654, "percentage": 51.75, "elapsed_time": "10:29:58", "remaining_time": "9:47:28"} -{"current_steps": 3420, "total_steps": 6590, "loss": 0.0032, "lr": 5.540549696825932e-05, "epoch": 5.1867298578199055, "percentage": 51.9, "elapsed_time": "10:31:15", "remaining_time": "9:45:06"} -{"current_steps": 3430, "total_steps": 6590, "loss": 0.0066, "lr": 5.514212953350293e-05, "epoch": 5.201895734597157, "percentage": 52.05, "elapsed_time": "10:32:33", "remaining_time": "9:42:45"} -{"current_steps": 3440, "total_steps": 6590, "loss": 0.0075, "lr": 5.487861782547018e-05, "epoch": 5.217061611374407, "percentage": 52.2, "elapsed_time": "10:33:50", "remaining_time": "9:40:24"} -{"current_steps": 3450, "total_steps": 6590, "loss": 0.0043, "lr": 5.4614969237537115e-05, "epoch": 5.232227488151659, "percentage": 52.35, "elapsed_time": "10:35:07", "remaining_time": "9:38:03"} -{"current_steps": 3450, "total_steps": 6590, "eval_loss": 0.05088622868061066, "epoch": 5.232227488151659, "percentage": 52.35, "elapsed_time": "10:37:48", "remaining_time": "9:40:29"} -{"current_steps": 3460, "total_steps": 6590, "loss": 0.0064, "lr": 5.435119116692032e-05, "epoch": 5.24739336492891, "percentage": 52.5, "elapsed_time": "10:39:11", "remaining_time": "9:38:14"} -{"current_steps": 3470, "total_steps": 6590, "loss": 0.0078, "lr": 5.40872910144692e-05, "epoch": 5.262559241706161, "percentage": 52.66, "elapsed_time": "10:40:29", "remaining_time": "9:35:53"} -{"current_steps": 3480, "total_steps": 6590, "loss": 0.0057, "lr": 5.382327618445847e-05, "epoch": 5.277725118483413, "percentage": 52.81, "elapsed_time": "10:41:47", "remaining_time": "9:33:33"} -{"current_steps": 3490, "total_steps": 6590, "loss": 0.005, "lr": 5.355915408438034e-05, "epoch": 5.292890995260663, "percentage": 52.96, "elapsed_time": "10:43:04", "remaining_time": "9:31:13"} -{"current_steps": 3500, "total_steps": 6590, "loss": 0.0049, "lr": 5.329493212473673e-05, "epoch": 5.308056872037914, "percentage": 53.11, "elapsed_time": "10:44:22", "remaining_time": "9:28:53"} -{"current_steps": 3500, "total_steps": 6590, "eval_loss": 0.048039890825748444, "epoch": 5.308056872037914, "percentage": 53.11, "elapsed_time": "10:47:02", "remaining_time": "9:31:14"} -{"current_steps": 3510, "total_steps": 6590, "loss": 0.0074, "lr": 5.303061771883133e-05, "epoch": 5.323222748815166, "percentage": 53.26, "elapsed_time": "10:48:26", "remaining_time": "9:28:59"} -{"current_steps": 3520, "total_steps": 6590, "loss": 0.0044, "lr": 5.27662182825616e-05, "epoch": 5.338388625592417, "percentage": 53.41, "elapsed_time": "10:49:43", "remaining_time": "9:26:39"} -{"current_steps": 3530, "total_steps": 6590, "loss": 0.007, "lr": 5.250174123421068e-05, "epoch": 5.3535545023696685, "percentage": 53.57, "elapsed_time": "10:51:00", "remaining_time": "9:24:20"} -{"current_steps": 3540, "total_steps": 6590, "loss": 0.0104, "lr": 5.223719399423931e-05, "epoch": 5.36872037914692, "percentage": 53.72, "elapsed_time": "10:52:18", "remaining_time": "9:22:00"} -{"current_steps": 3550, "total_steps": 6590, "loss": 0.0043, "lr": 5.197258398507762e-05, "epoch": 5.38388625592417, "percentage": 53.87, "elapsed_time": "10:53:35", "remaining_time": "9:19:41"} -{"current_steps": 3550, "total_steps": 6590, "eval_loss": 0.04626436531543732, "epoch": 5.38388625592417, "percentage": 53.87, "elapsed_time": "10:56:16", "remaining_time": "9:21:59"} -{"current_steps": 3560, "total_steps": 6590, "loss": 0.0062, "lr": 5.170791863091682e-05, "epoch": 5.399052132701422, "percentage": 54.02, "elapsed_time": "10:57:39", "remaining_time": "9:19:45"} -{"current_steps": 3570, "total_steps": 6590, "loss": 0.0017, "lr": 5.144320535750096e-05, "epoch": 5.414218009478673, "percentage": 54.17, "elapsed_time": "10:58:57", "remaining_time": "9:17:26"} -{"current_steps": 3580, "total_steps": 6590, "loss": 0.0041, "lr": 5.1178451591918574e-05, "epoch": 5.429383886255924, "percentage": 54.32, "elapsed_time": "11:00:15", "remaining_time": "9:15:07"} -{"current_steps": 3590, "total_steps": 6590, "loss": 0.0055, "lr": 5.091366476239425e-05, "epoch": 5.444549763033176, "percentage": 54.48, "elapsed_time": "11:01:32", "remaining_time": "9:12:49"} -{"current_steps": 3600, "total_steps": 6590, "loss": 0.0052, "lr": 5.064885229808034e-05, "epoch": 5.459715639810426, "percentage": 54.63, "elapsed_time": "11:02:50", "remaining_time": "9:10:31"} -{"current_steps": 3600, "total_steps": 6590, "eval_loss": 0.05071334168314934, "epoch": 5.459715639810426, "percentage": 54.63, "elapsed_time": "11:05:30", "remaining_time": "9:12:44"} -{"current_steps": 3610, "total_steps": 6590, "loss": 0.0042, "lr": 5.0384021628848334e-05, "epoch": 5.474881516587677, "percentage": 54.78, "elapsed_time": "11:06:55", "remaining_time": "9:10:31"} -{"current_steps": 3620, "total_steps": 6590, "loss": 0.0038, "lr": 5.011918018508057e-05, "epoch": 5.490047393364929, "percentage": 54.93, "elapsed_time": "11:08:12", "remaining_time": "9:08:13"} -{"current_steps": 3630, "total_steps": 6590, "loss": 0.0035, "lr": 4.985433539746164e-05, "epoch": 5.50521327014218, "percentage": 55.08, "elapsed_time": "11:09:29", "remaining_time": "9:05:55"} -{"current_steps": 3640, "total_steps": 6590, "loss": 0.0014, "lr": 4.958949469677001e-05, "epoch": 5.520379146919431, "percentage": 55.24, "elapsed_time": "11:10:47", "remaining_time": "9:03:38"} -{"current_steps": 3650, "total_steps": 6590, "loss": 0.0086, "lr": 4.9324665513669385e-05, "epoch": 5.535545023696683, "percentage": 55.39, "elapsed_time": "11:12:05", "remaining_time": "9:01:21"} -{"current_steps": 3650, "total_steps": 6590, "eval_loss": 0.0571274608373642, "epoch": 5.535545023696683, "percentage": 55.39, "elapsed_time": "11:14:45", "remaining_time": "9:03:30"} -{"current_steps": 3660, "total_steps": 6590, "loss": 0.0059, "lr": 4.9059855278500446e-05, "epoch": 5.550710900473934, "percentage": 55.54, "elapsed_time": "11:16:09", "remaining_time": "9:01:18"} -{"current_steps": 3670, "total_steps": 6590, "loss": 0.0089, "lr": 4.879507142107215e-05, "epoch": 5.565876777251185, "percentage": 55.69, "elapsed_time": "11:17:27", "remaining_time": "8:59:00"} -{"current_steps": 3680, "total_steps": 6590, "loss": 0.0053, "lr": 4.853032137045343e-05, "epoch": 5.581042654028436, "percentage": 55.84, "elapsed_time": "11:18:44", "remaining_time": "8:56:43"} -{"current_steps": 3690, "total_steps": 6590, "loss": 0.0037, "lr": 4.826561255476463e-05, "epoch": 5.596208530805687, "percentage": 55.99, "elapsed_time": "11:20:02", "remaining_time": "8:54:26"} -{"current_steps": 3700, "total_steps": 6590, "loss": 0.0026, "lr": 4.800095240096925e-05, "epoch": 5.611374407582939, "percentage": 56.15, "elapsed_time": "11:21:19", "remaining_time": "8:52:10"} -{"current_steps": 3700, "total_steps": 6590, "eval_loss": 0.04951642081141472, "epoch": 5.611374407582939, "percentage": 56.15, "elapsed_time": "11:24:00", "remaining_time": "8:54:15"} -{"current_steps": 3710, "total_steps": 6590, "loss": 0.0089, "lr": 4.773634833466542e-05, "epoch": 5.62654028436019, "percentage": 56.3, "elapsed_time": "11:25:24", "remaining_time": "8:52:03"} -{"current_steps": 3720, "total_steps": 6590, "loss": 0.009, "lr": 4.747180777987761e-05, "epoch": 5.64170616113744, "percentage": 56.45, "elapsed_time": "11:26:41", "remaining_time": "8:49:47"} -{"current_steps": 3730, "total_steps": 6590, "loss": 0.0027, "lr": 4.720733815884836e-05, "epoch": 5.656872037914692, "percentage": 56.6, "elapsed_time": "11:27:59", "remaining_time": "8:47:31"} -{"current_steps": 3740, "total_steps": 6590, "loss": 0.0063, "lr": 4.694294689183005e-05, "epoch": 5.672037914691943, "percentage": 56.75, "elapsed_time": "11:29:17", "remaining_time": "8:45:15"} -{"current_steps": 3750, "total_steps": 6590, "loss": 0.0032, "lr": 4.667864139687661e-05, "epoch": 5.687203791469194, "percentage": 56.9, "elapsed_time": "11:30:35", "remaining_time": "8:43:00"} -{"current_steps": 3750, "total_steps": 6590, "eval_loss": 0.04893982410430908, "epoch": 5.687203791469194, "percentage": 56.9, "elapsed_time": "11:33:15", "remaining_time": "8:45:01"} -{"current_steps": 3760, "total_steps": 6590, "loss": 0.0085, "lr": 4.641442908963549e-05, "epoch": 5.702369668246446, "percentage": 57.06, "elapsed_time": "11:34:39", "remaining_time": "8:42:50"} -{"current_steps": 3770, "total_steps": 6590, "loss": 0.003, "lr": 4.615031738313954e-05, "epoch": 5.717535545023697, "percentage": 57.21, "elapsed_time": "11:35:56", "remaining_time": "8:40:34"} -{"current_steps": 3780, "total_steps": 6590, "loss": 0.0066, "lr": 4.588631368759908e-05, "epoch": 5.7327014218009475, "percentage": 57.36, "elapsed_time": "11:37:14", "remaining_time": "8:38:19"} -{"current_steps": 3790, "total_steps": 6590, "loss": 0.0097, "lr": 4.562242541019392e-05, "epoch": 5.747867298578199, "percentage": 57.51, "elapsed_time": "11:38:32", "remaining_time": "8:36:04"} -{"current_steps": 3800, "total_steps": 6590, "loss": 0.0034, "lr": 4.535865995486559e-05, "epoch": 5.76303317535545, "percentage": 57.66, "elapsed_time": "11:39:50", "remaining_time": "8:33:49"} -{"current_steps": 3800, "total_steps": 6590, "eval_loss": 0.050715312361717224, "epoch": 5.76303317535545, "percentage": 57.66, "elapsed_time": "11:42:30", "remaining_time": "8:35:47"} -{"current_steps": 3810, "total_steps": 6590, "loss": 0.0082, "lr": 4.509502472210956e-05, "epoch": 5.778199052132702, "percentage": 57.81, "elapsed_time": "11:43:54", "remaining_time": "8:33:36"} -{"current_steps": 3820, "total_steps": 6590, "loss": 0.0068, "lr": 4.483152710876768e-05, "epoch": 5.793364928909953, "percentage": 57.97, "elapsed_time": "11:45:11", "remaining_time": "8:31:21"} -{"current_steps": 3830, "total_steps": 6590, "loss": 0.0045, "lr": 4.456817450782058e-05, "epoch": 5.808530805687203, "percentage": 58.12, "elapsed_time": "11:46:28", "remaining_time": "8:29:06"} -{"current_steps": 3840, "total_steps": 6590, "loss": 0.0066, "lr": 4.4304974308180225e-05, "epoch": 5.823696682464455, "percentage": 58.27, "elapsed_time": "11:47:46", "remaining_time": "8:26:51"} -{"current_steps": 3850, "total_steps": 6590, "loss": 0.0019, "lr": 4.4041933894482675e-05, "epoch": 5.838862559241706, "percentage": 58.42, "elapsed_time": "11:49:03", "remaining_time": "8:24:37"} -{"current_steps": 3850, "total_steps": 6590, "eval_loss": 0.0481330044567585, "epoch": 5.838862559241706, "percentage": 58.42, "elapsed_time": "11:51:44", "remaining_time": "8:26:32"} -{"current_steps": 3860, "total_steps": 6590, "loss": 0.0058, "lr": 4.3779060646880844e-05, "epoch": 5.854028436018957, "percentage": 58.57, "elapsed_time": "11:53:08", "remaining_time": "8:24:22"} -{"current_steps": 3870, "total_steps": 6590, "loss": 0.0059, "lr": 4.3516361940837485e-05, "epoch": 5.869194312796209, "percentage": 58.73, "elapsed_time": "11:54:25", "remaining_time": "8:22:07"} -{"current_steps": 3880, "total_steps": 6590, "loss": 0.0078, "lr": 4.325384514691818e-05, "epoch": 5.88436018957346, "percentage": 58.88, "elapsed_time": "11:55:43", "remaining_time": "8:19:53"} -{"current_steps": 3890, "total_steps": 6590, "loss": 0.0065, "lr": 4.299151763058458e-05, "epoch": 5.8995260663507105, "percentage": 59.03, "elapsed_time": "11:57:00", "remaining_time": "8:17:40"} -{"current_steps": 3900, "total_steps": 6590, "loss": 0.0024, "lr": 4.272938675198778e-05, "epoch": 5.914691943127962, "percentage": 59.18, "elapsed_time": "11:58:18", "remaining_time": "8:15:26"} -{"current_steps": 3900, "total_steps": 6590, "eval_loss": 0.050162095576524734, "epoch": 5.914691943127962, "percentage": 59.18, "elapsed_time": "12:00:58", "remaining_time": "8:17:17"} -{"current_steps": 3910, "total_steps": 6590, "loss": 0.0038, "lr": 4.2467459865761775e-05, "epoch": 5.929857819905213, "percentage": 59.33, "elapsed_time": "12:02:22", "remaining_time": "8:15:08"} -{"current_steps": 3920, "total_steps": 6590, "loss": 0.008, "lr": 4.220574432081714e-05, "epoch": 5.9450236966824646, "percentage": 59.48, "elapsed_time": "12:03:40", "remaining_time": "8:12:54"} -{"current_steps": 3930, "total_steps": 6590, "loss": 0.0078, "lr": 4.194424746013481e-05, "epoch": 5.960189573459716, "percentage": 59.64, "elapsed_time": "12:04:57", "remaining_time": "8:10:41"} -{"current_steps": 3940, "total_steps": 6590, "loss": 0.0082, "lr": 4.168297662056005e-05, "epoch": 5.975355450236966, "percentage": 59.79, "elapsed_time": "12:06:15", "remaining_time": "8:08:28"} -{"current_steps": 3950, "total_steps": 6590, "loss": 0.0089, "lr": 4.1421939132596676e-05, "epoch": 5.990521327014218, "percentage": 59.94, "elapsed_time": "12:07:33", "remaining_time": "8:06:15"} -{"current_steps": 3950, "total_steps": 6590, "eval_loss": 0.04755592718720436, "epoch": 5.990521327014218, "percentage": 59.94, "elapsed_time": "12:10:13", "remaining_time": "8:08:03"} -{"current_steps": 3960, "total_steps": 6590, "loss": 0.0053, "lr": 4.116114232020132e-05, "epoch": 6.005687203791469, "percentage": 60.09, "elapsed_time": "12:11:36", "remaining_time": "8:05:53"} -{"current_steps": 3970, "total_steps": 6590, "loss": 0.0063, "lr": 4.0900593500577925e-05, "epoch": 6.02085308056872, "percentage": 60.24, "elapsed_time": "12:12:53", "remaining_time": "8:03:40"} -{"current_steps": 3980, "total_steps": 6590, "loss": 0.0036, "lr": 4.0640299983972474e-05, "epoch": 6.036018957345972, "percentage": 60.39, "elapsed_time": "12:14:11", "remaining_time": "8:01:27"} -{"current_steps": 3990, "total_steps": 6590, "loss": 0.0053, "lr": 4.0380269073467944e-05, "epoch": 6.051184834123223, "percentage": 60.55, "elapsed_time": "12:15:28", "remaining_time": "7:59:15"} -{"current_steps": 4000, "total_steps": 6590, "loss": 0.0029, "lr": 4.012050806477928e-05, "epoch": 6.0663507109004735, "percentage": 60.7, "elapsed_time": "12:16:46", "remaining_time": "7:57:03"} -{"current_steps": 4000, "total_steps": 6590, "eval_loss": 0.047806721180677414, "epoch": 6.0663507109004735, "percentage": 60.7, "elapsed_time": "12:19:26", "remaining_time": "7:58:47"} -{"current_steps": 4010, "total_steps": 6590, "loss": 0.0039, "lr": 3.986102424604881e-05, "epoch": 6.081516587677725, "percentage": 60.85, "elapsed_time": "12:20:50", "remaining_time": "7:56:38"} -{"current_steps": 4020, "total_steps": 6590, "loss": 0.006, "lr": 3.960182489764165e-05, "epoch": 6.096682464454976, "percentage": 61.0, "elapsed_time": "12:22:07", "remaining_time": "7:54:26"} -{"current_steps": 4030, "total_steps": 6590, "loss": 0.002, "lr": 3.934291729194159e-05, "epoch": 6.1118483412322275, "percentage": 61.15, "elapsed_time": "12:23:25", "remaining_time": "7:52:15"} -{"current_steps": 4040, "total_steps": 6590, "loss": 0.0056, "lr": 3.9084308693146884e-05, "epoch": 6.127014218009479, "percentage": 61.31, "elapsed_time": "12:24:42", "remaining_time": "7:50:03"} -{"current_steps": 4050, "total_steps": 6590, "loss": 0.004, "lr": 3.8826006357066583e-05, "epoch": 6.14218009478673, "percentage": 61.46, "elapsed_time": "12:26:00", "remaining_time": "7:47:51"} -{"current_steps": 4050, "total_steps": 6590, "eval_loss": 0.052365612238645554, "epoch": 6.14218009478673, "percentage": 61.46, "elapsed_time": "12:28:40", "remaining_time": "7:49:32"} -{"current_steps": 4060, "total_steps": 6590, "loss": 0.0028, "lr": 3.8568017530916816e-05, "epoch": 6.157345971563981, "percentage": 61.61, "elapsed_time": "12:30:04", "remaining_time": "7:47:24"} -{"current_steps": 4070, "total_steps": 6590, "loss": 0.0022, "lr": 3.8310349453117624e-05, "epoch": 6.172511848341232, "percentage": 61.76, "elapsed_time": "12:31:21", "remaining_time": "7:45:13"} -{"current_steps": 4080, "total_steps": 6590, "loss": 0.0071, "lr": 3.805300935308968e-05, "epoch": 6.187677725118483, "percentage": 61.91, "elapsed_time": "12:32:39", "remaining_time": "7:43:01"} -{"current_steps": 4090, "total_steps": 6590, "loss": 0.0056, "lr": 3.779600445105165e-05, "epoch": 6.202843601895735, "percentage": 62.06, "elapsed_time": "12:33:56", "remaining_time": "7:40:50"} -{"current_steps": 4100, "total_steps": 6590, "loss": 0.0007, "lr": 3.7539341957817424e-05, "epoch": 6.218009478672986, "percentage": 62.22, "elapsed_time": "12:35:14", "remaining_time": "7:38:40"} -{"current_steps": 4100, "total_steps": 6590, "eval_loss": 0.0558902844786644, "epoch": 6.218009478672986, "percentage": 62.22, "elapsed_time": "12:37:54", "remaining_time": "7:40:17"} -{"current_steps": 4110, "total_steps": 6590, "loss": 0.0038, "lr": 3.7283029074593924e-05, "epoch": 6.233175355450237, "percentage": 62.37, "elapsed_time": "12:39:18", "remaining_time": "7:38:10"} -{"current_steps": 4120, "total_steps": 6590, "loss": 0.0017, "lr": 3.702707299277906e-05, "epoch": 6.248341232227488, "percentage": 62.52, "elapsed_time": "12:40:36", "remaining_time": "7:35:59"} -{"current_steps": 4130, "total_steps": 6590, "loss": 0.0018, "lr": 3.677148089375988e-05, "epoch": 6.263507109004739, "percentage": 62.67, "elapsed_time": "12:41:53", "remaining_time": "7:33:48"} -{"current_steps": 4140, "total_steps": 6590, "loss": 0.0025, "lr": 3.6516259948711164e-05, "epoch": 6.2786729857819905, "percentage": 62.82, "elapsed_time": "12:43:11", "remaining_time": "7:31:38"} -{"current_steps": 4150, "total_steps": 6590, "loss": 0.0038, "lr": 3.626141731839414e-05, "epoch": 6.293838862559242, "percentage": 62.97, "elapsed_time": "12:44:28", "remaining_time": "7:29:28"} -{"current_steps": 4150, "total_steps": 6590, "eval_loss": 0.05632086843252182, "epoch": 6.293838862559242, "percentage": 62.97, "elapsed_time": "12:47:09", "remaining_time": "7:31:02"} -{"current_steps": 4160, "total_steps": 6590, "loss": 0.0059, "lr": 3.6006960152955685e-05, "epoch": 6.309004739336493, "percentage": 63.13, "elapsed_time": "12:48:31", "remaining_time": "7:28:55"} -{"current_steps": 4170, "total_steps": 6590, "loss": 0.0014, "lr": 3.5752895591727575e-05, "epoch": 6.324170616113744, "percentage": 63.28, "elapsed_time": "12:49:49", "remaining_time": "7:26:45"} -{"current_steps": 4180, "total_steps": 6590, "loss": 0.0062, "lr": 3.5499230763026316e-05, "epoch": 6.339336492890995, "percentage": 63.43, "elapsed_time": "12:51:06", "remaining_time": "7:24:35"} -{"current_steps": 4190, "total_steps": 6590, "loss": 0.0032, "lr": 3.5245972783953e-05, "epoch": 6.354502369668246, "percentage": 63.58, "elapsed_time": "12:52:24", "remaining_time": "7:22:25"} -{"current_steps": 4200, "total_steps": 6590, "loss": 0.0012, "lr": 3.499312876019378e-05, "epoch": 6.369668246445498, "percentage": 63.73, "elapsed_time": "12:53:41", "remaining_time": "7:20:16"} -{"current_steps": 4200, "total_steps": 6590, "eval_loss": 0.05449463054537773, "epoch": 6.369668246445498, "percentage": 63.73, "elapsed_time": "12:56:22", "remaining_time": "7:21:47"} -{"current_steps": 4210, "total_steps": 6590, "loss": 0.0019, "lr": 3.474070578582037e-05, "epoch": 6.384834123222749, "percentage": 63.88, "elapsed_time": "12:57:44", "remaining_time": "7:19:40"} -{"current_steps": 4220, "total_steps": 6590, "loss": 0.0041, "lr": 3.4488710943091045e-05, "epoch": 6.4, "percentage": 64.04, "elapsed_time": "12:59:01", "remaining_time": "7:17:30"} -{"current_steps": 4230, "total_steps": 6590, "loss": 0.003, "lr": 3.423715130225196e-05, "epoch": 6.415165876777251, "percentage": 64.19, "elapsed_time": "13:00:19", "remaining_time": "7:15:21"} -{"current_steps": 4240, "total_steps": 6590, "loss": 0.0022, "lr": 3.398603392133881e-05, "epoch": 6.430331753554502, "percentage": 64.34, "elapsed_time": "13:01:36", "remaining_time": "7:13:12"} -{"current_steps": 4250, "total_steps": 6590, "loss": 0.0021, "lr": 3.3735365845978696e-05, "epoch": 6.4454976303317535, "percentage": 64.49, "elapsed_time": "13:02:54", "remaining_time": "7:11:03"} -{"current_steps": 4250, "total_steps": 6590, "eval_loss": 0.0590050145983696, "epoch": 6.4454976303317535, "percentage": 64.49, "elapsed_time": "13:05:34", "remaining_time": "7:12:31"} -{"current_steps": 4260, "total_steps": 6590, "loss": 0.0048, "lr": 3.34851541091925e-05, "epoch": 6.460663507109005, "percentage": 64.64, "elapsed_time": "13:06:56", "remaining_time": "7:10:25"} -{"current_steps": 4270, "total_steps": 6590, "loss": 0.0014, "lr": 3.32354057311976e-05, "epoch": 6.475829383886256, "percentage": 64.8, "elapsed_time": "13:08:13", "remaining_time": "7:08:15"} -{"current_steps": 4280, "total_steps": 6590, "loss": 0.0029, "lr": 3.298612771921088e-05, "epoch": 6.4909952606635075, "percentage": 64.95, "elapsed_time": "13:09:31", "remaining_time": "7:06:07"} -{"current_steps": 4290, "total_steps": 6590, "loss": 0.0039, "lr": 3.2737327067252074e-05, "epoch": 6.506161137440758, "percentage": 65.1, "elapsed_time": "13:10:48", "remaining_time": "7:03:58"} -{"current_steps": 4300, "total_steps": 6590, "loss": 0.0027, "lr": 3.24890107559476e-05, "epoch": 6.521327014218009, "percentage": 65.25, "elapsed_time": "13:12:05", "remaining_time": "7:01:50"} -{"current_steps": 4300, "total_steps": 6590, "eval_loss": 0.056247007101774216, "epoch": 6.521327014218009, "percentage": 65.25, "elapsed_time": "13:14:46", "remaining_time": "7:03:15"} -{"current_steps": 4310, "total_steps": 6590, "loss": 0.003, "lr": 3.2241185752334634e-05, "epoch": 6.536492890995261, "percentage": 65.4, "elapsed_time": "13:16:08", "remaining_time": "7:01:09"} -{"current_steps": 4320, "total_steps": 6590, "loss": 0.0026, "lr": 3.1993859009665744e-05, "epoch": 6.551658767772512, "percentage": 65.55, "elapsed_time": "13:17:26", "remaining_time": "6:59:01"} -{"current_steps": 4330, "total_steps": 6590, "loss": 0.0043, "lr": 3.1747037467213725e-05, "epoch": 6.566824644549763, "percentage": 65.71, "elapsed_time": "13:18:43", "remaining_time": "6:56:53"} -{"current_steps": 4340, "total_steps": 6590, "loss": 0.0074, "lr": 3.150072805007688e-05, "epoch": 6.581990521327015, "percentage": 65.86, "elapsed_time": "13:20:01", "remaining_time": "6:54:45"} -{"current_steps": 4350, "total_steps": 6590, "loss": 0.0045, "lr": 3.125493766898477e-05, "epoch": 6.597156398104265, "percentage": 66.01, "elapsed_time": "13:21:19", "remaining_time": "6:52:38"} -{"current_steps": 4350, "total_steps": 6590, "eval_loss": 0.049974557012319565, "epoch": 6.597156398104265, "percentage": 66.01, "elapsed_time": "13:23:59", "remaining_time": "6:54:00"} -{"current_steps": 4360, "total_steps": 6590, "loss": 0.0015, "lr": 3.1009673220104305e-05, "epoch": 6.6123222748815165, "percentage": 66.16, "elapsed_time": "13:25:21", "remaining_time": "6:51:54"} -{"current_steps": 4370, "total_steps": 6590, "loss": 0.0024, "lr": 3.076494158484631e-05, "epoch": 6.627488151658768, "percentage": 66.31, "elapsed_time": "13:26:39", "remaining_time": "6:49:47"} -{"current_steps": 4380, "total_steps": 6590, "loss": 0.0025, "lr": 3.0520749629672334e-05, "epoch": 6.642654028436019, "percentage": 66.46, "elapsed_time": "13:27:56", "remaining_time": "6:47:39"} -{"current_steps": 4390, "total_steps": 6590, "loss": 0.0009, "lr": 3.027710420590208e-05, "epoch": 6.6578199052132705, "percentage": 66.62, "elapsed_time": "13:29:14", "remaining_time": "6:45:32"} -{"current_steps": 4400, "total_steps": 6590, "loss": 0.0024, "lr": 3.0034012149521173e-05, "epoch": 6.672985781990521, "percentage": 66.77, "elapsed_time": "13:30:31", "remaining_time": "6:43:25"} -{"current_steps": 4400, "total_steps": 6590, "eval_loss": 0.05433971434831619, "epoch": 6.672985781990521, "percentage": 66.77, "elapsed_time": "13:33:12", "remaining_time": "6:44:45"} -{"current_steps": 4410, "total_steps": 6590, "loss": 0.0014, "lr": 2.979148028098936e-05, "epoch": 6.688151658767772, "percentage": 66.92, "elapsed_time": "13:34:34", "remaining_time": "6:42:40"} -{"current_steps": 4420, "total_steps": 6590, "loss": 0.0036, "lr": 2.9549515405049122e-05, "epoch": 6.703317535545024, "percentage": 67.07, "elapsed_time": "13:35:51", "remaining_time": "6:40:32"} -{"current_steps": 4430, "total_steps": 6590, "loss": 0.0011, "lr": 2.9308124310534774e-05, "epoch": 6.718483412322275, "percentage": 67.22, "elapsed_time": "13:37:09", "remaining_time": "6:38:25"} -{"current_steps": 4440, "total_steps": 6590, "loss": 0.0015, "lr": 2.9067313770181944e-05, "epoch": 6.733649289099526, "percentage": 67.37, "elapsed_time": "13:38:26", "remaining_time": "6:36:19"} -{"current_steps": 4450, "total_steps": 6590, "loss": 0.0025, "lr": 2.88270905404377e-05, "epoch": 6.748815165876778, "percentage": 67.53, "elapsed_time": "13:39:44", "remaining_time": "6:34:12"} -{"current_steps": 4450, "total_steps": 6590, "eval_loss": 0.06043895706534386, "epoch": 6.748815165876778, "percentage": 67.53, "elapsed_time": "13:42:24", "remaining_time": "6:35:29"} -{"current_steps": 4460, "total_steps": 6590, "loss": 0.0028, "lr": 2.858746136127074e-05, "epoch": 6.763981042654028, "percentage": 67.68, "elapsed_time": "13:43:46", "remaining_time": "6:33:25"} -{"current_steps": 4470, "total_steps": 6590, "loss": 0.0039, "lr": 2.834843295598251e-05, "epoch": 6.7791469194312794, "percentage": 67.83, "elapsed_time": "13:45:04", "remaining_time": "6:31:18"} -{"current_steps": 4480, "total_steps": 6590, "loss": 0.0022, "lr": 2.811001203101845e-05, "epoch": 6.794312796208531, "percentage": 67.98, "elapsed_time": "13:46:21", "remaining_time": "6:29:12"} -{"current_steps": 4490, "total_steps": 6590, "loss": 0.0022, "lr": 2.787220527577986e-05, "epoch": 6.809478672985782, "percentage": 68.13, "elapsed_time": "13:47:39", "remaining_time": "6:27:05"} -{"current_steps": 4500, "total_steps": 6590, "loss": 0.0015, "lr": 2.7635019362436244e-05, "epoch": 6.8246445497630335, "percentage": 68.29, "elapsed_time": "13:48:56", "remaining_time": "6:25:00"} -{"current_steps": 4500, "total_steps": 6590, "eval_loss": 0.057198572903871536, "epoch": 6.8246445497630335, "percentage": 68.29, "elapsed_time": "13:51:37", "remaining_time": "6:26:14"} -{"current_steps": 4510, "total_steps": 6590, "loss": 0.0014, "lr": 2.7398460945737997e-05, "epoch": 6.839810426540284, "percentage": 68.44, "elapsed_time": "13:52:58", "remaining_time": "6:24:10"} -{"current_steps": 4520, "total_steps": 6590, "loss": 0.0046, "lr": 2.7162536662829842e-05, "epoch": 6.854976303317535, "percentage": 68.59, "elapsed_time": "13:54:15", "remaining_time": "6:22:03"} -{"current_steps": 4530, "total_steps": 6590, "loss": 0.0041, "lr": 2.6927253133064577e-05, "epoch": 6.870142180094787, "percentage": 68.74, "elapsed_time": "13:55:33", "remaining_time": "6:19:57"} -{"current_steps": 4540, "total_steps": 6590, "loss": 0.0011, "lr": 2.6692616957817233e-05, "epoch": 6.885308056872038, "percentage": 68.89, "elapsed_time": "13:56:50", "remaining_time": "6:17:52"} -{"current_steps": 4550, "total_steps": 6590, "loss": 0.0043, "lr": 2.645863472029999e-05, "epoch": 6.900473933649289, "percentage": 69.04, "elapsed_time": "13:58:08", "remaining_time": "6:15:46"} -{"current_steps": 4550, "total_steps": 6590, "eval_loss": 0.052840739488601685, "epoch": 6.900473933649289, "percentage": 69.04, "elapsed_time": "14:00:49", "remaining_time": "6:16:58"} -{"current_steps": 4560, "total_steps": 6590, "loss": 0.0021, "lr": 2.6225312985377447e-05, "epoch": 6.915639810426541, "percentage": 69.2, "elapsed_time": "14:02:11", "remaining_time": "6:14:55"} -{"current_steps": 4570, "total_steps": 6590, "loss": 0.0027, "lr": 2.5992658299382333e-05, "epoch": 6.930805687203791, "percentage": 69.35, "elapsed_time": "14:03:28", "remaining_time": "6:12:49"} -{"current_steps": 4580, "total_steps": 6590, "loss": 0.0005, "lr": 2.5760677189932044e-05, "epoch": 6.945971563981042, "percentage": 69.5, "elapsed_time": "14:04:46", "remaining_time": "6:10:44"} -{"current_steps": 4590, "total_steps": 6590, "loss": 0.0031, "lr": 2.5529376165745233e-05, "epoch": 6.961137440758294, "percentage": 69.65, "elapsed_time": "14:06:03", "remaining_time": "6:08:39"} -{"current_steps": 4600, "total_steps": 6590, "loss": 0.0064, "lr": 2.5298761716459406e-05, "epoch": 6.976303317535545, "percentage": 69.8, "elapsed_time": "14:07:21", "remaining_time": "6:06:34"} -{"current_steps": 4600, "total_steps": 6590, "eval_loss": 0.052640076726675034, "epoch": 6.976303317535545, "percentage": 69.8, "elapsed_time": "14:10:01", "remaining_time": "6:07:43"} -{"current_steps": 4610, "total_steps": 6590, "loss": 0.0014, "lr": 2.506884031244875e-05, "epoch": 6.9914691943127965, "percentage": 69.95, "elapsed_time": "14:11:23", "remaining_time": "6:05:40"} -{"current_steps": 4620, "total_steps": 6590, "loss": 0.0009, "lr": 2.4839618404642602e-05, "epoch": 7.006635071090048, "percentage": 70.11, "elapsed_time": "14:12:41", "remaining_time": "6:03:35"} -{"current_steps": 4630, "total_steps": 6590, "loss": 0.0006, "lr": 2.4611102424344473e-05, "epoch": 7.021800947867298, "percentage": 70.26, "elapsed_time": "14:13:58", "remaining_time": "6:01:30"} -{"current_steps": 4640, "total_steps": 6590, "loss": 0.0016, "lr": 2.4383298783051543e-05, "epoch": 7.03696682464455, "percentage": 70.41, "elapsed_time": "14:15:16", "remaining_time": "5:59:26"} -{"current_steps": 4650, "total_steps": 6590, "loss": 0.0009, "lr": 2.4156213872274874e-05, "epoch": 7.052132701421801, "percentage": 70.56, "elapsed_time": "14:16:34", "remaining_time": "5:57:21"} -{"current_steps": 4650, "total_steps": 6590, "eval_loss": 0.05745341256260872, "epoch": 7.052132701421801, "percentage": 70.56, "elapsed_time": "14:19:15", "remaining_time": "5:58:28"} -{"current_steps": 4660, "total_steps": 6590, "loss": 0.0007, "lr": 2.3929854063360013e-05, "epoch": 7.067298578199052, "percentage": 70.71, "elapsed_time": "14:20:36", "remaining_time": "5:56:26"} -{"current_steps": 4670, "total_steps": 6590, "loss": 0.0036, "lr": 2.3704225707308243e-05, "epoch": 7.082464454976304, "percentage": 70.86, "elapsed_time": "14:21:54", "remaining_time": "5:54:21"} -{"current_steps": 4680, "total_steps": 6590, "loss": 0.0024, "lr": 2.3479335134598407e-05, "epoch": 7.097630331753554, "percentage": 71.02, "elapsed_time": "14:23:11", "remaining_time": "5:52:17"} -{"current_steps": 4690, "total_steps": 6590, "loss": 0.0014, "lr": 2.325518865500923e-05, "epoch": 7.112796208530805, "percentage": 71.17, "elapsed_time": "14:24:29", "remaining_time": "5:50:13"} -{"current_steps": 4700, "total_steps": 6590, "loss": 0.0006, "lr": 2.303179255744243e-05, "epoch": 7.127962085308057, "percentage": 71.32, "elapsed_time": "14:25:46", "remaining_time": "5:48:09"} -{"current_steps": 4700, "total_steps": 6590, "eval_loss": 0.06053081154823303, "epoch": 7.127962085308057, "percentage": 71.32, "elapsed_time": "14:28:27", "remaining_time": "5:49:13"} -{"current_steps": 4710, "total_steps": 6590, "loss": 0.0007, "lr": 2.280915310974612e-05, "epoch": 7.143127962085308, "percentage": 71.47, "elapsed_time": "14:29:49", "remaining_time": "5:47:11"} -{"current_steps": 4720, "total_steps": 6590, "loss": 0.0057, "lr": 2.2587276558538978e-05, "epoch": 7.158293838862559, "percentage": 71.62, "elapsed_time": "14:31:06", "remaining_time": "5:45:07"} -{"current_steps": 4730, "total_steps": 6590, "loss": 0.0002, "lr": 2.236616912903507e-05, "epoch": 7.173459715639811, "percentage": 71.78, "elapsed_time": "14:32:24", "remaining_time": "5:43:03"} -{"current_steps": 4740, "total_steps": 6590, "loss": 0.0035, "lr": 2.2145837024869116e-05, "epoch": 7.188625592417061, "percentage": 71.93, "elapsed_time": "14:33:41", "remaining_time": "5:40:59"} -{"current_steps": 4750, "total_steps": 6590, "loss": 0.0007, "lr": 2.1926286427922436e-05, "epoch": 7.203791469194313, "percentage": 72.08, "elapsed_time": "14:34:59", "remaining_time": "5:38:56"} -{"current_steps": 4750, "total_steps": 6590, "eval_loss": 0.058909617364406586, "epoch": 7.203791469194313, "percentage": 72.08, "elapsed_time": "14:37:39", "remaining_time": "5:39:58"} -{"current_steps": 4760, "total_steps": 6590, "loss": 0.0003, "lr": 2.170752349814955e-05, "epoch": 7.218957345971564, "percentage": 72.23, "elapsed_time": "14:39:02", "remaining_time": "5:37:56"} -{"current_steps": 4770, "total_steps": 6590, "loss": 0.001, "lr": 2.148955437340526e-05, "epoch": 7.234123222748815, "percentage": 72.38, "elapsed_time": "14:40:19", "remaining_time": "5:35:53"} -{"current_steps": 4780, "total_steps": 6590, "loss": 0.0015, "lr": 2.1272385169272547e-05, "epoch": 7.249289099526067, "percentage": 72.53, "elapsed_time": "14:41:37", "remaining_time": "5:33:50"} -{"current_steps": 4790, "total_steps": 6590, "loss": 0.0014, "lr": 2.1056021978890916e-05, "epoch": 7.264454976303318, "percentage": 72.69, "elapsed_time": "14:42:55", "remaining_time": "5:31:47"} -{"current_steps": 4800, "total_steps": 6590, "loss": 0.0005, "lr": 2.0840470872785462e-05, "epoch": 7.279620853080568, "percentage": 72.84, "elapsed_time": "14:44:13", "remaining_time": "5:29:44"} -{"current_steps": 4800, "total_steps": 6590, "eval_loss": 0.06057117506861687, "epoch": 7.279620853080568, "percentage": 72.84, "elapsed_time": "14:46:53", "remaining_time": "5:30:44"} -{"current_steps": 4810, "total_steps": 6590, "loss": 0.0013, "lr": 2.0625737898696552e-05, "epoch": 7.29478672985782, "percentage": 72.99, "elapsed_time": "14:48:15", "remaining_time": "5:28:42"} -{"current_steps": 4820, "total_steps": 6590, "loss": 0.0004, "lr": 2.0411829081410084e-05, "epoch": 7.309952606635071, "percentage": 73.14, "elapsed_time": "14:49:32", "remaining_time": "5:26:39"} -{"current_steps": 4830, "total_steps": 6590, "loss": 0.0019, "lr": 2.019875042258859e-05, "epoch": 7.325118483412322, "percentage": 73.29, "elapsed_time": "14:50:50", "remaining_time": "5:24:36"} -{"current_steps": 4840, "total_steps": 6590, "loss": 0.0021, "lr": 1.9986507900602714e-05, "epoch": 7.340284360189574, "percentage": 73.44, "elapsed_time": "14:52:08", "remaining_time": "5:22:34"} -{"current_steps": 4850, "total_steps": 6590, "loss": 0.0002, "lr": 1.9775107470363473e-05, "epoch": 7.355450236966824, "percentage": 73.6, "elapsed_time": "14:53:25", "remaining_time": "5:20:31"} -{"current_steps": 4850, "total_steps": 6590, "eval_loss": 0.06296084821224213, "epoch": 7.355450236966824, "percentage": 73.6, "elapsed_time": "14:56:06", "remaining_time": "5:21:29"} -{"current_steps": 4860, "total_steps": 6590, "loss": 0.0015, "lr": 1.9564555063155298e-05, "epoch": 7.3706161137440755, "percentage": 73.75, "elapsed_time": "14:57:27", "remaining_time": "5:19:28"} -{"current_steps": 4870, "total_steps": 6590, "loss": 0.0002, "lr": 1.9354856586469512e-05, "epoch": 7.385781990521327, "percentage": 73.9, "elapsed_time": "14:58:45", "remaining_time": "5:17:25"} -{"current_steps": 4880, "total_steps": 6590, "loss": 0.0008, "lr": 1.914601792383862e-05, "epoch": 7.400947867298578, "percentage": 74.05, "elapsed_time": "15:00:02", "remaining_time": "5:15:23"} -{"current_steps": 4890, "total_steps": 6590, "loss": 0.0001, "lr": 1.8938044934671266e-05, "epoch": 7.41611374407583, "percentage": 74.2, "elapsed_time": "15:01:20", "remaining_time": "5:13:20"} -{"current_steps": 4900, "total_steps": 6590, "loss": 0.0003, "lr": 1.8730943454087714e-05, "epoch": 7.431279620853081, "percentage": 74.36, "elapsed_time": "15:02:37", "remaining_time": "5:11:18"} -{"current_steps": 4900, "total_steps": 6590, "eval_loss": 0.06590699404478073, "epoch": 7.431279620853081, "percentage": 74.36, "elapsed_time": "15:05:18", "remaining_time": "5:12:14"} -{"current_steps": 4910, "total_steps": 6590, "loss": 0.0002, "lr": 1.852471929275635e-05, "epoch": 7.446445497630331, "percentage": 74.51, "elapsed_time": "15:06:40", "remaining_time": "5:10:13"} -{"current_steps": 4920, "total_steps": 6590, "loss": 0.001, "lr": 1.831937823673039e-05, "epoch": 7.461611374407583, "percentage": 74.66, "elapsed_time": "15:07:57", "remaining_time": "5:08:11"} -{"current_steps": 4930, "total_steps": 6590, "loss": 0.0002, "lr": 1.8114926047285753e-05, "epoch": 7.476777251184834, "percentage": 74.81, "elapsed_time": "15:09:15", "remaining_time": "5:06:09"} -{"current_steps": 4940, "total_steps": 6590, "loss": 0.0008, "lr": 1.7911368460759305e-05, "epoch": 7.491943127962085, "percentage": 74.96, "elapsed_time": "15:10:32", "remaining_time": "5:04:07"} -{"current_steps": 4950, "total_steps": 6590, "loss": 0.0017, "lr": 1.770871118838794e-05, "epoch": 7.507109004739337, "percentage": 75.11, "elapsed_time": "15:11:50", "remaining_time": "5:02:06"} -{"current_steps": 4950, "total_steps": 6590, "eval_loss": 0.06954542547464371, "epoch": 7.507109004739337, "percentage": 75.11, "elapsed_time": "15:14:30", "remaining_time": "5:02:59"} -{"current_steps": 4960, "total_steps": 6590, "loss": 0.0027, "lr": 1.7506959916148374e-05, "epoch": 7.522274881516587, "percentage": 75.27, "elapsed_time": "15:15:52", "remaining_time": "5:00:58"} -{"current_steps": 4970, "total_steps": 6590, "loss": 0.0014, "lr": 1.730612030459752e-05, "epoch": 7.5374407582938385, "percentage": 75.42, "elapsed_time": "15:17:09", "remaining_time": "4:58:57"} -{"current_steps": 4980, "total_steps": 6590, "loss": 0.0018, "lr": 1.7106197988713764e-05, "epoch": 7.55260663507109, "percentage": 75.57, "elapsed_time": "15:18:27", "remaining_time": "4:56:55"} -{"current_steps": 4990, "total_steps": 6590, "loss": 0.0003, "lr": 1.6907198577738877e-05, "epoch": 7.567772511848341, "percentage": 75.72, "elapsed_time": "15:19:45", "remaining_time": "4:54:54"} -{"current_steps": 5000, "total_steps": 6590, "loss": 0.0011, "lr": 1.6709127655020495e-05, "epoch": 7.5829383886255926, "percentage": 75.87, "elapsed_time": "15:21:03", "remaining_time": "4:52:53"} -{"current_steps": 5000, "total_steps": 6590, "eval_loss": 0.0661698505282402, "epoch": 7.5829383886255926, "percentage": 75.87, "elapsed_time": "15:23:43", "remaining_time": "4:53:44"} -{"current_steps": 5010, "total_steps": 6590, "loss": 0.0038, "lr": 1.6511990777855617e-05, "epoch": 7.598104265402844, "percentage": 76.02, "elapsed_time": "15:25:08", "remaining_time": "4:51:45"} -{"current_steps": 5020, "total_steps": 6590, "loss": 0.0043, "lr": 1.631579347733465e-05, "epoch": 7.613270142180095, "percentage": 76.18, "elapsed_time": "15:26:25", "remaining_time": "4:49:44"} -{"current_steps": 5030, "total_steps": 6590, "loss": 0.0024, "lr": 1.61205412581861e-05, "epoch": 7.628436018957346, "percentage": 76.33, "elapsed_time": "15:27:43", "remaining_time": "4:47:43"} -{"current_steps": 5040, "total_steps": 6590, "loss": 0.0004, "lr": 1.5926239598622355e-05, "epoch": 7.643601895734597, "percentage": 76.48, "elapsed_time": "15:29:00", "remaining_time": "4:45:42"} -{"current_steps": 5050, "total_steps": 6590, "loss": 0.0017, "lr": 1.5732893950185752e-05, "epoch": 7.658767772511848, "percentage": 76.63, "elapsed_time": "15:30:18", "remaining_time": "4:43:41"} -{"current_steps": 5050, "total_steps": 6590, "eval_loss": 0.059014737606048584, "epoch": 7.658767772511848, "percentage": 76.63, "elapsed_time": "15:32:58", "remaining_time": "4:44:30"} -{"current_steps": 5060, "total_steps": 6590, "loss": 0.0006, "lr": 1.5540509737595754e-05, "epoch": 7.6739336492891, "percentage": 76.78, "elapsed_time": "15:34:22", "remaining_time": "4:42:31"} -{"current_steps": 5070, "total_steps": 6590, "loss": 0.0019, "lr": 1.5349092358596728e-05, "epoch": 7.689099526066351, "percentage": 76.93, "elapsed_time": "15:35:39", "remaining_time": "4:40:30"} -{"current_steps": 5080, "total_steps": 6590, "loss": 0.0017, "lr": 1.515864718380648e-05, "epoch": 7.7042654028436015, "percentage": 77.09, "elapsed_time": "15:36:57", "remaining_time": "4:38:30"} -{"current_steps": 5090, "total_steps": 6590, "loss": 0.0019, "lr": 1.4969179556565583e-05, "epoch": 7.719431279620853, "percentage": 77.24, "elapsed_time": "15:38:14", "remaining_time": "4:36:29"} -{"current_steps": 5100, "total_steps": 6590, "loss": 0.0005, "lr": 1.4780694792787425e-05, "epoch": 7.734597156398104, "percentage": 77.39, "elapsed_time": "15:39:32", "remaining_time": "4:34:29"} -{"current_steps": 5100, "total_steps": 6590, "eval_loss": 0.06153266876935959, "epoch": 7.734597156398104, "percentage": 77.39, "elapsed_time": "15:42:12", "remaining_time": "4:35:16"} -{"current_steps": 5110, "total_steps": 6590, "loss": 0.0044, "lr": 1.4593198180809109e-05, "epoch": 7.7497630331753555, "percentage": 77.54, "elapsed_time": "15:43:34", "remaining_time": "4:33:17"} -{"current_steps": 5120, "total_steps": 6590, "loss": 0.0018, "lr": 1.4406694981243101e-05, "epoch": 7.764928909952607, "percentage": 77.69, "elapsed_time": "15:44:51", "remaining_time": "4:31:16"} -{"current_steps": 5130, "total_steps": 6590, "loss": 0.0041, "lr": 1.4221190426829512e-05, "epoch": 7.780094786729858, "percentage": 77.85, "elapsed_time": "15:46:09", "remaining_time": "4:29:16"} -{"current_steps": 5140, "total_steps": 6590, "loss": 0.0016, "lr": 1.403668972228941e-05, "epoch": 7.795260663507109, "percentage": 78.0, "elapsed_time": "15:47:26", "remaining_time": "4:27:16"} -{"current_steps": 5150, "total_steps": 6590, "loss": 0.0019, "lr": 1.3853198044178722e-05, "epoch": 7.81042654028436, "percentage": 78.15, "elapsed_time": "15:48:44", "remaining_time": "4:25:16"} -{"current_steps": 5150, "total_steps": 6590, "eval_loss": 0.05827568471431732, "epoch": 7.81042654028436, "percentage": 78.15, "elapsed_time": "15:51:24", "remaining_time": "4:26:01"} -{"current_steps": 5160, "total_steps": 6590, "loss": 0.0017, "lr": 1.367072054074302e-05, "epoch": 7.825592417061611, "percentage": 78.3, "elapsed_time": "15:52:47", "remaining_time": "4:24:02"} -{"current_steps": 5170, "total_steps": 6590, "loss": 0.0015, "lr": 1.3489262331773079e-05, "epoch": 7.840758293838863, "percentage": 78.45, "elapsed_time": "15:54:04", "remaining_time": "4:22:02"} -{"current_steps": 5180, "total_steps": 6590, "loss": 0.0014, "lr": 1.330882850846118e-05, "epoch": 7.855924170616114, "percentage": 78.6, "elapsed_time": "15:55:22", "remaining_time": "4:20:03"} -{"current_steps": 5190, "total_steps": 6590, "loss": 0.0006, "lr": 1.312942413325835e-05, "epoch": 7.8710900473933645, "percentage": 78.76, "elapsed_time": "15:56:40", "remaining_time": "4:18:03"} -{"current_steps": 5200, "total_steps": 6590, "loss": 0.0009, "lr": 1.2951054239732263e-05, "epoch": 7.886255924170616, "percentage": 78.91, "elapsed_time": "15:57:57", "remaining_time": "4:16:04"} -{"current_steps": 5200, "total_steps": 6590, "eval_loss": 0.060263097286224365, "epoch": 7.886255924170616, "percentage": 78.91, "elapsed_time": "16:00:38", "remaining_time": "4:16:47"} -{"current_steps": 5210, "total_steps": 6590, "loss": 0.0011, "lr": 1.2773723832426032e-05, "epoch": 7.901421800947867, "percentage": 79.06, "elapsed_time": "16:02:00", "remaining_time": "4:14:48"} -{"current_steps": 5220, "total_steps": 6590, "loss": 0.0004, "lr": 1.2597437886717805e-05, "epoch": 7.9165876777251185, "percentage": 79.21, "elapsed_time": "16:03:18", "remaining_time": "4:12:49"} -{"current_steps": 5230, "total_steps": 6590, "loss": 0.0022, "lr": 1.2422201348681134e-05, "epoch": 7.93175355450237, "percentage": 79.36, "elapsed_time": "16:04:35", "remaining_time": "4:10:49"} -{"current_steps": 5240, "total_steps": 6590, "loss": 0.0055, "lr": 1.2248019134946225e-05, "epoch": 7.946919431279621, "percentage": 79.51, "elapsed_time": "16:05:53", "remaining_time": "4:08:50"} -{"current_steps": 5250, "total_steps": 6590, "loss": 0.0015, "lr": 1.2074896132562075e-05, "epoch": 7.9620853080568725, "percentage": 79.67, "elapsed_time": "16:07:11", "remaining_time": "4:06:51"} -{"current_steps": 5250, "total_steps": 6590, "eval_loss": 0.05999268218874931, "epoch": 7.9620853080568725, "percentage": 79.67, "elapsed_time": "16:09:51", "remaining_time": "4:07:32"} -{"current_steps": 5260, "total_steps": 6590, "loss": 0.0006, "lr": 1.1902837198859157e-05, "epoch": 7.977251184834123, "percentage": 79.82, "elapsed_time": "16:11:14", "remaining_time": "4:05:34"} -{"current_steps": 5270, "total_steps": 6590, "loss": 0.0009, "lr": 1.1731847161313325e-05, "epoch": 7.992417061611374, "percentage": 79.97, "elapsed_time": "16:12:31", "remaining_time": "4:03:35"} -{"current_steps": 5280, "total_steps": 6590, "loss": 0.0017, "lr": 1.15619308174103e-05, "epoch": 8.007582938388625, "percentage": 80.12, "elapsed_time": "16:13:49", "remaining_time": "4:01:36"} -{"current_steps": 5290, "total_steps": 6590, "loss": 0.0008, "lr": 1.1393092934511035e-05, "epoch": 8.022748815165876, "percentage": 80.27, "elapsed_time": "16:15:07", "remaining_time": "3:59:37"} -{"current_steps": 5300, "total_steps": 6590, "loss": 0.0012, "lr": 1.1225338249718032e-05, "epoch": 8.037914691943127, "percentage": 80.42, "elapsed_time": "16:16:24", "remaining_time": "3:57:39"} -{"current_steps": 5300, "total_steps": 6590, "eval_loss": 0.061292365193367004, "epoch": 8.037914691943127, "percentage": 80.42, "elapsed_time": "16:19:04", "remaining_time": "3:58:18"} -{"current_steps": 5310, "total_steps": 6590, "loss": 0.0007, "lr": 1.1058671469742331e-05, "epoch": 8.053080568720379, "percentage": 80.58, "elapsed_time": "16:20:26", "remaining_time": "3:56:20"} -{"current_steps": 5320, "total_steps": 6590, "loss": 0.0003, "lr": 1.0893097270771552e-05, "epoch": 8.06824644549763, "percentage": 80.73, "elapsed_time": "16:21:44", "remaining_time": "3:54:21"} -{"current_steps": 5330, "total_steps": 6590, "loss": 0.0012, "lr": 1.0728620298338649e-05, "epoch": 8.083412322274881, "percentage": 80.88, "elapsed_time": "16:23:01", "remaining_time": "3:52:23"} -{"current_steps": 5340, "total_steps": 6590, "loss": 0.0003, "lr": 1.0565245167191556e-05, "epoch": 8.098578199052133, "percentage": 81.03, "elapsed_time": "16:24:19", "remaining_time": "3:50:24"} -{"current_steps": 5350, "total_steps": 6590, "loss": 0.0003, "lr": 1.040297646116376e-05, "epoch": 8.113744075829384, "percentage": 81.18, "elapsed_time": "16:25:37", "remaining_time": "3:48:26"} -{"current_steps": 5350, "total_steps": 6590, "eval_loss": 0.0645313709974289, "epoch": 8.113744075829384, "percentage": 81.18, "elapsed_time": "16:28:17", "remaining_time": "3:49:03"} -{"current_steps": 5360, "total_steps": 6590, "loss": 0.0003, "lr": 1.0241818733045604e-05, "epoch": 8.128909952606636, "percentage": 81.34, "elapsed_time": "16:29:39", "remaining_time": "3:47:06"} -{"current_steps": 5370, "total_steps": 6590, "loss": 0.0002, "lr": 1.008177650445669e-05, "epoch": 8.144075829383887, "percentage": 81.49, "elapsed_time": "16:30:56", "remaining_time": "3:45:07"} -{"current_steps": 5380, "total_steps": 6590, "loss": 0.0012, "lr": 9.922854265718845e-06, "epoch": 8.159241706161138, "percentage": 81.64, "elapsed_time": "16:32:14", "remaining_time": "3:43:09"} -{"current_steps": 5390, "total_steps": 6590, "loss": 0.0011, "lr": 9.765056475730272e-06, "epoch": 8.174407582938388, "percentage": 81.79, "elapsed_time": "16:33:32", "remaining_time": "3:41:11"} -{"current_steps": 5400, "total_steps": 6590, "loss": 0.0004, "lr": 9.608387561840381e-06, "epoch": 8.189573459715639, "percentage": 81.94, "elapsed_time": "16:34:50", "remaining_time": "3:39:13"} -{"current_steps": 5400, "total_steps": 6590, "eval_loss": 0.06526435166597366, "epoch": 8.189573459715639, "percentage": 81.94, "elapsed_time": "16:37:30", "remaining_time": "3:39:49"} -{"current_steps": 5410, "total_steps": 6590, "loss": 0.0004, "lr": 9.45285191972559e-06, "epoch": 8.20473933649289, "percentage": 82.09, "elapsed_time": "16:38:52", "remaining_time": "3:37:52"} -{"current_steps": 5420, "total_steps": 6590, "loss": 0.0004, "lr": 9.298453913265981e-06, "epoch": 8.219905213270142, "percentage": 82.25, "elapsed_time": "16:40:10", "remaining_time": "3:35:54"} -{"current_steps": 5430, "total_steps": 6590, "loss": 0.0012, "lr": 9.145197874422901e-06, "epoch": 8.235071090047393, "percentage": 82.4, "elapsed_time": "16:41:27", "remaining_time": "3:33:56"} -{"current_steps": 5440, "total_steps": 6590, "loss": 0.0014, "lr": 8.993088103117314e-06, "epoch": 8.250236966824644, "percentage": 82.55, "elapsed_time": "16:42:45", "remaining_time": "3:31:58"} -{"current_steps": 5450, "total_steps": 6590, "loss": 0.0002, "lr": 8.842128867109345e-06, "epoch": 8.265402843601896, "percentage": 82.7, "elapsed_time": "16:44:02", "remaining_time": "3:30:01"} -{"current_steps": 5450, "total_steps": 6590, "eval_loss": 0.06632176041603088, "epoch": 8.265402843601896, "percentage": 82.7, "elapsed_time": "16:46:43", "remaining_time": "3:30:34"} -{"current_steps": 5460, "total_steps": 6590, "loss": 0.0003, "lr": 8.692324401878326e-06, "epoch": 8.280568720379147, "percentage": 82.85, "elapsed_time": "16:48:04", "remaining_time": "3:28:37"} -{"current_steps": 5470, "total_steps": 6590, "loss": 0.0005, "lr": 8.543678910504122e-06, "epoch": 8.295734597156398, "percentage": 83.0, "elapsed_time": "16:49:22", "remaining_time": "3:26:40"} -{"current_steps": 5480, "total_steps": 6590, "loss": 0.0013, "lr": 8.39619656354913e-06, "epoch": 8.31090047393365, "percentage": 83.16, "elapsed_time": "16:50:39", "remaining_time": "3:24:42"} -{"current_steps": 5490, "total_steps": 6590, "loss": 0.0001, "lr": 8.249881498941248e-06, "epoch": 8.326066350710901, "percentage": 83.31, "elapsed_time": "16:51:57", "remaining_time": "3:22:45"} -{"current_steps": 5500, "total_steps": 6590, "loss": 0.0006, "lr": 8.104737821857883e-06, "epoch": 8.341232227488153, "percentage": 83.46, "elapsed_time": "16:53:15", "remaining_time": "3:20:48"} -{"current_steps": 5500, "total_steps": 6590, "eval_loss": 0.06748320162296295, "epoch": 8.341232227488153, "percentage": 83.46, "elapsed_time": "16:55:55", "remaining_time": "3:21:20"} -{"current_steps": 5510, "total_steps": 6590, "loss": 0.0011, "lr": 7.960769604610619e-06, "epoch": 8.356398104265402, "percentage": 83.61, "elapsed_time": "16:57:18", "remaining_time": "3:19:23"} -{"current_steps": 5520, "total_steps": 6590, "loss": 0.0001, "lr": 7.817980886531078e-06, "epoch": 8.371563981042653, "percentage": 83.76, "elapsed_time": "16:58:35", "remaining_time": "3:17:26"} -{"current_steps": 5530, "total_steps": 6590, "loss": 0.0028, "lr": 7.67637567385755e-06, "epoch": 8.386729857819905, "percentage": 83.92, "elapsed_time": "16:59:53", "remaining_time": "3:15:29"} -{"current_steps": 5540, "total_steps": 6590, "loss": 0.0002, "lr": 7.535957939622573e-06, "epoch": 8.401895734597156, "percentage": 84.07, "elapsed_time": "17:01:10", "remaining_time": "3:13:32"} -{"current_steps": 5550, "total_steps": 6590, "loss": 0.0004, "lr": 7.396731623541481e-06, "epoch": 8.417061611374407, "percentage": 84.22, "elapsed_time": "17:02:28", "remaining_time": "3:11:35"} -{"current_steps": 5550, "total_steps": 6590, "eval_loss": 0.06695921719074249, "epoch": 8.417061611374407, "percentage": 84.22, "elapsed_time": "17:05:09", "remaining_time": "3:12:06"} -{"current_steps": 5560, "total_steps": 6590, "loss": 0.002, "lr": 7.2587006319018766e-06, "epoch": 8.432227488151659, "percentage": 84.37, "elapsed_time": "17:06:31", "remaining_time": "3:10:09"} -{"current_steps": 5570, "total_steps": 6590, "loss": 0.0011, "lr": 7.1218688374539765e-06, "epoch": 8.44739336492891, "percentage": 84.52, "elapsed_time": "17:07:48", "remaining_time": "3:08:13"} -{"current_steps": 5580, "total_steps": 6590, "loss": 0.0003, "lr": 6.986240079302053e-06, "epoch": 8.462559241706161, "percentage": 84.67, "elapsed_time": "17:09:06", "remaining_time": "3:06:16"} -{"current_steps": 5590, "total_steps": 6590, "loss": 0.0017, "lr": 6.851818162796603e-06, "epoch": 8.477725118483413, "percentage": 84.83, "elapsed_time": "17:10:24", "remaining_time": "3:04:19"} -{"current_steps": 5600, "total_steps": 6590, "loss": 0.0005, "lr": 6.718606859427673e-06, "epoch": 8.492890995260664, "percentage": 84.98, "elapsed_time": "17:11:41", "remaining_time": "3:02:23"} -{"current_steps": 5600, "total_steps": 6590, "eval_loss": 0.06707433611154556, "epoch": 8.492890995260664, "percentage": 84.98, "elapsed_time": "17:14:22", "remaining_time": "3:02:51"} -{"current_steps": 5610, "total_steps": 6590, "loss": 0.0002, "lr": 6.586609906719005e-06, "epoch": 8.508056872037915, "percentage": 85.13, "elapsed_time": "17:15:43", "remaining_time": "3:00:55"} -{"current_steps": 5620, "total_steps": 6590, "loss": 0.0024, "lr": 6.4558310081231585e-06, "epoch": 8.523222748815165, "percentage": 85.28, "elapsed_time": "17:17:01", "remaining_time": "2:58:59"} -{"current_steps": 5630, "total_steps": 6590, "loss": 0.0013, "lr": 6.326273832917651e-06, "epoch": 8.538388625592416, "percentage": 85.43, "elapsed_time": "17:18:18", "remaining_time": "2:57:02"} -{"current_steps": 5640, "total_steps": 6590, "loss": 0.0001, "lr": 6.197942016101932e-06, "epoch": 8.553554502369668, "percentage": 85.58, "elapsed_time": "17:19:36", "remaining_time": "2:55:06"} -{"current_steps": 5650, "total_steps": 6590, "loss": 0.0018, "lr": 6.070839158295455e-06, "epoch": 8.568720379146919, "percentage": 85.74, "elapsed_time": "17:20:54", "remaining_time": "2:53:10"} -{"current_steps": 5650, "total_steps": 6590, "eval_loss": 0.06664544343948364, "epoch": 8.568720379146919, "percentage": 85.74, "elapsed_time": "17:23:35", "remaining_time": "2:53:37"} -{"current_steps": 5660, "total_steps": 6590, "loss": 0.0006, "lr": 5.944968825636687e-06, "epoch": 8.58388625592417, "percentage": 85.89, "elapsed_time": "17:24:57", "remaining_time": "2:51:41"} -{"current_steps": 5670, "total_steps": 6590, "loss": 0.002, "lr": 5.820334549682938e-06, "epoch": 8.599052132701422, "percentage": 86.04, "elapsed_time": "17:26:14", "remaining_time": "2:49:45"} -{"current_steps": 5680, "total_steps": 6590, "loss": 0.0016, "lr": 5.696939827311387e-06, "epoch": 8.614218009478673, "percentage": 86.19, "elapsed_time": "17:27:32", "remaining_time": "2:47:49"} -{"current_steps": 5690, "total_steps": 6590, "loss": 0.0021, "lr": 5.574788120620894e-06, "epoch": 8.629383886255924, "percentage": 86.34, "elapsed_time": "17:28:50", "remaining_time": "2:45:53"} -{"current_steps": 5700, "total_steps": 6590, "loss": 0.0003, "lr": 5.453882856834908e-06, "epoch": 8.644549763033176, "percentage": 86.49, "elapsed_time": "17:30:07", "remaining_time": "2:43:58"} -{"current_steps": 5700, "total_steps": 6590, "eval_loss": 0.06454561650753021, "epoch": 8.644549763033176, "percentage": 86.49, "elapsed_time": "17:32:48", "remaining_time": "2:44:23"} -{"current_steps": 5710, "total_steps": 6590, "loss": 0.0002, "lr": 5.334227428205335e-06, "epoch": 8.659715639810427, "percentage": 86.65, "elapsed_time": "17:34:11", "remaining_time": "2:42:28"} -{"current_steps": 5720, "total_steps": 6590, "loss": 0.0002, "lr": 5.215825191917256e-06, "epoch": 8.674881516587678, "percentage": 86.8, "elapsed_time": "17:35:29", "remaining_time": "2:40:32"} -{"current_steps": 5730, "total_steps": 6590, "loss": 0.0004, "lr": 5.0986794699948495e-06, "epoch": 8.690047393364928, "percentage": 86.95, "elapsed_time": "17:36:46", "remaining_time": "2:38:36"} -{"current_steps": 5740, "total_steps": 6590, "loss": 0.0006, "lr": 4.9827935492081145e-06, "epoch": 8.70521327014218, "percentage": 87.1, "elapsed_time": "17:38:04", "remaining_time": "2:36:40"} -{"current_steps": 5750, "total_steps": 6590, "loss": 0.0008, "lr": 4.868170680980683e-06, "epoch": 8.72037914691943, "percentage": 87.25, "elapsed_time": "17:39:21", "remaining_time": "2:34:45"} -{"current_steps": 5750, "total_steps": 6590, "eval_loss": 0.06558696925640106, "epoch": 8.72037914691943, "percentage": 87.25, "elapsed_time": "17:42:02", "remaining_time": "2:35:09"} -{"current_steps": 5760, "total_steps": 6590, "loss": 0.0006, "lr": 4.754814081298597e-06, "epoch": 8.735545023696682, "percentage": 87.41, "elapsed_time": "17:43:24", "remaining_time": "2:33:14"} -{"current_steps": 5770, "total_steps": 6590, "loss": 0.0001, "lr": 4.642726930620034e-06, "epoch": 8.750710900473933, "percentage": 87.56, "elapsed_time": "17:44:42", "remaining_time": "2:31:18"} -{"current_steps": 5780, "total_steps": 6590, "loss": 0.0018, "lr": 4.53191237378614e-06, "epoch": 8.765876777251185, "percentage": 87.71, "elapsed_time": "17:45:59", "remaining_time": "2:29:23"} -{"current_steps": 5790, "total_steps": 6590, "loss": 0.0006, "lr": 4.422373519932743e-06, "epoch": 8.781042654028436, "percentage": 87.86, "elapsed_time": "17:47:17", "remaining_time": "2:27:28"} -{"current_steps": 5800, "total_steps": 6590, "loss": 0.0009, "lr": 4.31411344240314e-06, "epoch": 8.796208530805687, "percentage": 88.01, "elapsed_time": "17:48:35", "remaining_time": "2:25:32"} -{"current_steps": 5800, "total_steps": 6590, "eval_loss": 0.06653338670730591, "epoch": 8.796208530805687, "percentage": 88.01, "elapsed_time": "17:51:15", "remaining_time": "2:25:54"} -{"current_steps": 5810, "total_steps": 6590, "loss": 0.0007, "lr": 4.207135178661875e-06, "epoch": 8.811374407582939, "percentage": 88.16, "elapsed_time": "17:52:38", "remaining_time": "2:24:00"} -{"current_steps": 5820, "total_steps": 6590, "loss": 0.0002, "lr": 4.101441730209471e-06, "epoch": 8.82654028436019, "percentage": 88.32, "elapsed_time": "17:53:55", "remaining_time": "2:22:05"} -{"current_steps": 5830, "total_steps": 6590, "loss": 0.0001, "lr": 3.997036062498299e-06, "epoch": 8.841706161137441, "percentage": 88.47, "elapsed_time": "17:55:13", "remaining_time": "2:20:09"} -{"current_steps": 5840, "total_steps": 6590, "loss": 0.0001, "lr": 3.893921104849308e-06, "epoch": 8.856872037914691, "percentage": 88.62, "elapsed_time": "17:56:31", "remaining_time": "2:18:15"} -{"current_steps": 5850, "total_steps": 6590, "loss": 0.0005, "lr": 3.7920997503698318e-06, "epoch": 8.872037914691942, "percentage": 88.77, "elapsed_time": "17:57:48", "remaining_time": "2:16:20"} -{"current_steps": 5850, "total_steps": 6590, "eval_loss": 0.06765168160200119, "epoch": 8.872037914691942, "percentage": 88.77, "elapsed_time": "18:00:29", "remaining_time": "2:16:40"} -{"current_steps": 5860, "total_steps": 6590, "loss": 0.0005, "lr": 3.691574855872476e-06, "epoch": 8.887203791469194, "percentage": 88.92, "elapsed_time": "18:01:51", "remaining_time": "2:14:46"} -{"current_steps": 5870, "total_steps": 6590, "loss": 0.0001, "lr": 3.592349241794929e-06, "epoch": 8.902369668246445, "percentage": 89.07, "elapsed_time": "18:03:08", "remaining_time": "2:12:51"} -{"current_steps": 5880, "total_steps": 6590, "loss": 0.0015, "lr": 3.4944256921208064e-06, "epoch": 8.917535545023696, "percentage": 89.23, "elapsed_time": "18:04:26", "remaining_time": "2:10:56"} -{"current_steps": 5890, "total_steps": 6590, "loss": 0.0007, "lr": 3.3978069543015966e-06, "epoch": 8.932701421800948, "percentage": 89.38, "elapsed_time": "18:05:44", "remaining_time": "2:09:02"} -{"current_steps": 5900, "total_steps": 6590, "loss": 0.0008, "lr": 3.3024957391794897e-06, "epoch": 8.947867298578199, "percentage": 89.53, "elapsed_time": "18:07:02", "remaining_time": "2:07:07"} -{"current_steps": 5900, "total_steps": 6590, "eval_loss": 0.06804511696100235, "epoch": 8.947867298578199, "percentage": 89.53, "elapsed_time": "18:09:42", "remaining_time": "2:07:26"} -{"current_steps": 5910, "total_steps": 6590, "loss": 0.0015, "lr": 3.208494720911448e-06, "epoch": 8.96303317535545, "percentage": 89.68, "elapsed_time": "18:11:04", "remaining_time": "2:05:32"} -{"current_steps": 5920, "total_steps": 6590, "loss": 0.0017, "lr": 3.115806536894034e-06, "epoch": 8.978199052132702, "percentage": 89.83, "elapsed_time": "18:12:22", "remaining_time": "2:03:37"} -{"current_steps": 5930, "total_steps": 6590, "loss": 0.0003, "lr": 3.0244337876895124e-06, "epoch": 8.993364928909953, "percentage": 89.98, "elapsed_time": "18:13:40", "remaining_time": "2:01:43"} -{"current_steps": 5940, "total_steps": 6590, "loss": 0.0001, "lr": 2.9343790369528502e-06, "epoch": 9.008530805687204, "percentage": 90.14, "elapsed_time": "18:14:58", "remaining_time": "1:59:49"} -{"current_steps": 5950, "total_steps": 6590, "loss": 0.0007, "lr": 2.8456448113597657e-06, "epoch": 9.023696682464456, "percentage": 90.29, "elapsed_time": "18:16:15", "remaining_time": "1:57:55"} -{"current_steps": 5950, "total_steps": 6590, "eval_loss": 0.06828483194112778, "epoch": 9.023696682464456, "percentage": 90.29, "elapsed_time": "18:18:56", "remaining_time": "1:58:12"} -{"current_steps": 5960, "total_steps": 6590, "loss": 0.0004, "lr": 2.7582336005359144e-06, "epoch": 9.038862559241705, "percentage": 90.44, "elapsed_time": "18:20:19", "remaining_time": "1:56:18"} -{"current_steps": 5970, "total_steps": 6590, "loss": 0.0001, "lr": 2.6721478569869397e-06, "epoch": 9.054028436018957, "percentage": 90.59, "elapsed_time": "18:21:37", "remaining_time": "1:54:24"} -{"current_steps": 5980, "total_steps": 6590, "loss": 0.0002, "lr": 2.587389996029721e-06, "epoch": 9.069194312796208, "percentage": 90.74, "elapsed_time": "18:22:54", "remaining_time": "1:52:30"} -{"current_steps": 5990, "total_steps": 6590, "loss": 0.0016, "lr": 2.503962395724596e-06, "epoch": 9.08436018957346, "percentage": 90.9, "elapsed_time": "18:24:12", "remaining_time": "1:50:36"} -{"current_steps": 6000, "total_steps": 6590, "loss": 0.0002, "lr": 2.421867396808647e-06, "epoch": 9.09952606635071, "percentage": 91.05, "elapsed_time": "18:25:30", "remaining_time": "1:48:42"} -{"current_steps": 6000, "total_steps": 6590, "eval_loss": 0.06908756494522095, "epoch": 9.09952606635071, "percentage": 91.05, "elapsed_time": "18:28:10", "remaining_time": "1:48:58"} -{"current_steps": 6010, "total_steps": 6590, "loss": 0.0006, "lr": 2.3411073026299968e-06, "epoch": 9.114691943127962, "percentage": 91.2, "elapsed_time": "18:29:32", "remaining_time": "1:47:04"} -{"current_steps": 6020, "total_steps": 6590, "loss": 0.0018, "lr": 2.2616843790832287e-06, "epoch": 9.129857819905213, "percentage": 91.35, "elapsed_time": "18:30:50", "remaining_time": "1:45:10"} -{"current_steps": 6030, "total_steps": 6590, "loss": 0.0003, "lr": 2.1836008545457586e-06, "epoch": 9.145023696682465, "percentage": 91.5, "elapsed_time": "18:32:07", "remaining_time": "1:43:16"} -{"current_steps": 6040, "total_steps": 6590, "loss": 0.0015, "lr": 2.1068589198153686e-06, "epoch": 9.160189573459716, "percentage": 91.65, "elapsed_time": "18:33:25", "remaining_time": "1:41:23"} -{"current_steps": 6050, "total_steps": 6590, "loss": 0.0009, "lr": 2.0314607280486953e-06, "epoch": 9.175355450236967, "percentage": 91.81, "elapsed_time": "18:34:42", "remaining_time": "1:39:29"} -{"current_steps": 6050, "total_steps": 6590, "eval_loss": 0.06927720457315445, "epoch": 9.175355450236967, "percentage": 91.81, "elapsed_time": "18:37:23", "remaining_time": "1:39:44"} -{"current_steps": 6060, "total_steps": 6590, "loss": 0.0007, "lr": 1.957408394700844e-06, "epoch": 9.190521327014219, "percentage": 91.96, "elapsed_time": "18:38:45", "remaining_time": "1:37:50"} -{"current_steps": 6070, "total_steps": 6590, "loss": 0.0001, "lr": 1.8847039974660142e-06, "epoch": 9.205687203791468, "percentage": 92.11, "elapsed_time": "18:40:02", "remaining_time": "1:35:57"} -{"current_steps": 6080, "total_steps": 6590, "loss": 0.0001, "lr": 1.8133495762192421e-06, "epoch": 9.22085308056872, "percentage": 92.26, "elapsed_time": "18:41:20", "remaining_time": "1:34:03"} -{"current_steps": 6090, "total_steps": 6590, "loss": 0.0002, "lr": 1.7433471329591223e-06, "epoch": 9.236018957345971, "percentage": 92.41, "elapsed_time": "18:42:38", "remaining_time": "1:32:10"} -{"current_steps": 6100, "total_steps": 6590, "loss": 0.0007, "lr": 1.6746986317516645e-06, "epoch": 9.251184834123222, "percentage": 92.56, "elapsed_time": "18:43:55", "remaining_time": "1:30:16"} -{"current_steps": 6100, "total_steps": 6590, "eval_loss": 0.06962603330612183, "epoch": 9.251184834123222, "percentage": 92.56, "elapsed_time": "18:46:36", "remaining_time": "1:30:29"} -{"current_steps": 6110, "total_steps": 6590, "loss": 0.0002, "lr": 1.6074059986751765e-06, "epoch": 9.266350710900474, "percentage": 92.72, "elapsed_time": "18:47:58", "remaining_time": "1:28:36"} -{"current_steps": 6120, "total_steps": 6590, "loss": 0.0002, "lr": 1.5414711217662581e-06, "epoch": 9.281516587677725, "percentage": 92.87, "elapsed_time": "18:49:16", "remaining_time": "1:26:43"} -{"current_steps": 6130, "total_steps": 6590, "loss": 0.0007, "lr": 1.476895850966764e-06, "epoch": 9.296682464454976, "percentage": 93.02, "elapsed_time": "18:50:34", "remaining_time": "1:24:50"} -{"current_steps": 6140, "total_steps": 6590, "loss": 0.0001, "lr": 1.4136819980719474e-06, "epoch": 9.311848341232228, "percentage": 93.17, "elapsed_time": "18:51:52", "remaining_time": "1:22:57"} -{"current_steps": 6150, "total_steps": 6590, "loss": 0.0006, "lr": 1.3518313366796265e-06, "epoch": 9.327014218009479, "percentage": 93.32, "elapsed_time": "18:53:09", "remaining_time": "1:21:04"} -{"current_steps": 6150, "total_steps": 6590, "eval_loss": 0.07017911970615387, "epoch": 9.327014218009479, "percentage": 93.32, "elapsed_time": "18:55:50", "remaining_time": "1:21:15"} -{"current_steps": 6160, "total_steps": 6590, "loss": 0.0008, "lr": 1.2913456021403814e-06, "epoch": 9.34218009478673, "percentage": 93.47, "elapsed_time": "18:57:12", "remaining_time": "1:19:23"} -{"current_steps": 6170, "total_steps": 6590, "loss": 0.0007, "lr": 1.2322264915089365e-06, "epoch": 9.357345971563982, "percentage": 93.63, "elapsed_time": "18:58:30", "remaining_time": "1:17:29"} -{"current_steps": 6180, "total_steps": 6590, "loss": 0.0015, "lr": 1.174475663496466e-06, "epoch": 9.372511848341233, "percentage": 93.78, "elapsed_time": "18:59:48", "remaining_time": "1:15:37"} -{"current_steps": 6190, "total_steps": 6590, "loss": 0.0001, "lr": 1.1180947384241025e-06, "epoch": 9.387677725118483, "percentage": 93.93, "elapsed_time": "19:01:06", "remaining_time": "1:13:44"} -{"current_steps": 6200, "total_steps": 6590, "loss": 0.0002, "lr": 1.0630852981774797e-06, "epoch": 9.402843601895734, "percentage": 94.08, "elapsed_time": "19:02:23", "remaining_time": "1:11:51"} -{"current_steps": 6200, "total_steps": 6590, "eval_loss": 0.07030041515827179, "epoch": 9.402843601895734, "percentage": 94.08, "elapsed_time": "19:05:04", "remaining_time": "1:12:01"} -{"current_steps": 6210, "total_steps": 6590, "loss": 0.0003, "lr": 1.0094488861623175e-06, "epoch": 9.418009478672985, "percentage": 94.23, "elapsed_time": "19:06:27", "remaining_time": "1:10:09"} -{"current_steps": 6220, "total_steps": 6590, "loss": 0.0011, "lr": 9.571870072611567e-07, "epoch": 9.433175355450237, "percentage": 94.39, "elapsed_time": "19:07:44", "remaining_time": "1:08:16"} -{"current_steps": 6230, "total_steps": 6590, "loss": 0.0001, "lr": 9.063011277910871e-07, "epoch": 9.448341232227488, "percentage": 94.54, "elapsed_time": "19:09:02", "remaining_time": "1:06:23"} -{"current_steps": 6240, "total_steps": 6590, "loss": 0.0002, "lr": 8.567926754626587e-07, "epoch": 9.46350710900474, "percentage": 94.69, "elapsed_time": "19:10:20", "remaining_time": "1:04:31"} -{"current_steps": 6250, "total_steps": 6590, "loss": 0.0001, "lr": 8.086630393398075e-07, "epoch": 9.47867298578199, "percentage": 94.84, "elapsed_time": "19:11:38", "remaining_time": "1:02:38"} -{"current_steps": 6250, "total_steps": 6590, "eval_loss": 0.07060568034648895, "epoch": 9.47867298578199, "percentage": 94.84, "elapsed_time": "19:14:19", "remaining_time": "1:02:47"} -{"current_steps": 6260, "total_steps": 6590, "loss": 0.0001, "lr": 7.619135698008428e-07, "epoch": 9.493838862559242, "percentage": 94.99, "elapsed_time": "19:15:40", "remaining_time": "1:00:55"} -{"current_steps": 6270, "total_steps": 6590, "loss": 0.0001, "lr": 7.165455785006326e-07, "epoch": 9.509004739336493, "percentage": 95.14, "elapsed_time": "19:16:58", "remaining_time": "0:59:02"} -{"current_steps": 6280, "total_steps": 6590, "loss": 0.0003, "lr": 6.725603383337275e-07, "epoch": 9.524170616113745, "percentage": 95.3, "elapsed_time": "19:18:15", "remaining_time": "0:57:10"} -{"current_steps": 6290, "total_steps": 6590, "loss": 0.0004, "lr": 6.299590833987123e-07, "epoch": 9.539336492890996, "percentage": 95.45, "elapsed_time": "19:19:33", "remaining_time": "0:55:18"} -{"current_steps": 6300, "total_steps": 6590, "loss": 0.0006, "lr": 5.887430089635382e-07, "epoch": 9.554502369668246, "percentage": 95.6, "elapsed_time": "19:20:50", "remaining_time": "0:53:26"} -{"current_steps": 6300, "total_steps": 6590, "eval_loss": 0.07060205936431885, "epoch": 9.554502369668246, "percentage": 95.6, "elapsed_time": "19:23:31", "remaining_time": "0:53:33"} -{"current_steps": 6310, "total_steps": 6590, "loss": 0.0003, "lr": 5.489132714319833e-07, "epoch": 9.569668246445497, "percentage": 95.75, "elapsed_time": "19:24:53", "remaining_time": "0:51:41"} -{"current_steps": 6320, "total_steps": 6590, "loss": 0.0003, "lr": 5.104709883112513e-07, "epoch": 9.584834123222748, "percentage": 95.9, "elapsed_time": "19:26:10", "remaining_time": "0:49:49"} -{"current_steps": 6330, "total_steps": 6590, "loss": 0.0001, "lr": 4.7341723818056794e-07, "epoch": 9.6, "percentage": 96.05, "elapsed_time": "19:27:28", "remaining_time": "0:47:57"} -{"current_steps": 6340, "total_steps": 6590, "loss": 0.0003, "lr": 4.3775306066096146e-07, "epoch": 9.615165876777251, "percentage": 96.21, "elapsed_time": "19:28:46", "remaining_time": "0:46:05"} -{"current_steps": 6350, "total_steps": 6590, "loss": 0.0004, "lr": 4.034794563860522e-07, "epoch": 9.630331753554502, "percentage": 96.36, "elapsed_time": "19:30:03", "remaining_time": "0:44:13"} -{"current_steps": 6350, "total_steps": 6590, "eval_loss": 0.07052826881408691, "epoch": 9.630331753554502, "percentage": 96.36, "elapsed_time": "19:32:44", "remaining_time": "0:44:19"} -{"current_steps": 6360, "total_steps": 6590, "loss": 0.0004, "lr": 3.705973869740087e-07, "epoch": 9.645497630331754, "percentage": 96.51, "elapsed_time": "19:34:06", "remaining_time": "0:42:27"} -{"current_steps": 6370, "total_steps": 6590, "loss": 0.001, "lr": 3.3910777500056333e-07, "epoch": 9.660663507109005, "percentage": 96.66, "elapsed_time": "19:35:23", "remaining_time": "0:40:35"} -{"current_steps": 6380, "total_steps": 6590, "loss": 0.0001, "lr": 3.090115039731112e-07, "epoch": 9.675829383886256, "percentage": 96.81, "elapsed_time": "19:36:41", "remaining_time": "0:38:43"} -{"current_steps": 6390, "total_steps": 6590, "loss": 0.0004, "lr": 2.803094183059352e-07, "epoch": 9.690995260663508, "percentage": 96.97, "elapsed_time": "19:37:58", "remaining_time": "0:36:52"} -{"current_steps": 6400, "total_steps": 6590, "loss": 0.0008, "lr": 2.5300232329651395e-07, "epoch": 9.706161137440759, "percentage": 97.12, "elapsed_time": "19:39:16", "remaining_time": "0:35:00"} -{"current_steps": 6400, "total_steps": 6590, "eval_loss": 0.07091958820819855, "epoch": 9.706161137440759, "percentage": 97.12, "elapsed_time": "19:41:56", "remaining_time": "0:35:05"} -{"current_steps": 6410, "total_steps": 6590, "loss": 0.0011, "lr": 2.2709098510292348e-07, "epoch": 9.721327014218009, "percentage": 97.27, "elapsed_time": "19:43:18", "remaining_time": "0:33:13"} -{"current_steps": 6420, "total_steps": 6590, "loss": 0.0001, "lr": 2.0257613072233728e-07, "epoch": 9.73649289099526, "percentage": 97.42, "elapsed_time": "19:44:36", "remaining_time": "0:31:22"} -{"current_steps": 6430, "total_steps": 6590, "loss": 0.0001, "lr": 1.7945844797063737e-07, "epoch": 9.751658767772511, "percentage": 97.57, "elapsed_time": "19:45:54", "remaining_time": "0:29:30"} -{"current_steps": 6440, "total_steps": 6590, "loss": 0.0013, "lr": 1.5773858546311858e-07, "epoch": 9.766824644549763, "percentage": 97.72, "elapsed_time": "19:47:11", "remaining_time": "0:27:39"} -{"current_steps": 6450, "total_steps": 6590, "loss": 0.0004, "lr": 1.374171525962753e-07, "epoch": 9.781990521327014, "percentage": 97.88, "elapsed_time": "19:48:29", "remaining_time": "0:25:47"} -{"current_steps": 6450, "total_steps": 6590, "eval_loss": 0.07092708349227905, "epoch": 9.781990521327014, "percentage": 97.88, "elapsed_time": "19:51:09", "remaining_time": "0:25:51"} -{"current_steps": 6460, "total_steps": 6590, "loss": 0.0005, "lr": 1.1849471953070957e-07, "epoch": 9.797156398104265, "percentage": 98.03, "elapsed_time": "19:52:31", "remaining_time": "0:23:59"} -{"current_steps": 6470, "total_steps": 6590, "loss": 0.0001, "lr": 1.0097181717514947e-07, "epoch": 9.812322274881517, "percentage": 98.18, "elapsed_time": "19:53:49", "remaining_time": "0:22:08"} -{"current_steps": 6480, "total_steps": 6590, "loss": 0.0016, "lr": 8.484893717153331e-08, "epoch": 9.827488151658768, "percentage": 98.33, "elapsed_time": "19:55:06", "remaining_time": "0:20:17"} -{"current_steps": 6490, "total_steps": 6590, "loss": 0.0009, "lr": 7.012653188122053e-08, "epoch": 9.84265402843602, "percentage": 98.48, "elapsed_time": "19:56:24", "remaining_time": "0:18:26"} -{"current_steps": 6500, "total_steps": 6590, "loss": 0.0002, "lr": 5.6805014372307564e-08, "epoch": 9.85781990521327, "percentage": 98.63, "elapsed_time": "19:57:42", "remaining_time": "0:16:35"} -{"current_steps": 6500, "total_steps": 6590, "eval_loss": 0.07085718214511871, "epoch": 9.85781990521327, "percentage": 98.63, "elapsed_time": "20:00:23", "remaining_time": "0:16:37"} -{"current_steps": 6510, "total_steps": 6590, "loss": 0.0001, "lr": 4.488475840803141e-08, "epoch": 9.872985781990522, "percentage": 98.79, "elapsed_time": "20:01:45", "remaining_time": "0:14:46"} -{"current_steps": 6520, "total_steps": 6590, "loss": 0.0002, "lr": 3.436609843628369e-08, "epoch": 9.888151658767772, "percentage": 98.94, "elapsed_time": "20:03:02", "remaining_time": "0:12:54"} -{"current_steps": 6530, "total_steps": 6590, "loss": 0.0004, "lr": 2.5249329580229185e-08, "epoch": 9.903317535545023, "percentage": 99.09, "elapsed_time": "20:04:20", "remaining_time": "0:11:03"} -{"current_steps": 6540, "total_steps": 6590, "loss": 0.0004, "lr": 1.753470763002363e-08, "epoch": 9.918483412322274, "percentage": 99.24, "elapsed_time": "20:05:38", "remaining_time": "0:09:13"} -{"current_steps": 6550, "total_steps": 6590, "loss": 0.0001, "lr": 1.1222449035630522e-08, "epoch": 9.933649289099526, "percentage": 99.39, "elapsed_time": "20:06:55", "remaining_time": "0:07:22"} -{"current_steps": 6550, "total_steps": 6590, "eval_loss": 0.07075422257184982, "epoch": 9.933649289099526, "percentage": 99.39, "elapsed_time": "20:09:36", "remaining_time": "0:07:23"} -{"current_steps": 6560, "total_steps": 6590, "loss": 0.0004, "lr": 6.312730900770447e-09, "epoch": 9.948815165876777, "percentage": 99.54, "elapsed_time": "20:10:57", "remaining_time": "0:05:32"} -{"current_steps": 6570, "total_steps": 6590, "loss": 0.0002, "lr": 2.8056909779250463e-09, "epoch": 9.963981042654028, "percentage": 99.7, "elapsed_time": "20:12:15", "remaining_time": "0:03:41"} -{"current_steps": 6580, "total_steps": 6590, "loss": 0.0011, "lr": 7.014276644901063e-10, "epoch": 9.97914691943128, "percentage": 99.85, "elapsed_time": "20:13:33", "remaining_time": "0:01:50"} -{"current_steps": 6590, "total_steps": 6590, "loss": 0.0003, "lr": 0.0, "epoch": 9.994312796208531, "percentage": 100.0, "elapsed_time": "20:14:51", "remaining_time": "0:00:00"} -{"current_steps": 6590, "total_steps": 6590, "epoch": 9.994312796208531, "percentage": 100.0, "elapsed_time": "20:14:56", "remaining_time": "0:00:00"} +{"current_steps": 10, "total_steps": 3295, "loss": 1.5168, "lr": 3.0303030303030305e-06, "epoch": 0.015165876777251185, "percentage": 0.3, "elapsed_time": "0:01:16", "remaining_time": "7:00:04"} +{"current_steps": 20, "total_steps": 3295, "loss": 1.4858, "lr": 6.060606060606061e-06, "epoch": 0.03033175355450237, "percentage": 0.61, "elapsed_time": "0:02:32", "remaining_time": "6:56:25"} +{"current_steps": 30, "total_steps": 3295, "loss": 1.384, "lr": 9.090909090909091e-06, "epoch": 0.04549763033175355, "percentage": 0.91, "elapsed_time": "0:03:47", "remaining_time": "6:53:27"} +{"current_steps": 40, "total_steps": 3295, "loss": 0.8608, "lr": 1.2121212121212122e-05, "epoch": 0.06066350710900474, "percentage": 1.21, "elapsed_time": "0:05:03", "remaining_time": "6:51:31"} +{"current_steps": 50, "total_steps": 3295, "loss": 0.6474, "lr": 1.5151515151515153e-05, "epoch": 0.07582938388625593, "percentage": 1.52, "elapsed_time": "0:06:19", "remaining_time": "6:50:07"} +{"current_steps": 50, "total_steps": 3295, "eval_loss": 0.41726887226104736, "epoch": 0.07582938388625593, "percentage": 1.52, "elapsed_time": "0:08:56", "remaining_time": "9:39:56"}