| {"current_steps": 10, "total_steps": 1200, "loss": 1.1278, "lr": 5e-06, "epoch": 0.025, "percentage": 0.83, "elapsed_time": "0:05:33", "remaining_time": "11:01:36"} | |
| {"current_steps": 20, "total_steps": 1200, "loss": 1.0093, "lr": 5e-06, "epoch": 0.05, "percentage": 1.67, "elapsed_time": "0:10:57", "remaining_time": "10:46:57"} | |
| {"current_steps": 30, "total_steps": 1200, "loss": 0.9776, "lr": 5e-06, "epoch": 0.075, "percentage": 2.5, "elapsed_time": "0:16:20", "remaining_time": "10:37:25"} | |
| {"current_steps": 40, "total_steps": 1200, "loss": 0.9461, "lr": 5e-06, "epoch": 0.1, "percentage": 3.33, "elapsed_time": "0:21:43", "remaining_time": "10:30:11"} | |
| {"current_steps": 50, "total_steps": 1200, "loss": 0.9341, "lr": 5e-06, "epoch": 0.125, "percentage": 4.17, "elapsed_time": "0:27:07", "remaining_time": "10:23:41"} | |
| {"current_steps": 60, "total_steps": 1200, "loss": 0.9133, "lr": 5e-06, "epoch": 0.15, "percentage": 5.0, "elapsed_time": "0:32:31", "remaining_time": "10:17:51"} | |
| {"current_steps": 70, "total_steps": 1200, "loss": 0.9034, "lr": 5e-06, "epoch": 0.175, "percentage": 5.83, "elapsed_time": "0:37:53", "remaining_time": "10:11:46"} | |
| {"current_steps": 80, "total_steps": 1200, "loss": 0.8946, "lr": 5e-06, "epoch": 0.2, "percentage": 6.67, "elapsed_time": "0:43:16", "remaining_time": "10:05:52"} | |
| {"current_steps": 90, "total_steps": 1200, "loss": 0.8897, "lr": 5e-06, "epoch": 0.225, "percentage": 7.5, "elapsed_time": "0:48:40", "remaining_time": "10:00:15"} | |
| {"current_steps": 100, "total_steps": 1200, "loss": 0.8838, "lr": 5e-06, "epoch": 0.25, "percentage": 8.33, "elapsed_time": "0:54:02", "remaining_time": "9:54:26"} | |
| {"current_steps": 110, "total_steps": 1200, "loss": 0.8804, "lr": 5e-06, "epoch": 0.275, "percentage": 9.17, "elapsed_time": "0:59:26", "remaining_time": "9:49:00"} | |
| {"current_steps": 120, "total_steps": 1200, "loss": 0.8742, "lr": 5e-06, "epoch": 0.3, "percentage": 10.0, "elapsed_time": "1:04:52", "remaining_time": "9:43:51"} | |
| {"current_steps": 130, "total_steps": 1200, "loss": 0.8689, "lr": 5e-06, "epoch": 0.325, "percentage": 10.83, "elapsed_time": "1:10:16", "remaining_time": "9:38:24"} | |
| {"current_steps": 140, "total_steps": 1200, "loss": 0.8664, "lr": 5e-06, "epoch": 0.35, "percentage": 11.67, "elapsed_time": "1:15:41", "remaining_time": "9:33:04"} | |
| {"current_steps": 150, "total_steps": 1200, "loss": 0.8647, "lr": 5e-06, "epoch": 0.375, "percentage": 12.5, "elapsed_time": "1:21:09", "remaining_time": "9:28:06"} | |
| {"current_steps": 160, "total_steps": 1200, "loss": 0.8614, "lr": 5e-06, "epoch": 0.4, "percentage": 13.33, "elapsed_time": "1:26:35", "remaining_time": "9:22:50"} | |
| {"current_steps": 170, "total_steps": 1200, "loss": 0.8591, "lr": 5e-06, "epoch": 0.425, "percentage": 14.17, "elapsed_time": "1:32:01", "remaining_time": "9:17:36"} | |
| {"current_steps": 180, "total_steps": 1200, "loss": 0.8538, "lr": 5e-06, "epoch": 0.45, "percentage": 15.0, "elapsed_time": "1:37:27", "remaining_time": "9:12:16"} | |
| {"current_steps": 190, "total_steps": 1200, "loss": 0.8519, "lr": 5e-06, "epoch": 0.475, "percentage": 15.83, "elapsed_time": "1:42:55", "remaining_time": "9:07:06"} | |
| {"current_steps": 200, "total_steps": 1200, "loss": 0.8519, "lr": 5e-06, "epoch": 0.5, "percentage": 16.67, "elapsed_time": "1:48:21", "remaining_time": "9:01:46"} | |
| {"current_steps": 210, "total_steps": 1200, "loss": 0.8486, "lr": 5e-06, "epoch": 0.525, "percentage": 17.5, "elapsed_time": "1:53:47", "remaining_time": "8:56:24"} | |
| {"current_steps": 220, "total_steps": 1200, "loss": 0.844, "lr": 5e-06, "epoch": 0.55, "percentage": 18.33, "elapsed_time": "1:59:12", "remaining_time": "8:51:02"} | |
| {"current_steps": 230, "total_steps": 1200, "loss": 0.8447, "lr": 5e-06, "epoch": 0.575, "percentage": 19.17, "elapsed_time": "2:04:39", "remaining_time": "8:45:46"} | |
| {"current_steps": 240, "total_steps": 1200, "loss": 0.8448, "lr": 5e-06, "epoch": 0.6, "percentage": 20.0, "elapsed_time": "2:10:07", "remaining_time": "8:40:29"} | |
| {"current_steps": 250, "total_steps": 1200, "loss": 0.8415, "lr": 5e-06, "epoch": 0.625, "percentage": 20.83, "elapsed_time": "2:15:34", "remaining_time": "8:35:11"} | |
| {"current_steps": 260, "total_steps": 1200, "loss": 0.8412, "lr": 5e-06, "epoch": 0.65, "percentage": 21.67, "elapsed_time": "2:21:00", "remaining_time": "8:29:46"} | |
| {"current_steps": 270, "total_steps": 1200, "loss": 0.8446, "lr": 5e-06, "epoch": 0.675, "percentage": 22.5, "elapsed_time": "2:26:27", "remaining_time": "8:24:27"} | |
| {"current_steps": 280, "total_steps": 1200, "loss": 0.8371, "lr": 5e-06, "epoch": 0.7, "percentage": 23.33, "elapsed_time": "2:31:53", "remaining_time": "8:19:05"} | |
| {"current_steps": 290, "total_steps": 1200, "loss": 0.8368, "lr": 5e-06, "epoch": 0.725, "percentage": 24.17, "elapsed_time": "2:37:21", "remaining_time": "8:13:46"} | |
| {"current_steps": 300, "total_steps": 1200, "loss": 0.8384, "lr": 5e-06, "epoch": 0.75, "percentage": 25.0, "elapsed_time": "2:42:48", "remaining_time": "8:08:24"} | |
| {"current_steps": 310, "total_steps": 1200, "loss": 0.8346, "lr": 5e-06, "epoch": 0.775, "percentage": 25.83, "elapsed_time": "2:48:14", "remaining_time": "8:02:59"} | |
| {"current_steps": 320, "total_steps": 1200, "loss": 0.8331, "lr": 5e-06, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "2:53:39", "remaining_time": "7:57:32"} | |
| {"current_steps": 330, "total_steps": 1200, "loss": 0.8324, "lr": 5e-06, "epoch": 0.825, "percentage": 27.5, "elapsed_time": "2:59:07", "remaining_time": "7:52:13"} | |
| {"current_steps": 340, "total_steps": 1200, "loss": 0.8354, "lr": 5e-06, "epoch": 0.85, "percentage": 28.33, "elapsed_time": "3:04:33", "remaining_time": "7:46:49"} | |
| {"current_steps": 350, "total_steps": 1200, "loss": 0.829, "lr": 5e-06, "epoch": 0.875, "percentage": 29.17, "elapsed_time": "3:09:59", "remaining_time": "7:41:25"} | |
| {"current_steps": 360, "total_steps": 1200, "loss": 0.8307, "lr": 5e-06, "epoch": 0.9, "percentage": 30.0, "elapsed_time": "3:15:26", "remaining_time": "7:36:02"} | |
| {"current_steps": 370, "total_steps": 1200, "loss": 0.8267, "lr": 5e-06, "epoch": 0.925, "percentage": 30.83, "elapsed_time": "3:20:53", "remaining_time": "7:30:38"} | |
| {"current_steps": 380, "total_steps": 1200, "loss": 0.8247, "lr": 5e-06, "epoch": 0.95, "percentage": 31.67, "elapsed_time": "3:26:19", "remaining_time": "7:25:13"} | |
| {"current_steps": 390, "total_steps": 1200, "loss": 0.8256, "lr": 5e-06, "epoch": 0.975, "percentage": 32.5, "elapsed_time": "3:31:46", "remaining_time": "7:19:50"} | |
| {"current_steps": 400, "total_steps": 1200, "loss": 0.8272, "lr": 5e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:37:12", "remaining_time": "7:14:24"} | |
| {"current_steps": 400, "total_steps": 1200, "eval_loss": 0.8262304067611694, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:41:55", "remaining_time": "7:23:51"} | |
| {"current_steps": 410, "total_steps": 1200, "loss": 0.7842, "lr": 5e-06, "epoch": 1.025, "percentage": 34.17, "elapsed_time": "3:48:33", "remaining_time": "7:20:23"} | |
| {"current_steps": 420, "total_steps": 1200, "loss": 0.7849, "lr": 5e-06, "epoch": 1.05, "percentage": 35.0, "elapsed_time": "3:53:59", "remaining_time": "7:14:33"} | |
| {"current_steps": 430, "total_steps": 1200, "loss": 0.7849, "lr": 5e-06, "epoch": 1.075, "percentage": 35.83, "elapsed_time": "3:59:26", "remaining_time": "7:08:45"} | |
| {"current_steps": 440, "total_steps": 1200, "loss": 0.779, "lr": 5e-06, "epoch": 1.1, "percentage": 36.67, "elapsed_time": "4:04:52", "remaining_time": "7:02:57"} | |
| {"current_steps": 450, "total_steps": 1200, "loss": 0.7831, "lr": 5e-06, "epoch": 1.125, "percentage": 37.5, "elapsed_time": "4:10:19", "remaining_time": "6:57:12"} | |
| {"current_steps": 460, "total_steps": 1200, "loss": 0.7818, "lr": 5e-06, "epoch": 1.15, "percentage": 38.33, "elapsed_time": "4:15:47", "remaining_time": "6:51:28"} | |
| {"current_steps": 470, "total_steps": 1200, "loss": 0.7772, "lr": 5e-06, "epoch": 1.175, "percentage": 39.17, "elapsed_time": "4:21:14", "remaining_time": "6:45:46"} | |
| {"current_steps": 480, "total_steps": 1200, "loss": 0.7813, "lr": 5e-06, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "4:26:41", "remaining_time": "6:40:01"} | |
| {"current_steps": 490, "total_steps": 1200, "loss": 0.7836, "lr": 5e-06, "epoch": 1.225, "percentage": 40.83, "elapsed_time": "4:32:07", "remaining_time": "6:34:18"} | |
| {"current_steps": 500, "total_steps": 1200, "loss": 0.7801, "lr": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "4:37:33", "remaining_time": "6:28:34"} | |
| {"current_steps": 510, "total_steps": 1200, "loss": 0.7806, "lr": 5e-06, "epoch": 1.275, "percentage": 42.5, "elapsed_time": "4:42:59", "remaining_time": "6:22:51"} | |
| {"current_steps": 520, "total_steps": 1200, "loss": 0.7776, "lr": 5e-06, "epoch": 1.3, "percentage": 43.33, "elapsed_time": "4:48:25", "remaining_time": "6:17:10"} | |
| {"current_steps": 530, "total_steps": 1200, "loss": 0.7796, "lr": 5e-06, "epoch": 1.325, "percentage": 44.17, "elapsed_time": "4:53:52", "remaining_time": "6:11:29"} | |
| {"current_steps": 540, "total_steps": 1200, "loss": 0.7823, "lr": 5e-06, "epoch": 1.35, "percentage": 45.0, "elapsed_time": "4:59:18", "remaining_time": "6:05:49"} | |
| {"current_steps": 550, "total_steps": 1200, "loss": 0.7783, "lr": 5e-06, "epoch": 1.375, "percentage": 45.83, "elapsed_time": "5:04:43", "remaining_time": "6:00:08"} | |
| {"current_steps": 560, "total_steps": 1200, "loss": 0.7755, "lr": 5e-06, "epoch": 1.4, "percentage": 46.67, "elapsed_time": "5:10:11", "remaining_time": "5:54:30"} | |
| {"current_steps": 570, "total_steps": 1200, "loss": 0.7811, "lr": 5e-06, "epoch": 1.425, "percentage": 47.5, "elapsed_time": "5:15:38", "remaining_time": "5:48:52"} | |
| {"current_steps": 580, "total_steps": 1200, "loss": 0.7783, "lr": 5e-06, "epoch": 1.45, "percentage": 48.33, "elapsed_time": "5:21:06", "remaining_time": "5:43:14"} | |
| {"current_steps": 590, "total_steps": 1200, "loss": 0.7789, "lr": 5e-06, "epoch": 1.475, "percentage": 49.17, "elapsed_time": "5:26:31", "remaining_time": "5:37:35"} | |
| {"current_steps": 600, "total_steps": 1200, "loss": 0.7732, "lr": 5e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "5:31:56", "remaining_time": "5:31:56"} | |
| {"current_steps": 610, "total_steps": 1200, "loss": 0.7803, "lr": 5e-06, "epoch": 1.525, "percentage": 50.83, "elapsed_time": "5:37:22", "remaining_time": "5:26:19"} | |
| {"current_steps": 620, "total_steps": 1200, "loss": 0.7771, "lr": 5e-06, "epoch": 1.55, "percentage": 51.67, "elapsed_time": "5:42:50", "remaining_time": "5:20:43"} | |
| {"current_steps": 630, "total_steps": 1200, "loss": 0.7781, "lr": 5e-06, "epoch": 1.575, "percentage": 52.5, "elapsed_time": "5:48:16", "remaining_time": "5:15:06"} | |
| {"current_steps": 640, "total_steps": 1200, "loss": 0.7803, "lr": 5e-06, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "5:53:43", "remaining_time": "5:09:30"} | |
| {"current_steps": 650, "total_steps": 1200, "loss": 0.7755, "lr": 5e-06, "epoch": 1.625, "percentage": 54.17, "elapsed_time": "5:59:07", "remaining_time": "5:03:52"} | |
| {"current_steps": 660, "total_steps": 1200, "loss": 0.7784, "lr": 5e-06, "epoch": 1.65, "percentage": 55.0, "elapsed_time": "6:04:34", "remaining_time": "4:58:17"} | |
| {"current_steps": 670, "total_steps": 1200, "loss": 0.7798, "lr": 5e-06, "epoch": 1.675, "percentage": 55.83, "elapsed_time": "6:10:01", "remaining_time": "4:52:42"} | |
| {"current_steps": 680, "total_steps": 1200, "loss": 0.7779, "lr": 5e-06, "epoch": 1.7, "percentage": 56.67, "elapsed_time": "6:15:28", "remaining_time": "4:47:07"} | |
| {"current_steps": 690, "total_steps": 1200, "loss": 0.7743, "lr": 5e-06, "epoch": 1.725, "percentage": 57.5, "elapsed_time": "6:20:56", "remaining_time": "4:41:33"} | |
| {"current_steps": 700, "total_steps": 1200, "loss": 0.7764, "lr": 5e-06, "epoch": 1.75, "percentage": 58.33, "elapsed_time": "6:26:23", "remaining_time": "4:35:59"} | |
| {"current_steps": 710, "total_steps": 1200, "loss": 0.7743, "lr": 5e-06, "epoch": 1.775, "percentage": 59.17, "elapsed_time": "6:31:50", "remaining_time": "4:30:25"} | |
| {"current_steps": 720, "total_steps": 1200, "loss": 0.7795, "lr": 5e-06, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "6:37:17", "remaining_time": "4:24:51"} | |
| {"current_steps": 730, "total_steps": 1200, "loss": 0.7727, "lr": 5e-06, "epoch": 1.825, "percentage": 60.83, "elapsed_time": "6:42:44", "remaining_time": "4:19:17"} | |
| {"current_steps": 740, "total_steps": 1200, "loss": 0.7716, "lr": 5e-06, "epoch": 1.85, "percentage": 61.67, "elapsed_time": "6:48:11", "remaining_time": "4:13:44"} | |
| {"current_steps": 750, "total_steps": 1200, "loss": 0.7759, "lr": 5e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "6:53:38", "remaining_time": "4:08:11"} | |
| {"current_steps": 760, "total_steps": 1200, "loss": 0.7725, "lr": 5e-06, "epoch": 1.9, "percentage": 63.33, "elapsed_time": "6:59:03", "remaining_time": "4:02:36"} | |
| {"current_steps": 770, "total_steps": 1200, "loss": 0.7746, "lr": 5e-06, "epoch": 1.925, "percentage": 64.17, "elapsed_time": "7:04:28", "remaining_time": "3:57:02"} | |
| {"current_steps": 780, "total_steps": 1200, "loss": 0.7762, "lr": 5e-06, "epoch": 1.95, "percentage": 65.0, "elapsed_time": "7:09:54", "remaining_time": "3:51:29"} | |
| {"current_steps": 790, "total_steps": 1200, "loss": 0.771, "lr": 5e-06, "epoch": 1.975, "percentage": 65.83, "elapsed_time": "7:15:21", "remaining_time": "3:45:56"} | |
| {"current_steps": 800, "total_steps": 1200, "loss": 0.7753, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:20:47", "remaining_time": "3:40:23"} | |
| {"current_steps": 800, "total_steps": 1200, "eval_loss": 0.8092445731163025, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:25:26", "remaining_time": "3:42:43"} | |
| {"current_steps": 810, "total_steps": 1200, "loss": 0.731, "lr": 5e-06, "epoch": 2.025, "percentage": 67.5, "elapsed_time": "7:32:09", "remaining_time": "3:37:42"} | |
| {"current_steps": 820, "total_steps": 1200, "loss": 0.7254, "lr": 5e-06, "epoch": 2.05, "percentage": 68.33, "elapsed_time": "7:37:36", "remaining_time": "3:32:03"} | |
| {"current_steps": 830, "total_steps": 1200, "loss": 0.722, "lr": 5e-06, "epoch": 2.075, "percentage": 69.17, "elapsed_time": "7:43:02", "remaining_time": "3:26:25"} | |
| {"current_steps": 840, "total_steps": 1200, "loss": 0.7251, "lr": 5e-06, "epoch": 2.1, "percentage": 70.0, "elapsed_time": "7:48:30", "remaining_time": "3:20:47"} | |
| {"current_steps": 850, "total_steps": 1200, "loss": 0.7329, "lr": 5e-06, "epoch": 2.125, "percentage": 70.83, "elapsed_time": "7:53:56", "remaining_time": "3:15:08"} | |
| {"current_steps": 860, "total_steps": 1200, "loss": 0.7282, "lr": 5e-06, "epoch": 2.15, "percentage": 71.67, "elapsed_time": "7:59:23", "remaining_time": "3:09:31"} | |
| {"current_steps": 870, "total_steps": 1200, "loss": 0.7283, "lr": 5e-06, "epoch": 2.175, "percentage": 72.5, "elapsed_time": "8:04:49", "remaining_time": "3:03:53"} | |
| {"current_steps": 880, "total_steps": 1200, "loss": 0.7333, "lr": 5e-06, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "8:10:13", "remaining_time": "2:58:15"} | |
| {"current_steps": 890, "total_steps": 1200, "loss": 0.7307, "lr": 5e-06, "epoch": 2.225, "percentage": 74.17, "elapsed_time": "8:15:38", "remaining_time": "2:52:38"} | |
| {"current_steps": 900, "total_steps": 1200, "loss": 0.7276, "lr": 5e-06, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "8:21:02", "remaining_time": "2:47:00"} | |
| {"current_steps": 910, "total_steps": 1200, "loss": 0.7284, "lr": 5e-06, "epoch": 2.275, "percentage": 75.83, "elapsed_time": "8:26:27", "remaining_time": "2:41:23"} | |
| {"current_steps": 920, "total_steps": 1200, "loss": 0.7287, "lr": 5e-06, "epoch": 2.3, "percentage": 76.67, "elapsed_time": "8:31:53", "remaining_time": "2:35:47"} | |
| {"current_steps": 930, "total_steps": 1200, "loss": 0.7272, "lr": 5e-06, "epoch": 2.325, "percentage": 77.5, "elapsed_time": "8:37:20", "remaining_time": "2:30:11"} | |
| {"current_steps": 940, "total_steps": 1200, "loss": 0.7301, "lr": 5e-06, "epoch": 2.35, "percentage": 78.33, "elapsed_time": "8:42:47", "remaining_time": "2:24:36"} | |
| {"current_steps": 950, "total_steps": 1200, "loss": 0.7333, "lr": 5e-06, "epoch": 2.375, "percentage": 79.17, "elapsed_time": "8:48:14", "remaining_time": "2:19:00"} | |
| {"current_steps": 960, "total_steps": 1200, "loss": 0.7279, "lr": 5e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "8:53:42", "remaining_time": "2:13:25"} | |
| {"current_steps": 970, "total_steps": 1200, "loss": 0.7307, "lr": 5e-06, "epoch": 2.425, "percentage": 80.83, "elapsed_time": "8:59:10", "remaining_time": "2:07:50"} | |
| {"current_steps": 980, "total_steps": 1200, "loss": 0.727, "lr": 5e-06, "epoch": 2.45, "percentage": 81.67, "elapsed_time": "9:04:36", "remaining_time": "2:02:15"} | |
| {"current_steps": 990, "total_steps": 1200, "loss": 0.7315, "lr": 5e-06, "epoch": 2.475, "percentage": 82.5, "elapsed_time": "9:10:02", "remaining_time": "1:56:40"} | |
| {"current_steps": 1000, "total_steps": 1200, "loss": 0.732, "lr": 5e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "9:15:29", "remaining_time": "1:51:05"} | |
| {"current_steps": 1010, "total_steps": 1200, "loss": 0.7301, "lr": 5e-06, "epoch": 2.525, "percentage": 84.17, "elapsed_time": "9:20:55", "remaining_time": "1:45:31"} | |
| {"current_steps": 1020, "total_steps": 1200, "loss": 0.727, "lr": 5e-06, "epoch": 2.55, "percentage": 85.0, "elapsed_time": "9:26:22", "remaining_time": "1:39:56"} | |
| {"current_steps": 1030, "total_steps": 1200, "loss": 0.732, "lr": 5e-06, "epoch": 2.575, "percentage": 85.83, "elapsed_time": "9:31:49", "remaining_time": "1:34:22"} | |
| {"current_steps": 1040, "total_steps": 1200, "loss": 0.7304, "lr": 5e-06, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "9:37:16", "remaining_time": "1:28:48"} | |
| {"current_steps": 1050, "total_steps": 1200, "loss": 0.7301, "lr": 5e-06, "epoch": 2.625, "percentage": 87.5, "elapsed_time": "9:42:43", "remaining_time": "1:23:14"} | |
| {"current_steps": 1060, "total_steps": 1200, "loss": 0.7303, "lr": 5e-06, "epoch": 2.65, "percentage": 88.33, "elapsed_time": "9:48:10", "remaining_time": "1:17:40"} | |
| {"current_steps": 1070, "total_steps": 1200, "loss": 0.7352, "lr": 5e-06, "epoch": 2.675, "percentage": 89.17, "elapsed_time": "9:53:35", "remaining_time": "1:12:07"} | |
| {"current_steps": 1080, "total_steps": 1200, "loss": 0.7325, "lr": 5e-06, "epoch": 2.7, "percentage": 90.0, "elapsed_time": "9:59:01", "remaining_time": "1:06:33"} | |
| {"current_steps": 1090, "total_steps": 1200, "loss": 0.7297, "lr": 5e-06, "epoch": 2.725, "percentage": 90.83, "elapsed_time": "10:04:28", "remaining_time": "1:01:00"} | |
| {"current_steps": 1100, "total_steps": 1200, "loss": 0.7302, "lr": 5e-06, "epoch": 2.75, "percentage": 91.67, "elapsed_time": "10:09:54", "remaining_time": "0:55:26"} | |
| {"current_steps": 1110, "total_steps": 1200, "loss": 0.7338, "lr": 5e-06, "epoch": 2.775, "percentage": 92.5, "elapsed_time": "10:15:22", "remaining_time": "0:49:53"} | |
| {"current_steps": 1120, "total_steps": 1200, "loss": 0.7333, "lr": 5e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "10:20:49", "remaining_time": "0:44:20"} | |
| {"current_steps": 1130, "total_steps": 1200, "loss": 0.7368, "lr": 5e-06, "epoch": 2.825, "percentage": 94.17, "elapsed_time": "10:26:17", "remaining_time": "0:38:47"} | |
| {"current_steps": 1140, "total_steps": 1200, "loss": 0.7315, "lr": 5e-06, "epoch": 2.85, "percentage": 95.0, "elapsed_time": "10:31:44", "remaining_time": "0:33:14"} | |
| {"current_steps": 1150, "total_steps": 1200, "loss": 0.7328, "lr": 5e-06, "epoch": 2.875, "percentage": 95.83, "elapsed_time": "10:37:11", "remaining_time": "0:27:42"} | |
| {"current_steps": 1160, "total_steps": 1200, "loss": 0.7335, "lr": 5e-06, "epoch": 2.9, "percentage": 96.67, "elapsed_time": "10:42:37", "remaining_time": "0:22:09"} | |
| {"current_steps": 1170, "total_steps": 1200, "loss": 0.7296, "lr": 5e-06, "epoch": 2.925, "percentage": 97.5, "elapsed_time": "10:48:03", "remaining_time": "0:16:37"} | |
| {"current_steps": 1180, "total_steps": 1200, "loss": 0.7336, "lr": 5e-06, "epoch": 2.95, "percentage": 98.33, "elapsed_time": "10:53:30", "remaining_time": "0:11:04"} | |
| {"current_steps": 1190, "total_steps": 1200, "loss": 0.7316, "lr": 5e-06, "epoch": 2.975, "percentage": 99.17, "elapsed_time": "10:58:57", "remaining_time": "0:05:32"} | |
| {"current_steps": 1200, "total_steps": 1200, "loss": 0.7331, "lr": 5e-06, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "11:04:21", "remaining_time": "0:00:00"} | |
| {"current_steps": 1200, "total_steps": 1200, "eval_loss": 0.8070117235183716, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "11:10:12", "remaining_time": "0:00:00"} | |
| {"current_steps": 1200, "total_steps": 1200, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "11:11:47", "remaining_time": "0:00:00"} | |