File size: 21,965 Bytes
c84107e 2910f76 2c2263a f647994 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 | {"current_steps": 10, "total_steps": 1197, "loss": 1.0783, "lr": 5e-06, "epoch": 0.025031289111389236, "percentage": 0.84, "elapsed_time": "0:05:23", "remaining_time": "10:39:35"}
{"current_steps": 20, "total_steps": 1197, "loss": 0.9676, "lr": 5e-06, "epoch": 0.05006257822277847, "percentage": 1.67, "elapsed_time": "0:10:39", "remaining_time": "10:27:40"}
{"current_steps": 30, "total_steps": 1197, "loss": 0.9339, "lr": 5e-06, "epoch": 0.07509386733416772, "percentage": 2.51, "elapsed_time": "0:15:56", "remaining_time": "10:20:10"}
{"current_steps": 40, "total_steps": 1197, "loss": 0.9069, "lr": 5e-06, "epoch": 0.10012515644555695, "percentage": 3.34, "elapsed_time": "0:21:12", "remaining_time": "10:13:29"}
{"current_steps": 50, "total_steps": 1197, "loss": 0.8873, "lr": 5e-06, "epoch": 0.1251564455569462, "percentage": 4.18, "elapsed_time": "0:26:29", "remaining_time": "10:07:47"}
{"current_steps": 60, "total_steps": 1197, "loss": 0.8743, "lr": 5e-06, "epoch": 0.15018773466833543, "percentage": 5.01, "elapsed_time": "0:31:47", "remaining_time": "10:02:26"}
{"current_steps": 70, "total_steps": 1197, "loss": 0.8694, "lr": 5e-06, "epoch": 0.17521902377972465, "percentage": 5.85, "elapsed_time": "0:37:05", "remaining_time": "9:57:05"}
{"current_steps": 80, "total_steps": 1197, "loss": 0.8554, "lr": 5e-06, "epoch": 0.2002503128911139, "percentage": 6.68, "elapsed_time": "0:42:19", "remaining_time": "9:50:56"}
{"current_steps": 90, "total_steps": 1197, "loss": 0.8509, "lr": 5e-06, "epoch": 0.22528160200250313, "percentage": 7.52, "elapsed_time": "0:47:33", "remaining_time": "9:45:00"}
{"current_steps": 100, "total_steps": 1197, "loss": 0.8447, "lr": 5e-06, "epoch": 0.2503128911138924, "percentage": 8.35, "elapsed_time": "0:52:49", "remaining_time": "9:39:32"}
{"current_steps": 110, "total_steps": 1197, "loss": 0.8397, "lr": 5e-06, "epoch": 0.2753441802252816, "percentage": 9.19, "elapsed_time": "0:58:05", "remaining_time": "9:34:00"}
{"current_steps": 120, "total_steps": 1197, "loss": 0.8363, "lr": 5e-06, "epoch": 0.30037546933667086, "percentage": 10.03, "elapsed_time": "1:03:20", "remaining_time": "9:28:31"}
{"current_steps": 130, "total_steps": 1197, "loss": 0.8331, "lr": 5e-06, "epoch": 0.32540675844806005, "percentage": 10.86, "elapsed_time": "1:08:36", "remaining_time": "9:23:09"}
{"current_steps": 140, "total_steps": 1197, "loss": 0.8319, "lr": 5e-06, "epoch": 0.3504380475594493, "percentage": 11.7, "elapsed_time": "1:13:52", "remaining_time": "9:17:46"}
{"current_steps": 150, "total_steps": 1197, "loss": 0.8228, "lr": 5e-06, "epoch": 0.37546933667083854, "percentage": 12.53, "elapsed_time": "1:19:07", "remaining_time": "9:12:20"}
{"current_steps": 160, "total_steps": 1197, "loss": 0.8273, "lr": 5e-06, "epoch": 0.4005006257822278, "percentage": 13.37, "elapsed_time": "1:24:26", "remaining_time": "9:07:14"}
{"current_steps": 170, "total_steps": 1197, "loss": 0.8271, "lr": 5e-06, "epoch": 0.425531914893617, "percentage": 14.2, "elapsed_time": "1:29:42", "remaining_time": "9:01:55"}
{"current_steps": 180, "total_steps": 1197, "loss": 0.8201, "lr": 5e-06, "epoch": 0.45056320400500627, "percentage": 15.04, "elapsed_time": "1:34:58", "remaining_time": "8:56:37"}
{"current_steps": 190, "total_steps": 1197, "loss": 0.8165, "lr": 5e-06, "epoch": 0.4755944931163955, "percentage": 15.87, "elapsed_time": "1:40:15", "remaining_time": "8:51:22"}
{"current_steps": 200, "total_steps": 1197, "loss": 0.8165, "lr": 5e-06, "epoch": 0.5006257822277848, "percentage": 16.71, "elapsed_time": "1:45:32", "remaining_time": "8:46:08"}
{"current_steps": 210, "total_steps": 1197, "loss": 0.814, "lr": 5e-06, "epoch": 0.5256570713391739, "percentage": 17.54, "elapsed_time": "1:50:50", "remaining_time": "8:40:58"}
{"current_steps": 220, "total_steps": 1197, "loss": 0.8158, "lr": 5e-06, "epoch": 0.5506883604505632, "percentage": 18.38, "elapsed_time": "1:56:07", "remaining_time": "8:35:40"}
{"current_steps": 230, "total_steps": 1197, "loss": 0.8126, "lr": 5e-06, "epoch": 0.5757196495619524, "percentage": 19.21, "elapsed_time": "2:01:23", "remaining_time": "8:30:23"}
{"current_steps": 240, "total_steps": 1197, "loss": 0.8094, "lr": 5e-06, "epoch": 0.6007509386733417, "percentage": 20.05, "elapsed_time": "2:06:39", "remaining_time": "8:25:01"}
{"current_steps": 250, "total_steps": 1197, "loss": 0.8081, "lr": 5e-06, "epoch": 0.6257822277847309, "percentage": 20.89, "elapsed_time": "2:11:57", "remaining_time": "8:19:49"}
{"current_steps": 260, "total_steps": 1197, "loss": 0.8063, "lr": 5e-06, "epoch": 0.6508135168961201, "percentage": 21.72, "elapsed_time": "2:17:15", "remaining_time": "8:14:38"}
{"current_steps": 270, "total_steps": 1197, "loss": 0.8086, "lr": 5e-06, "epoch": 0.6758448060075094, "percentage": 22.56, "elapsed_time": "2:22:32", "remaining_time": "8:09:23"}
{"current_steps": 280, "total_steps": 1197, "loss": 0.8006, "lr": 5e-06, "epoch": 0.7008760951188986, "percentage": 23.39, "elapsed_time": "2:27:49", "remaining_time": "8:04:07"}
{"current_steps": 290, "total_steps": 1197, "loss": 0.8006, "lr": 5e-06, "epoch": 0.7259073842302879, "percentage": 24.23, "elapsed_time": "2:33:06", "remaining_time": "7:58:51"}
{"current_steps": 300, "total_steps": 1197, "loss": 0.7961, "lr": 5e-06, "epoch": 0.7509386733416771, "percentage": 25.06, "elapsed_time": "2:38:21", "remaining_time": "7:53:30"}
{"current_steps": 310, "total_steps": 1197, "loss": 0.7989, "lr": 5e-06, "epoch": 0.7759699624530664, "percentage": 25.9, "elapsed_time": "2:43:38", "remaining_time": "7:48:12"}
{"current_steps": 320, "total_steps": 1197, "loss": 0.7958, "lr": 5e-06, "epoch": 0.8010012515644556, "percentage": 26.73, "elapsed_time": "2:48:54", "remaining_time": "7:42:55"}
{"current_steps": 330, "total_steps": 1197, "loss": 0.798, "lr": 5e-06, "epoch": 0.8260325406758448, "percentage": 27.57, "elapsed_time": "2:54:14", "remaining_time": "7:37:45"}
{"current_steps": 340, "total_steps": 1197, "loss": 0.7979, "lr": 5e-06, "epoch": 0.851063829787234, "percentage": 28.4, "elapsed_time": "2:59:33", "remaining_time": "7:32:35"}
{"current_steps": 350, "total_steps": 1197, "loss": 0.796, "lr": 5e-06, "epoch": 0.8760951188986232, "percentage": 29.24, "elapsed_time": "3:04:53", "remaining_time": "7:27:25"}
{"current_steps": 360, "total_steps": 1197, "loss": 0.7927, "lr": 5e-06, "epoch": 0.9011264080100125, "percentage": 30.08, "elapsed_time": "3:10:12", "remaining_time": "7:22:13"}
{"current_steps": 370, "total_steps": 1197, "loss": 0.7954, "lr": 5e-06, "epoch": 0.9261576971214017, "percentage": 30.91, "elapsed_time": "3:15:30", "remaining_time": "7:17:00"}
{"current_steps": 380, "total_steps": 1197, "loss": 0.7892, "lr": 5e-06, "epoch": 0.951188986232791, "percentage": 31.75, "elapsed_time": "3:20:50", "remaining_time": "7:11:47"}
{"current_steps": 390, "total_steps": 1197, "loss": 0.7876, "lr": 5e-06, "epoch": 0.9762202753441802, "percentage": 32.58, "elapsed_time": "3:26:08", "remaining_time": "7:06:33"}
{"current_steps": 399, "total_steps": 1197, "eval_loss": 0.7894856929779053, "epoch": 0.9987484355444305, "percentage": 33.33, "elapsed_time": "3:35:34", "remaining_time": "7:11:09"}
{"current_steps": 400, "total_steps": 1197, "loss": 0.8446, "lr": 5e-06, "epoch": 1.0018773466833542, "percentage": 33.42, "elapsed_time": "3:37:09", "remaining_time": "7:12:41"}
{"current_steps": 410, "total_steps": 1197, "loss": 0.7458, "lr": 5e-06, "epoch": 1.0269086357947435, "percentage": 34.25, "elapsed_time": "3:42:27", "remaining_time": "7:07:00"}
{"current_steps": 420, "total_steps": 1197, "loss": 0.7468, "lr": 5e-06, "epoch": 1.0519399249061328, "percentage": 35.09, "elapsed_time": "3:47:44", "remaining_time": "7:01:19"}
{"current_steps": 430, "total_steps": 1197, "loss": 0.7482, "lr": 5e-06, "epoch": 1.0769712140175218, "percentage": 35.92, "elapsed_time": "3:53:02", "remaining_time": "6:55:41"}
{"current_steps": 440, "total_steps": 1197, "loss": 0.7462, "lr": 5e-06, "epoch": 1.1020025031289111, "percentage": 36.76, "elapsed_time": "3:58:20", "remaining_time": "6:50:02"}
{"current_steps": 450, "total_steps": 1197, "loss": 0.7451, "lr": 5e-06, "epoch": 1.1270337922403004, "percentage": 37.59, "elapsed_time": "4:03:37", "remaining_time": "6:44:24"}
{"current_steps": 460, "total_steps": 1197, "loss": 0.7455, "lr": 5e-06, "epoch": 1.1520650813516897, "percentage": 38.43, "elapsed_time": "4:08:55", "remaining_time": "6:38:48"}
{"current_steps": 470, "total_steps": 1197, "loss": 0.7464, "lr": 5e-06, "epoch": 1.1770963704630788, "percentage": 39.26, "elapsed_time": "4:14:12", "remaining_time": "6:33:12"}
{"current_steps": 480, "total_steps": 1197, "loss": 0.7467, "lr": 5e-06, "epoch": 1.202127659574468, "percentage": 40.1, "elapsed_time": "4:19:30", "remaining_time": "6:27:38"}
{"current_steps": 490, "total_steps": 1197, "loss": 0.7466, "lr": 5e-06, "epoch": 1.2271589486858574, "percentage": 40.94, "elapsed_time": "4:24:48", "remaining_time": "6:22:05"}
{"current_steps": 500, "total_steps": 1197, "loss": 0.7472, "lr": 5e-06, "epoch": 1.2521902377972465, "percentage": 41.77, "elapsed_time": "4:30:06", "remaining_time": "6:16:32"}
{"current_steps": 510, "total_steps": 1197, "loss": 0.7483, "lr": 5e-06, "epoch": 1.2772215269086358, "percentage": 42.61, "elapsed_time": "4:35:24", "remaining_time": "6:10:59"}
{"current_steps": 520, "total_steps": 1197, "loss": 0.7435, "lr": 5e-06, "epoch": 1.302252816020025, "percentage": 43.44, "elapsed_time": "4:40:42", "remaining_time": "6:05:27"}
{"current_steps": 530, "total_steps": 1197, "loss": 0.7466, "lr": 5e-06, "epoch": 1.3272841051314144, "percentage": 44.28, "elapsed_time": "4:45:58", "remaining_time": "5:59:53"}
{"current_steps": 540, "total_steps": 1197, "loss": 0.7448, "lr": 5e-06, "epoch": 1.3523153942428034, "percentage": 45.11, "elapsed_time": "4:51:16", "remaining_time": "5:54:22"}
{"current_steps": 550, "total_steps": 1197, "loss": 0.744, "lr": 5e-06, "epoch": 1.3773466833541927, "percentage": 45.95, "elapsed_time": "4:56:33", "remaining_time": "5:48:52"}
{"current_steps": 560, "total_steps": 1197, "loss": 0.7478, "lr": 5e-06, "epoch": 1.402377972465582, "percentage": 46.78, "elapsed_time": "5:01:51", "remaining_time": "5:43:21"}
{"current_steps": 570, "total_steps": 1197, "loss": 0.7439, "lr": 5e-06, "epoch": 1.4274092615769711, "percentage": 47.62, "elapsed_time": "5:07:09", "remaining_time": "5:37:52"}
{"current_steps": 580, "total_steps": 1197, "loss": 0.7409, "lr": 5e-06, "epoch": 1.4524405506883604, "percentage": 48.45, "elapsed_time": "5:12:26", "remaining_time": "5:32:22"}
{"current_steps": 590, "total_steps": 1197, "loss": 0.7426, "lr": 5e-06, "epoch": 1.4774718397997497, "percentage": 49.29, "elapsed_time": "5:17:45", "remaining_time": "5:26:54"}
{"current_steps": 600, "total_steps": 1197, "loss": 0.7411, "lr": 5e-06, "epoch": 1.502503128911139, "percentage": 50.13, "elapsed_time": "5:23:03", "remaining_time": "5:21:27"}
{"current_steps": 610, "total_steps": 1197, "loss": 0.7443, "lr": 5e-06, "epoch": 1.5275344180225283, "percentage": 50.96, "elapsed_time": "5:28:21", "remaining_time": "5:15:59"}
{"current_steps": 620, "total_steps": 1197, "loss": 0.745, "lr": 5e-06, "epoch": 1.5525657071339174, "percentage": 51.8, "elapsed_time": "5:33:40", "remaining_time": "5:10:31"}
{"current_steps": 630, "total_steps": 1197, "loss": 0.7431, "lr": 5e-06, "epoch": 1.5775969962453065, "percentage": 52.63, "elapsed_time": "5:38:58", "remaining_time": "5:05:04"}
{"current_steps": 640, "total_steps": 1197, "loss": 0.745, "lr": 5e-06, "epoch": 1.6026282853566958, "percentage": 53.47, "elapsed_time": "5:44:13", "remaining_time": "4:59:34"}
{"current_steps": 650, "total_steps": 1197, "loss": 0.745, "lr": 5e-06, "epoch": 1.627659574468085, "percentage": 54.3, "elapsed_time": "5:49:30", "remaining_time": "4:54:07"}
{"current_steps": 660, "total_steps": 1197, "loss": 0.7413, "lr": 5e-06, "epoch": 1.6526908635794744, "percentage": 55.14, "elapsed_time": "5:54:47", "remaining_time": "4:48:40"}
{"current_steps": 670, "total_steps": 1197, "loss": 0.746, "lr": 5e-06, "epoch": 1.6777221526908637, "percentage": 55.97, "elapsed_time": "6:00:03", "remaining_time": "4:43:12"}
{"current_steps": 680, "total_steps": 1197, "loss": 0.7434, "lr": 5e-06, "epoch": 1.702753441802253, "percentage": 56.81, "elapsed_time": "6:05:21", "remaining_time": "4:37:46"}
{"current_steps": 690, "total_steps": 1197, "loss": 0.7426, "lr": 5e-06, "epoch": 1.727784730913642, "percentage": 57.64, "elapsed_time": "6:10:39", "remaining_time": "4:32:21"}
{"current_steps": 700, "total_steps": 1197, "loss": 0.7397, "lr": 5e-06, "epoch": 1.7528160200250313, "percentage": 58.48, "elapsed_time": "6:15:55", "remaining_time": "4:26:54"}
{"current_steps": 710, "total_steps": 1197, "loss": 0.7425, "lr": 5e-06, "epoch": 1.7778473091364204, "percentage": 59.31, "elapsed_time": "6:21:14", "remaining_time": "4:21:29"}
{"current_steps": 720, "total_steps": 1197, "loss": 0.7415, "lr": 5e-06, "epoch": 1.8028785982478097, "percentage": 60.15, "elapsed_time": "6:26:31", "remaining_time": "4:16:04"}
{"current_steps": 730, "total_steps": 1197, "loss": 0.7409, "lr": 5e-06, "epoch": 1.827909887359199, "percentage": 60.99, "elapsed_time": "6:31:48", "remaining_time": "4:10:39"}
{"current_steps": 740, "total_steps": 1197, "loss": 0.741, "lr": 5e-06, "epoch": 1.8529411764705883, "percentage": 61.82, "elapsed_time": "6:37:06", "remaining_time": "4:05:14"}
{"current_steps": 750, "total_steps": 1197, "loss": 0.7398, "lr": 5e-06, "epoch": 1.8779724655819776, "percentage": 62.66, "elapsed_time": "6:42:24", "remaining_time": "3:59:49"}
{"current_steps": 760, "total_steps": 1197, "loss": 0.7375, "lr": 5e-06, "epoch": 1.9030037546933667, "percentage": 63.49, "elapsed_time": "6:47:42", "remaining_time": "3:54:25"}
{"current_steps": 770, "total_steps": 1197, "loss": 0.7398, "lr": 5e-06, "epoch": 1.928035043804756, "percentage": 64.33, "elapsed_time": "6:52:59", "remaining_time": "3:49:01"}
{"current_steps": 780, "total_steps": 1197, "loss": 0.738, "lr": 5e-06, "epoch": 1.953066332916145, "percentage": 65.16, "elapsed_time": "6:58:15", "remaining_time": "3:43:36"}
{"current_steps": 790, "total_steps": 1197, "loss": 0.7419, "lr": 5e-06, "epoch": 1.9780976220275344, "percentage": 66.0, "elapsed_time": "7:03:29", "remaining_time": "3:38:10"}
{"current_steps": 798, "total_steps": 1197, "eval_loss": 0.7726743817329407, "epoch": 1.9981226533166458, "percentage": 66.67, "elapsed_time": "7:12:37", "remaining_time": "3:36:18"}
{"current_steps": 800, "total_steps": 1197, "loss": 0.7865, "lr": 5e-06, "epoch": 2.0037546933667083, "percentage": 66.83, "elapsed_time": "7:14:45", "remaining_time": "3:35:44"}
{"current_steps": 810, "total_steps": 1197, "loss": 0.699, "lr": 5e-06, "epoch": 2.0287859824780976, "percentage": 67.67, "elapsed_time": "7:20:01", "remaining_time": "3:30:14"}
{"current_steps": 820, "total_steps": 1197, "loss": 0.6925, "lr": 5e-06, "epoch": 2.053817271589487, "percentage": 68.5, "elapsed_time": "7:25:20", "remaining_time": "3:24:44"}
{"current_steps": 830, "total_steps": 1197, "loss": 0.6919, "lr": 5e-06, "epoch": 2.078848560700876, "percentage": 69.34, "elapsed_time": "7:30:38", "remaining_time": "3:19:15"}
{"current_steps": 840, "total_steps": 1197, "loss": 0.6934, "lr": 5e-06, "epoch": 2.1038798498122655, "percentage": 70.18, "elapsed_time": "7:35:56", "remaining_time": "3:13:46"}
{"current_steps": 850, "total_steps": 1197, "loss": 0.6927, "lr": 5e-06, "epoch": 2.1289111389236544, "percentage": 71.01, "elapsed_time": "7:41:14", "remaining_time": "3:08:17"}
{"current_steps": 860, "total_steps": 1197, "loss": 0.6937, "lr": 5e-06, "epoch": 2.1539424280350437, "percentage": 71.85, "elapsed_time": "7:46:31", "remaining_time": "3:02:48"}
{"current_steps": 870, "total_steps": 1197, "loss": 0.6945, "lr": 5e-06, "epoch": 2.178973717146433, "percentage": 72.68, "elapsed_time": "7:51:48", "remaining_time": "2:57:20"}
{"current_steps": 880, "total_steps": 1197, "loss": 0.6944, "lr": 5e-06, "epoch": 2.2040050062578223, "percentage": 73.52, "elapsed_time": "7:57:06", "remaining_time": "2:51:52"}
{"current_steps": 890, "total_steps": 1197, "loss": 0.6964, "lr": 5e-06, "epoch": 2.2290362953692116, "percentage": 74.35, "elapsed_time": "8:02:24", "remaining_time": "2:46:24"}
{"current_steps": 900, "total_steps": 1197, "loss": 0.6935, "lr": 5e-06, "epoch": 2.254067584480601, "percentage": 75.19, "elapsed_time": "8:07:43", "remaining_time": "2:40:56"}
{"current_steps": 910, "total_steps": 1197, "loss": 0.6993, "lr": 5e-06, "epoch": 2.27909887359199, "percentage": 76.02, "elapsed_time": "8:13:00", "remaining_time": "2:35:29"}
{"current_steps": 920, "total_steps": 1197, "loss": 0.6986, "lr": 5e-06, "epoch": 2.3041301627033794, "percentage": 76.86, "elapsed_time": "8:18:20", "remaining_time": "2:30:02"}
{"current_steps": 930, "total_steps": 1197, "loss": 0.6979, "lr": 5e-06, "epoch": 2.3291614518147683, "percentage": 77.69, "elapsed_time": "8:23:39", "remaining_time": "2:24:35"}
{"current_steps": 940, "total_steps": 1197, "loss": 0.6985, "lr": 5e-06, "epoch": 2.3541927409261576, "percentage": 78.53, "elapsed_time": "8:28:58", "remaining_time": "2:19:09"}
{"current_steps": 950, "total_steps": 1197, "loss": 0.6994, "lr": 5e-06, "epoch": 2.379224030037547, "percentage": 79.37, "elapsed_time": "8:34:17", "remaining_time": "2:13:42"}
{"current_steps": 960, "total_steps": 1197, "loss": 0.6953, "lr": 5e-06, "epoch": 2.404255319148936, "percentage": 80.2, "elapsed_time": "8:39:34", "remaining_time": "2:08:16"}
{"current_steps": 970, "total_steps": 1197, "loss": 0.6977, "lr": 5e-06, "epoch": 2.4292866082603255, "percentage": 81.04, "elapsed_time": "8:44:53", "remaining_time": "2:02:50"}
{"current_steps": 980, "total_steps": 1197, "loss": 0.6936, "lr": 5e-06, "epoch": 2.454317897371715, "percentage": 81.87, "elapsed_time": "8:50:12", "remaining_time": "1:57:24"}
{"current_steps": 990, "total_steps": 1197, "loss": 0.6966, "lr": 5e-06, "epoch": 2.4793491864831037, "percentage": 82.71, "elapsed_time": "8:55:30", "remaining_time": "1:51:58"}
{"current_steps": 1000, "total_steps": 1197, "loss": 0.6977, "lr": 5e-06, "epoch": 2.504380475594493, "percentage": 83.54, "elapsed_time": "9:00:48", "remaining_time": "1:46:32"}
{"current_steps": 1010, "total_steps": 1197, "loss": 0.7037, "lr": 5e-06, "epoch": 2.5294117647058822, "percentage": 84.38, "elapsed_time": "9:06:04", "remaining_time": "1:41:06"}
{"current_steps": 1020, "total_steps": 1197, "loss": 0.695, "lr": 5e-06, "epoch": 2.5544430538172715, "percentage": 85.21, "elapsed_time": "9:11:20", "remaining_time": "1:35:40"}
{"current_steps": 1030, "total_steps": 1197, "loss": 0.702, "lr": 5e-06, "epoch": 2.579474342928661, "percentage": 86.05, "elapsed_time": "9:16:37", "remaining_time": "1:30:14"}
{"current_steps": 1040, "total_steps": 1197, "loss": 0.6965, "lr": 5e-06, "epoch": 2.60450563204005, "percentage": 86.88, "elapsed_time": "9:21:54", "remaining_time": "1:24:49"}
{"current_steps": 1050, "total_steps": 1197, "loss": 0.6958, "lr": 5e-06, "epoch": 2.6295369211514394, "percentage": 87.72, "elapsed_time": "9:27:14", "remaining_time": "1:19:24"}
{"current_steps": 1060, "total_steps": 1197, "loss": 0.6977, "lr": 5e-06, "epoch": 2.6545682102628287, "percentage": 88.55, "elapsed_time": "9:32:32", "remaining_time": "1:13:59"}
{"current_steps": 1070, "total_steps": 1197, "loss": 0.6992, "lr": 5e-06, "epoch": 2.679599499374218, "percentage": 89.39, "elapsed_time": "9:37:51", "remaining_time": "1:08:35"}
{"current_steps": 1080, "total_steps": 1197, "loss": 0.6977, "lr": 5e-06, "epoch": 2.704630788485607, "percentage": 90.23, "elapsed_time": "9:43:10", "remaining_time": "1:03:10"}
{"current_steps": 1090, "total_steps": 1197, "loss": 0.6994, "lr": 5e-06, "epoch": 2.729662077596996, "percentage": 91.06, "elapsed_time": "9:48:29", "remaining_time": "0:57:46"}
{"current_steps": 1100, "total_steps": 1197, "loss": 0.698, "lr": 5e-06, "epoch": 2.7546933667083855, "percentage": 91.9, "elapsed_time": "9:53:48", "remaining_time": "0:52:21"}
{"current_steps": 1110, "total_steps": 1197, "loss": 0.699, "lr": 5e-06, "epoch": 2.779724655819775, "percentage": 92.73, "elapsed_time": "9:59:06", "remaining_time": "0:46:57"}
{"current_steps": 1120, "total_steps": 1197, "loss": 0.6979, "lr": 5e-06, "epoch": 2.804755944931164, "percentage": 93.57, "elapsed_time": "10:04:23", "remaining_time": "0:41:33"}
{"current_steps": 1130, "total_steps": 1197, "loss": 0.7011, "lr": 5e-06, "epoch": 2.829787234042553, "percentage": 94.4, "elapsed_time": "10:09:40", "remaining_time": "0:36:08"}
{"current_steps": 1140, "total_steps": 1197, "loss": 0.6988, "lr": 5e-06, "epoch": 2.8548185231539422, "percentage": 95.24, "elapsed_time": "10:14:58", "remaining_time": "0:30:44"}
{"current_steps": 1150, "total_steps": 1197, "loss": 0.6968, "lr": 5e-06, "epoch": 2.8798498122653315, "percentage": 96.07, "elapsed_time": "10:20:14", "remaining_time": "0:25:20"}
{"current_steps": 1160, "total_steps": 1197, "loss": 0.7005, "lr": 5e-06, "epoch": 2.904881101376721, "percentage": 96.91, "elapsed_time": "10:25:30", "remaining_time": "0:19:57"}
{"current_steps": 1170, "total_steps": 1197, "loss": 0.7034, "lr": 5e-06, "epoch": 2.92991239048811, "percentage": 97.74, "elapsed_time": "10:30:47", "remaining_time": "0:14:33"}
{"current_steps": 1180, "total_steps": 1197, "loss": 0.6951, "lr": 5e-06, "epoch": 2.9549436795994994, "percentage": 98.58, "elapsed_time": "10:36:04", "remaining_time": "0:09:09"}
{"current_steps": 1190, "total_steps": 1197, "loss": 0.6976, "lr": 5e-06, "epoch": 2.9799749687108887, "percentage": 99.42, "elapsed_time": "10:41:23", "remaining_time": "0:03:46"}
{"current_steps": 1197, "total_steps": 1197, "eval_loss": 0.770167887210846, "epoch": 2.997496871088861, "percentage": 100.0, "elapsed_time": "10:50:52", "remaining_time": "0:00:00"}
{"current_steps": 1197, "total_steps": 1197, "epoch": 2.997496871088861, "percentage": 100.0, "elapsed_time": "10:52:26", "remaining_time": "0:00:00"}
|