Llama-3.1-8B-Instruct-KTO-600 / trainer_log.jsonl
chchen's picture
Training in progress, step 670
a4414f5 verified
{"current_steps": 10, "total_steps": 670, "loss": 0.5, "lr": 7.462686567164179e-07, "epoch": 0.14814814814814814, "percentage": 1.49, "elapsed_time": "0:00:51", "remaining_time": "0:56:56"}
{"current_steps": 20, "total_steps": 670, "loss": 0.5, "lr": 1.4925373134328358e-06, "epoch": 0.2962962962962963, "percentage": 2.99, "elapsed_time": "0:01:44", "remaining_time": "0:56:24"}
{"current_steps": 30, "total_steps": 670, "loss": 0.5003, "lr": 2.238805970149254e-06, "epoch": 0.4444444444444444, "percentage": 4.48, "elapsed_time": "0:02:36", "remaining_time": "0:55:47"}
{"current_steps": 40, "total_steps": 670, "loss": 0.4997, "lr": 2.9850746268656716e-06, "epoch": 0.5925925925925926, "percentage": 5.97, "elapsed_time": "0:03:26", "remaining_time": "0:54:16"}
{"current_steps": 50, "total_steps": 670, "loss": 0.4993, "lr": 3.73134328358209e-06, "epoch": 0.7407407407407407, "percentage": 7.46, "elapsed_time": "0:04:17", "remaining_time": "0:53:08"}
{"current_steps": 50, "total_steps": 670, "eval_loss": 0.49984320998191833, "epoch": 0.7407407407407407, "percentage": 7.46, "elapsed_time": "0:04:41", "remaining_time": "0:58:07"}
{"current_steps": 60, "total_steps": 670, "loss": 0.4997, "lr": 4.477611940298508e-06, "epoch": 0.8888888888888888, "percentage": 8.96, "elapsed_time": "0:05:39", "remaining_time": "0:57:27"}
{"current_steps": 70, "total_steps": 670, "loss": 0.498, "lr": 4.999694642351633e-06, "epoch": 1.037037037037037, "percentage": 10.45, "elapsed_time": "0:06:30", "remaining_time": "0:55:48"}
{"current_steps": 80, "total_steps": 670, "loss": 0.4936, "lr": 4.994268136829438e-06, "epoch": 1.1851851851851851, "percentage": 11.94, "elapsed_time": "0:07:22", "remaining_time": "0:54:22"}
{"current_steps": 90, "total_steps": 670, "loss": 0.489, "lr": 4.982072857175816e-06, "epoch": 1.3333333333333333, "percentage": 13.43, "elapsed_time": "0:08:12", "remaining_time": "0:52:56"}
{"current_steps": 100, "total_steps": 670, "loss": 0.4763, "lr": 4.963141898105898e-06, "epoch": 1.4814814814814814, "percentage": 14.93, "elapsed_time": "0:09:03", "remaining_time": "0:51:35"}
{"current_steps": 100, "total_steps": 670, "eval_loss": 0.4761941134929657, "epoch": 1.4814814814814814, "percentage": 14.93, "elapsed_time": "0:09:27", "remaining_time": "0:53:53"}
{"current_steps": 110, "total_steps": 670, "loss": 0.4616, "lr": 4.93752663316054e-06, "epoch": 1.6296296296296298, "percentage": 16.42, "elapsed_time": "0:10:25", "remaining_time": "0:53:05"}
{"current_steps": 120, "total_steps": 670, "loss": 0.4534, "lr": 4.905296575292329e-06, "epoch": 1.7777777777777777, "percentage": 17.91, "elapsed_time": "0:11:18", "remaining_time": "0:51:50"}
{"current_steps": 130, "total_steps": 670, "loss": 0.4199, "lr": 4.866539188226086e-06, "epoch": 1.925925925925926, "percentage": 19.4, "elapsed_time": "0:12:10", "remaining_time": "0:50:36"}
{"current_steps": 140, "total_steps": 670, "loss": 0.406, "lr": 4.821359649105801e-06, "epoch": 2.074074074074074, "percentage": 20.9, "elapsed_time": "0:13:03", "remaining_time": "0:49:25"}
{"current_steps": 150, "total_steps": 670, "loss": 0.3669, "lr": 4.769880563072097e-06, "epoch": 2.2222222222222223, "percentage": 22.39, "elapsed_time": "0:13:53", "remaining_time": "0:48:10"}
{"current_steps": 150, "total_steps": 670, "eval_loss": 0.3864615559577942, "epoch": 2.2222222222222223, "percentage": 22.39, "elapsed_time": "0:14:17", "remaining_time": "0:49:33"}
{"current_steps": 160, "total_steps": 670, "loss": 0.34, "lr": 4.712241630544792e-06, "epoch": 2.3703703703703702, "percentage": 23.88, "elapsed_time": "0:15:16", "remaining_time": "0:48:41"}
{"current_steps": 170, "total_steps": 670, "loss": 0.3402, "lr": 4.648599268113464e-06, "epoch": 2.5185185185185186, "percentage": 25.37, "elapsed_time": "0:16:07", "remaining_time": "0:47:26"}
{"current_steps": 180, "total_steps": 670, "loss": 0.341, "lr": 4.579126184064814e-06, "epoch": 2.6666666666666665, "percentage": 26.87, "elapsed_time": "0:16:57", "remaining_time": "0:46:10"}
{"current_steps": 190, "total_steps": 670, "loss": 0.3134, "lr": 4.504010909698744e-06, "epoch": 2.814814814814815, "percentage": 28.36, "elapsed_time": "0:17:52", "remaining_time": "0:45:09"}
{"current_steps": 200, "total_steps": 670, "loss": 0.2687, "lr": 4.4234572877050175e-06, "epoch": 2.962962962962963, "percentage": 29.85, "elapsed_time": "0:18:42", "remaining_time": "0:43:58"}
{"current_steps": 200, "total_steps": 670, "eval_loss": 0.28439071774482727, "epoch": 2.962962962962963, "percentage": 29.85, "elapsed_time": "0:19:06", "remaining_time": "0:44:54"}
{"current_steps": 210, "total_steps": 670, "loss": 0.2378, "lr": 4.337683918988924e-06, "epoch": 3.111111111111111, "percentage": 31.34, "elapsed_time": "0:20:01", "remaining_time": "0:43:50"}
{"current_steps": 220, "total_steps": 670, "loss": 0.2449, "lr": 4.246923569447105e-06, "epoch": 3.259259259259259, "percentage": 32.84, "elapsed_time": "0:20:52", "remaining_time": "0:42:41"}
{"current_steps": 230, "total_steps": 670, "loss": 0.2281, "lr": 4.151422538303393e-06, "epoch": 3.4074074074074074, "percentage": 34.33, "elapsed_time": "0:21:42", "remaining_time": "0:41:32"}
{"current_steps": 240, "total_steps": 670, "loss": 0.2467, "lr": 4.051439989718845e-06, "epoch": 3.5555555555555554, "percentage": 35.82, "elapsed_time": "0:22:32", "remaining_time": "0:40:22"}
{"current_steps": 250, "total_steps": 670, "loss": 0.2398, "lr": 3.947247249489779e-06, "epoch": 3.7037037037037037, "percentage": 37.31, "elapsed_time": "0:23:23", "remaining_time": "0:39:17"}
{"current_steps": 250, "total_steps": 670, "eval_loss": 0.22377242147922516, "epoch": 3.7037037037037037, "percentage": 37.31, "elapsed_time": "0:23:47", "remaining_time": "0:39:57"}
{"current_steps": 260, "total_steps": 670, "loss": 0.2811, "lr": 3.839127068742399e-06, "epoch": 3.851851851851852, "percentage": 38.81, "elapsed_time": "0:24:46", "remaining_time": "0:39:03"}
{"current_steps": 270, "total_steps": 670, "loss": 0.2314, "lr": 3.7273728566221447e-06, "epoch": 4.0, "percentage": 40.3, "elapsed_time": "0:25:38", "remaining_time": "0:37:59"}
{"current_steps": 280, "total_steps": 670, "loss": 0.224, "lr": 3.6122878840600417e-06, "epoch": 4.148148148148148, "percentage": 41.79, "elapsed_time": "0:26:28", "remaining_time": "0:36:51"}
{"current_steps": 290, "total_steps": 670, "loss": 0.2012, "lr": 3.4941844607768007e-06, "epoch": 4.296296296296296, "percentage": 43.28, "elapsed_time": "0:27:17", "remaining_time": "0:35:45"}
{"current_steps": 300, "total_steps": 670, "loss": 0.2508, "lr": 3.3733830877580796e-06, "epoch": 4.444444444444445, "percentage": 44.78, "elapsed_time": "0:28:10", "remaining_time": "0:34:45"}
{"current_steps": 300, "total_steps": 670, "eval_loss": 0.20890283584594727, "epoch": 4.444444444444445, "percentage": 44.78, "elapsed_time": "0:28:34", "remaining_time": "0:35:14"}
{"current_steps": 310, "total_steps": 670, "loss": 0.1983, "lr": 3.2502115875008523e-06, "epoch": 4.592592592592593, "percentage": 46.27, "elapsed_time": "0:29:30", "remaining_time": "0:34:15"}
{"current_steps": 320, "total_steps": 670, "loss": 0.2225, "lr": 3.1250042143911462e-06, "epoch": 4.7407407407407405, "percentage": 47.76, "elapsed_time": "0:30:23", "remaining_time": "0:33:14"}
{"current_steps": 330, "total_steps": 670, "loss": 0.1805, "lr": 2.9981007476273787e-06, "epoch": 4.888888888888889, "percentage": 49.25, "elapsed_time": "0:31:14", "remaining_time": "0:32:10"}
{"current_steps": 340, "total_steps": 670, "loss": 0.1994, "lr": 2.869845569150825e-06, "epoch": 5.037037037037037, "percentage": 50.75, "elapsed_time": "0:32:06", "remaining_time": "0:31:10"}
{"current_steps": 350, "total_steps": 670, "loss": 0.1947, "lr": 2.740586729085476e-06, "epoch": 5.185185185185185, "percentage": 52.24, "elapsed_time": "0:32:57", "remaining_time": "0:30:07"}
{"current_steps": 350, "total_steps": 670, "eval_loss": 0.20565180480480194, "epoch": 5.185185185185185, "percentage": 52.24, "elapsed_time": "0:33:21", "remaining_time": "0:30:29"}
{"current_steps": 360, "total_steps": 670, "loss": 0.2154, "lr": 2.610675001223441e-06, "epoch": 5.333333333333333, "percentage": 53.73, "elapsed_time": "0:34:17", "remaining_time": "0:29:32"}
{"current_steps": 370, "total_steps": 670, "loss": 0.2425, "lr": 2.48046293111904e-06, "epoch": 5.481481481481482, "percentage": 55.22, "elapsed_time": "0:35:08", "remaining_time": "0:28:29"}
{"current_steps": 380, "total_steps": 670, "loss": 0.2111, "lr": 2.350303879374813e-06, "epoch": 5.62962962962963, "percentage": 56.72, "elapsed_time": "0:36:02", "remaining_time": "0:27:29"}
{"current_steps": 390, "total_steps": 670, "loss": 0.1708, "lr": 2.220551062715699e-06, "epoch": 5.777777777777778, "percentage": 58.21, "elapsed_time": "0:36:54", "remaining_time": "0:26:30"}
{"current_steps": 400, "total_steps": 670, "loss": 0.1666, "lr": 2.0915565954536745e-06, "epoch": 5.925925925925926, "percentage": 59.7, "elapsed_time": "0:37:46", "remaining_time": "0:25:29"}
{"current_steps": 400, "total_steps": 670, "eval_loss": 0.20268844068050385, "epoch": 5.925925925925926, "percentage": 59.7, "elapsed_time": "0:38:10", "remaining_time": "0:25:46"}
{"current_steps": 410, "total_steps": 670, "loss": 0.204, "lr": 1.9636705339440327e-06, "epoch": 6.074074074074074, "percentage": 61.19, "elapsed_time": "0:39:09", "remaining_time": "0:24:49"}
{"current_steps": 420, "total_steps": 670, "loss": 0.198, "lr": 1.8372399266264069e-06, "epoch": 6.222222222222222, "percentage": 62.69, "elapsed_time": "0:40:00", "remaining_time": "0:23:48"}
{"current_steps": 430, "total_steps": 670, "loss": 0.2036, "lr": 1.7126078722284739e-06, "epoch": 6.37037037037037, "percentage": 64.18, "elapsed_time": "0:40:49", "remaining_time": "0:22:47"}
{"current_steps": 440, "total_steps": 670, "loss": 0.1477, "lr": 1.5901125886881147e-06, "epoch": 6.518518518518518, "percentage": 65.67, "elapsed_time": "0:41:43", "remaining_time": "0:21:48"}
{"current_steps": 450, "total_steps": 670, "loss": 0.1956, "lr": 1.4700864953207192e-06, "epoch": 6.666666666666667, "percentage": 67.16, "elapsed_time": "0:42:35", "remaining_time": "0:20:49"}
{"current_steps": 450, "total_steps": 670, "eval_loss": 0.20225472748279572, "epoch": 6.666666666666667, "percentage": 67.16, "elapsed_time": "0:42:59", "remaining_time": "0:21:01"}
{"current_steps": 460, "total_steps": 670, "loss": 0.2073, "lr": 1.3528553107224108e-06, "epoch": 6.814814814814815, "percentage": 68.66, "elapsed_time": "0:43:56", "remaining_time": "0:20:03"}
{"current_steps": 470, "total_steps": 670, "loss": 0.2205, "lr": 1.2387371688572133e-06, "epoch": 6.962962962962963, "percentage": 70.15, "elapsed_time": "0:44:46", "remaining_time": "0:19:03"}
{"current_steps": 480, "total_steps": 670, "loss": 0.1891, "lr": 1.1280417557268735e-06, "epoch": 7.111111111111111, "percentage": 71.64, "elapsed_time": "0:45:38", "remaining_time": "0:18:04"}
{"current_steps": 490, "total_steps": 670, "loss": 0.167, "lr": 1.021069468966194e-06, "epoch": 7.2592592592592595, "percentage": 73.13, "elapsed_time": "0:46:27", "remaining_time": "0:17:04"}
{"current_steps": 500, "total_steps": 670, "loss": 0.1888, "lr": 9.181106026444913e-07, "epoch": 7.407407407407407, "percentage": 74.63, "elapsed_time": "0:47:19", "remaining_time": "0:16:05"}
{"current_steps": 500, "total_steps": 670, "eval_loss": 0.20255741477012634, "epoch": 7.407407407407407, "percentage": 74.63, "elapsed_time": "0:47:43", "remaining_time": "0:16:13"}
{"current_steps": 510, "total_steps": 670, "loss": 0.1591, "lr": 8.1944455948542e-07, "epoch": 7.555555555555555, "percentage": 76.12, "elapsed_time": "0:48:39", "remaining_time": "0:15:15"}
{"current_steps": 520, "total_steps": 670, "loss": 0.2168, "lr": 7.253390926429918e-07, "epoch": 7.703703703703704, "percentage": 77.61, "elapsed_time": "0:49:32", "remaining_time": "0:14:17"}
{"current_steps": 530, "total_steps": 670, "loss": 0.2137, "lr": 6.360495790913926e-07, "epoch": 7.851851851851852, "percentage": 79.1, "elapsed_time": "0:50:24", "remaining_time": "0:13:18"}
{"current_steps": 540, "total_steps": 670, "loss": 0.1988, "lr": 5.518183266004276e-07, "epoch": 8.0, "percentage": 80.6, "elapsed_time": "0:51:16", "remaining_time": "0:12:20"}
{"current_steps": 550, "total_steps": 670, "loss": 0.2411, "lr": 4.728739161772874e-07, "epoch": 8.148148148148149, "percentage": 82.09, "elapsed_time": "0:52:06", "remaining_time": "0:11:22"}
{"current_steps": 550, "total_steps": 670, "eval_loss": 0.20238587260246277, "epoch": 8.148148148148149, "percentage": 82.09, "elapsed_time": "0:52:30", "remaining_time": "0:11:27"}
{"current_steps": 560, "total_steps": 670, "loss": 0.1966, "lr": 3.9943058175905493e-07, "epoch": 8.296296296296296, "percentage": 83.58, "elapsed_time": "0:53:30", "remaining_time": "0:10:30"}
{"current_steps": 570, "total_steps": 670, "loss": 0.1677, "lr": 3.3168762883931256e-07, "epoch": 8.444444444444445, "percentage": 85.07, "elapsed_time": "0:54:22", "remaining_time": "0:09:32"}
{"current_steps": 580, "total_steps": 670, "loss": 0.1693, "lr": 2.698288936065338e-07, "epoch": 8.592592592592592, "percentage": 86.57, "elapsed_time": "0:55:13", "remaining_time": "0:08:34"}
{"current_steps": 590, "total_steps": 670, "loss": 0.1945, "lr": 2.1402224406202377e-07, "epoch": 8.74074074074074, "percentage": 88.06, "elapsed_time": "0:56:03", "remaining_time": "0:07:36"}
{"current_steps": 600, "total_steps": 670, "loss": 0.2231, "lr": 1.644191244712251e-07, "epoch": 8.88888888888889, "percentage": 89.55, "elapsed_time": "0:56:56", "remaining_time": "0:06:38"}
{"current_steps": 600, "total_steps": 670, "eval_loss": 0.20180447399616241, "epoch": 8.88888888888889, "percentage": 89.55, "elapsed_time": "0:57:20", "remaining_time": "0:06:41"}
{"current_steps": 610, "total_steps": 670, "loss": 0.1474, "lr": 1.2115414438463646e-07, "epoch": 9.037037037037036, "percentage": 91.04, "elapsed_time": "0:58:16", "remaining_time": "0:05:43"}
{"current_steps": 620, "total_steps": 670, "loss": 0.2276, "lr": 8.434471334363204e-08, "epoch": 9.185185185185185, "percentage": 92.54, "elapsed_time": "0:59:09", "remaining_time": "0:04:46"}
{"current_steps": 630, "total_steps": 670, "loss": 0.2027, "lr": 5.4090722262481463e-08, "epoch": 9.333333333333334, "percentage": 94.03, "elapsed_time": "1:00:02", "remaining_time": "0:03:48"}
{"current_steps": 640, "total_steps": 670, "loss": 0.2072, "lr": 3.047427235122663e-08, "epoch": 9.481481481481481, "percentage": 95.52, "elapsed_time": "1:00:54", "remaining_time": "0:02:51"}
{"current_steps": 650, "total_steps": 670, "loss": 0.1966, "lr": 1.3559452315037025e-08, "epoch": 9.62962962962963, "percentage": 97.01, "elapsed_time": "1:01:45", "remaining_time": "0:01:54"}
{"current_steps": 650, "total_steps": 670, "eval_loss": 0.2017362266778946, "epoch": 9.62962962962963, "percentage": 97.01, "elapsed_time": "1:02:09", "remaining_time": "0:01:54"}
{"current_steps": 660, "total_steps": 670, "loss": 0.1469, "lr": 3.392164434669609e-09, "epoch": 9.777777777777779, "percentage": 98.51, "elapsed_time": "1:03:06", "remaining_time": "0:00:57"}
{"current_steps": 670, "total_steps": 670, "loss": 0.163, "lr": 0.0, "epoch": 9.925925925925926, "percentage": 100.0, "elapsed_time": "1:03:57", "remaining_time": "0:00:00"}
{"current_steps": 670, "total_steps": 670, "epoch": 9.925925925925926, "percentage": 100.0, "elapsed_time": "1:04:03", "remaining_time": "0:00:00"}