QFFT-LIMO-7B / trainer_log.jsonl
lwl-uestc's picture
Upload folder using huggingface_hub
16f8cd5 verified
{"current_steps": 10, "total_steps": 612, "loss": 0.8809, "lr": 1.4516129032258066e-06, "epoch": 0.0975609756097561, "percentage": 1.63, "elapsed_time": "0:02:46", "remaining_time": "2:46:59"}
{"current_steps": 20, "total_steps": 612, "loss": 0.8044, "lr": 3.0645161290322584e-06, "epoch": 0.1951219512195122, "percentage": 3.27, "elapsed_time": "0:05:24", "remaining_time": "2:40:02"}
{"current_steps": 30, "total_steps": 612, "loss": 0.7459, "lr": 4.67741935483871e-06, "epoch": 0.2926829268292683, "percentage": 4.9, "elapsed_time": "0:08:13", "remaining_time": "2:39:29"}
{"current_steps": 40, "total_steps": 612, "loss": 0.727, "lr": 6.290322580645162e-06, "epoch": 0.3902439024390244, "percentage": 6.54, "elapsed_time": "0:10:53", "remaining_time": "2:35:49"}
{"current_steps": 50, "total_steps": 612, "loss": 0.6279, "lr": 7.903225806451613e-06, "epoch": 0.4878048780487805, "percentage": 8.17, "elapsed_time": "0:13:34", "remaining_time": "2:32:40"}
{"current_steps": 60, "total_steps": 612, "loss": 0.6367, "lr": 9.516129032258065e-06, "epoch": 0.5853658536585366, "percentage": 9.8, "elapsed_time": "0:16:31", "remaining_time": "2:31:57"}
{"current_steps": 70, "total_steps": 612, "loss": 0.689, "lr": 9.996003750499608e-06, "epoch": 0.6829268292682927, "percentage": 11.44, "elapsed_time": "0:19:01", "remaining_time": "2:27:20"}
{"current_steps": 80, "total_steps": 612, "loss": 0.6537, "lr": 9.976445660039118e-06, "epoch": 0.7804878048780488, "percentage": 13.07, "elapsed_time": "0:21:50", "remaining_time": "2:25:12"}
{"current_steps": 90, "total_steps": 612, "loss": 0.6421, "lr": 9.940655438201113e-06, "epoch": 0.8780487804878049, "percentage": 14.71, "elapsed_time": "0:24:40", "remaining_time": "2:23:05"}
{"current_steps": 100, "total_steps": 612, "loss": 0.6039, "lr": 9.888749825250151e-06, "epoch": 0.975609756097561, "percentage": 16.34, "elapsed_time": "0:27:24", "remaining_time": "2:20:21"}
{"current_steps": 110, "total_steps": 612, "loss": 0.5969, "lr": 9.820898126506978e-06, "epoch": 1.0682926829268293, "percentage": 17.97, "elapsed_time": "0:30:21", "remaining_time": "2:18:34"}
{"current_steps": 120, "total_steps": 612, "loss": 0.516, "lr": 9.737321660109767e-06, "epoch": 1.1658536585365853, "percentage": 19.61, "elapsed_time": "0:33:08", "remaining_time": "2:15:51"}
{"current_steps": 130, "total_steps": 612, "loss": 0.5287, "lr": 9.638293035120342e-06, "epoch": 1.2634146341463415, "percentage": 21.24, "elapsed_time": "0:36:00", "remaining_time": "2:13:31"}
{"current_steps": 140, "total_steps": 612, "loss": 0.5411, "lr": 9.524135262330098e-06, "epoch": 1.3609756097560974, "percentage": 22.88, "elapsed_time": "0:38:57", "remaining_time": "2:11:19"}
{"current_steps": 150, "total_steps": 612, "loss": 0.5023, "lr": 9.395220700665924e-06, "epoch": 1.4585365853658536, "percentage": 24.51, "elapsed_time": "0:41:49", "remaining_time": "2:08:49"}
{"current_steps": 160, "total_steps": 612, "loss": 0.5487, "lr": 9.251969842632785e-06, "epoch": 1.5560975609756098, "percentage": 26.14, "elapsed_time": "0:44:30", "remaining_time": "2:05:43"}
{"current_steps": 170, "total_steps": 612, "loss": 0.491, "lr": 9.094849942754564e-06, "epoch": 1.653658536585366, "percentage": 27.78, "elapsed_time": "0:47:13", "remaining_time": "2:02:45"}
{"current_steps": 180, "total_steps": 612, "loss": 0.4901, "lr": 8.924373493486941e-06, "epoch": 1.751219512195122, "percentage": 29.41, "elapsed_time": "0:49:34", "remaining_time": "1:58:59"}
{"current_steps": 190, "total_steps": 612, "loss": 0.5439, "lr": 8.741096553573506e-06, "epoch": 1.848780487804878, "percentage": 31.05, "elapsed_time": "0:51:58", "remaining_time": "1:55:25"}
{"current_steps": 200, "total_steps": 612, "loss": 0.5212, "lr": 8.545616934297733e-06, "epoch": 1.946341463414634, "percentage": 32.68, "elapsed_time": "0:54:47", "remaining_time": "1:52:52"}
{"current_steps": 210, "total_steps": 612, "loss": 0.49, "lr": 8.338572249546813e-06, "epoch": 2.0390243902439025, "percentage": 34.31, "elapsed_time": "0:57:58", "remaining_time": "1:50:58"}
{"current_steps": 220, "total_steps": 612, "loss": 0.4122, "lr": 8.120637836047698e-06, "epoch": 2.1365853658536587, "percentage": 35.95, "elapsed_time": "1:00:47", "remaining_time": "1:48:19"}
{"current_steps": 230, "total_steps": 612, "loss": 0.3693, "lr": 7.892524550559056e-06, "epoch": 2.234146341463415, "percentage": 37.58, "elapsed_time": "1:03:15", "remaining_time": "1:45:04"}
{"current_steps": 240, "total_steps": 612, "loss": 0.3851, "lr": 7.654976451204288e-06, "epoch": 2.3317073170731706, "percentage": 39.22, "elapsed_time": "1:05:51", "remaining_time": "1:42:05"}
{"current_steps": 250, "total_steps": 612, "loss": 0.377, "lr": 7.408768370508577e-06, "epoch": 2.4292682926829268, "percentage": 40.85, "elapsed_time": "1:08:44", "remaining_time": "1:39:31"}
{"current_steps": 260, "total_steps": 612, "loss": 0.3864, "lr": 7.154703388056246e-06, "epoch": 2.526829268292683, "percentage": 42.48, "elapsed_time": "1:11:26", "remaining_time": "1:36:42"}
{"current_steps": 270, "total_steps": 612, "loss": 0.3881, "lr": 6.893610211012067e-06, "epoch": 2.624390243902439, "percentage": 44.12, "elapsed_time": "1:13:55", "remaining_time": "1:33:37"}
{"current_steps": 280, "total_steps": 612, "loss": 0.4051, "lr": 6.6263404710507495e-06, "epoch": 2.721951219512195, "percentage": 45.75, "elapsed_time": "1:16:31", "remaining_time": "1:30:43"}
{"current_steps": 290, "total_steps": 612, "loss": 0.4061, "lr": 6.3537659465114275e-06, "epoch": 2.819512195121951, "percentage": 47.39, "elapsed_time": "1:19:22", "remaining_time": "1:28:07"}
{"current_steps": 300, "total_steps": 612, "loss": 0.3537, "lr": 6.076775718837911e-06, "epoch": 2.9170731707317072, "percentage": 49.02, "elapsed_time": "1:22:11", "remaining_time": "1:25:29"}
{"current_steps": 310, "total_steps": 612, "loss": 0.3309, "lr": 5.796273272579823e-06, "epoch": 3.0097560975609756, "percentage": 50.65, "elapsed_time": "1:25:05", "remaining_time": "1:22:53"}
{"current_steps": 320, "total_steps": 612, "loss": 0.2277, "lr": 5.513173548413789e-06, "epoch": 3.107317073170732, "percentage": 52.29, "elapsed_time": "1:27:43", "remaining_time": "1:20:03"}
{"current_steps": 330, "total_steps": 612, "loss": 0.2754, "lr": 5.228399958797117e-06, "epoch": 3.204878048780488, "percentage": 53.92, "elapsed_time": "1:30:31", "remaining_time": "1:17:21"}
{"current_steps": 340, "total_steps": 612, "loss": 0.2226, "lr": 4.9428813759883e-06, "epoch": 3.3024390243902437, "percentage": 55.56, "elapsed_time": "1:33:15", "remaining_time": "1:14:36"}
{"current_steps": 350, "total_steps": 612, "loss": 0.3032, "lr": 4.6575491022587714e-06, "epoch": 3.4, "percentage": 57.19, "elapsed_time": "1:35:51", "remaining_time": "1:11:45"}
{"current_steps": 360, "total_steps": 612, "loss": 0.2326, "lr": 4.373333832178478e-06, "epoch": 3.497560975609756, "percentage": 58.82, "elapsed_time": "1:38:35", "remaining_time": "1:09:00"}
{"current_steps": 370, "total_steps": 612, "loss": 0.3115, "lr": 4.091162616883634e-06, "epoch": 3.5951219512195123, "percentage": 60.46, "elapsed_time": "1:41:19", "remaining_time": "1:06:16"}
{"current_steps": 380, "total_steps": 612, "loss": 0.2202, "lr": 3.8119558402285994e-06, "epoch": 3.692682926829268, "percentage": 62.09, "elapsed_time": "1:43:52", "remaining_time": "1:03:25"}
{"current_steps": 390, "total_steps": 612, "loss": 0.2969, "lr": 3.5366242166850624e-06, "epoch": 3.790243902439024, "percentage": 63.73, "elapsed_time": "1:46:26", "remaining_time": "1:00:35"}
{"current_steps": 400, "total_steps": 612, "loss": 0.237, "lr": 3.2660658207807205e-06, "epoch": 3.8878048780487804, "percentage": 65.36, "elapsed_time": "1:49:01", "remaining_time": "0:57:46"}
{"current_steps": 410, "total_steps": 612, "loss": 0.2668, "lr": 3.0011631577668327e-06, "epoch": 3.9853658536585366, "percentage": 66.99, "elapsed_time": "1:51:43", "remaining_time": "0:55:02"}
{"current_steps": 420, "total_steps": 612, "loss": 0.1837, "lr": 2.7427802850695306e-06, "epoch": 4.078048780487805, "percentage": 68.63, "elapsed_time": "1:54:52", "remaining_time": "0:52:30"}
{"current_steps": 430, "total_steps": 612, "loss": 0.196, "lr": 2.4917599939140884e-06, "epoch": 4.175609756097561, "percentage": 70.26, "elapsed_time": "1:57:45", "remaining_time": "0:49:50"}
{"current_steps": 440, "total_steps": 612, "loss": 0.1483, "lr": 2.2489210603151144e-06, "epoch": 4.273170731707317, "percentage": 71.9, "elapsed_time": "2:00:35", "remaining_time": "0:47:08"}
{"current_steps": 450, "total_steps": 612, "loss": 0.1495, "lr": 2.015055574399388e-06, "epoch": 4.3707317073170735, "percentage": 73.53, "elapsed_time": "2:03:10", "remaining_time": "0:44:20"}
{"current_steps": 460, "total_steps": 612, "loss": 0.1489, "lr": 1.7909263567724917e-06, "epoch": 4.46829268292683, "percentage": 75.16, "elapsed_time": "2:05:59", "remaining_time": "0:41:38"}
{"current_steps": 470, "total_steps": 612, "loss": 0.1702, "lr": 1.5772644703565564e-06, "epoch": 4.565853658536585, "percentage": 76.8, "elapsed_time": "2:08:49", "remaining_time": "0:38:55"}
{"current_steps": 480, "total_steps": 612, "loss": 0.1774, "lr": 1.3747668358149658e-06, "epoch": 4.663414634146341, "percentage": 78.43, "elapsed_time": "2:11:34", "remaining_time": "0:36:11"}
{"current_steps": 490, "total_steps": 612, "loss": 0.1462, "lr": 1.1840939583419986e-06, "epoch": 4.760975609756097, "percentage": 80.07, "elapsed_time": "2:14:21", "remaining_time": "0:33:27"}
{"current_steps": 500, "total_steps": 612, "loss": 0.1865, "lr": 1.0058677732321826e-06, "epoch": 4.8585365853658535, "percentage": 81.7, "elapsed_time": "2:16:56", "remaining_time": "0:30:40"}
{"current_steps": 510, "total_steps": 612, "loss": 0.1795, "lr": 8.406696172566258e-07, "epoch": 4.95609756097561, "percentage": 83.33, "elapsed_time": "2:19:33", "remaining_time": "0:27:54"}
{"current_steps": 520, "total_steps": 612, "loss": 0.157, "lr": 6.890383324633121e-07, "epoch": 5.048780487804878, "percentage": 84.97, "elapsed_time": "2:22:41", "remaining_time": "0:25:14"}
{"current_steps": 530, "total_steps": 612, "loss": 0.1632, "lr": 5.514685085863286e-07, "epoch": 5.146341463414634, "percentage": 86.6, "elapsed_time": "2:25:24", "remaining_time": "0:22:29"}
{"current_steps": 540, "total_steps": 612, "loss": 0.1269, "lr": 4.2840886979696074e-07, "epoch": 5.2439024390243905, "percentage": 88.24, "elapsed_time": "2:28:24", "remaining_time": "0:19:47"}
{"current_steps": 550, "total_steps": 612, "loss": 0.1096, "lr": 3.2026081105871634e-07, "epoch": 5.341463414634147, "percentage": 89.87, "elapsed_time": "2:31:21", "remaining_time": "0:17:03"}
{"current_steps": 560, "total_steps": 612, "loss": 0.1133, "lr": 2.2737708886037823e-07, "epoch": 5.439024390243903, "percentage": 91.5, "elapsed_time": "2:33:55", "remaining_time": "0:14:17"}
{"current_steps": 570, "total_steps": 612, "loss": 0.1188, "lr": 1.5006067059766484e-07, "epoch": 5.536585365853659, "percentage": 93.14, "elapsed_time": "2:36:33", "remaining_time": "0:11:32"}
{"current_steps": 580, "total_steps": 612, "loss": 0.1069, "lr": 8.856374635655696e-08, "epoch": 5.634146341463414, "percentage": 94.77, "elapsed_time": "2:39:23", "remaining_time": "0:08:47"}
{"current_steps": 590, "total_steps": 612, "loss": 0.0943, "lr": 4.3086906321652136e-08, "epoch": 5.7317073170731705, "percentage": 96.41, "elapsed_time": "2:42:07", "remaining_time": "0:06:02"}
{"current_steps": 600, "total_steps": 612, "loss": 0.1061, "lr": 1.3778486492681542e-08, "epoch": 5.829268292682927, "percentage": 98.04, "elapsed_time": "2:44:56", "remaining_time": "0:03:17"}
{"current_steps": 610, "total_steps": 612, "loss": 0.1294, "lr": 7.340848433040615e-10, "epoch": 5.926829268292683, "percentage": 99.67, "elapsed_time": "2:47:26", "remaining_time": "0:00:32"}
{"current_steps": 612, "total_steps": 612, "epoch": 5.946341463414634, "percentage": 100.0, "elapsed_time": "2:48:24", "remaining_time": "0:00:00"}