Qwen2.5-7B-t13 / trainer_log.jsonl
AiMijie's picture
Upload 15 files
3c4129b verified
{"current_steps": 1, "total_steps": 43, "loss": 2.0516, "lr": 0.0, "epoch": 0.023071377072819033, "percentage": 2.33, "elapsed_time": "0:00:16", "remaining_time": "0:11:21"}
{"current_steps": 2, "total_steps": 43, "loss": 2.1984, "lr": 2.0000000000000003e-06, "epoch": 0.046142754145638065, "percentage": 4.65, "elapsed_time": "0:00:30", "remaining_time": "0:10:33"}
{"current_steps": 3, "total_steps": 43, "loss": 2.0262, "lr": 4.000000000000001e-06, "epoch": 0.0692141312184571, "percentage": 6.98, "elapsed_time": "0:00:45", "remaining_time": "0:10:10"}
{"current_steps": 4, "total_steps": 43, "loss": 1.9887, "lr": 6e-06, "epoch": 0.09228550829127613, "percentage": 9.3, "elapsed_time": "0:01:01", "remaining_time": "0:09:56"}
{"current_steps": 5, "total_steps": 43, "loss": 1.8539, "lr": 8.000000000000001e-06, "epoch": 0.11535688536409516, "percentage": 11.63, "elapsed_time": "0:01:16", "remaining_time": "0:09:42"}
{"current_steps": 6, "total_steps": 43, "loss": 1.6958, "lr": 1e-05, "epoch": 0.1384282624369142, "percentage": 13.95, "elapsed_time": "0:01:31", "remaining_time": "0:09:27"}
{"current_steps": 7, "total_steps": 43, "loss": 1.5919, "lr": 9.98292246503335e-06, "epoch": 0.16149963950973323, "percentage": 16.28, "elapsed_time": "0:01:46", "remaining_time": "0:09:08"}
{"current_steps": 8, "total_steps": 43, "loss": 1.4645, "lr": 9.931806517013612e-06, "epoch": 0.18457101658255226, "percentage": 18.6, "elapsed_time": "0:02:01", "remaining_time": "0:08:52"}
{"current_steps": 9, "total_steps": 43, "loss": 1.4254, "lr": 9.847001329696653e-06, "epoch": 0.2076423936553713, "percentage": 20.93, "elapsed_time": "0:02:17", "remaining_time": "0:08:40"}
{"current_steps": 10, "total_steps": 43, "loss": 1.3279, "lr": 9.729086208503174e-06, "epoch": 0.23071377072819033, "percentage": 23.26, "elapsed_time": "0:02:32", "remaining_time": "0:08:23"}
{"current_steps": 11, "total_steps": 43, "loss": 1.2615, "lr": 9.578866633275289e-06, "epoch": 0.25378514780100936, "percentage": 25.58, "elapsed_time": "0:02:47", "remaining_time": "0:08:07"}
{"current_steps": 12, "total_steps": 43, "loss": 1.198, "lr": 9.397368756032445e-06, "epoch": 0.2768565248738284, "percentage": 27.91, "elapsed_time": "0:03:03", "remaining_time": "0:07:52"}
{"current_steps": 13, "total_steps": 43, "loss": 1.2127, "lr": 9.185832391312644e-06, "epoch": 0.2999279019466474, "percentage": 30.23, "elapsed_time": "0:03:18", "remaining_time": "0:07:36"}
{"current_steps": 14, "total_steps": 43, "loss": 1.192, "lr": 8.94570254698197e-06, "epoch": 0.32299927901946646, "percentage": 32.56, "elapsed_time": "0:03:34", "remaining_time": "0:07:23"}
{"current_steps": 15, "total_steps": 43, "loss": 1.1819, "lr": 8.67861955336566e-06, "epoch": 0.3460706560922855, "percentage": 34.88, "elapsed_time": "0:03:48", "remaining_time": "0:07:06"}
{"current_steps": 16, "total_steps": 43, "loss": 1.1531, "lr": 8.386407858128707e-06, "epoch": 0.3691420331651045, "percentage": 37.21, "elapsed_time": "0:04:03", "remaining_time": "0:06:50"}
{"current_steps": 17, "total_steps": 43, "loss": 1.2092, "lr": 8.071063563448341e-06, "epoch": 0.39221341023792355, "percentage": 39.53, "elapsed_time": "0:04:18", "remaining_time": "0:06:35"}
{"current_steps": 18, "total_steps": 43, "loss": 1.1634, "lr": 7.734740790612137e-06, "epoch": 0.4152847873107426, "percentage": 41.86, "elapsed_time": "0:04:32", "remaining_time": "0:06:19"}
{"current_steps": 19, "total_steps": 43, "loss": 1.1431, "lr": 7.379736965185369e-06, "epoch": 0.4383561643835616, "percentage": 44.19, "elapsed_time": "0:04:48", "remaining_time": "0:06:04"}
{"current_steps": 20, "total_steps": 43, "loss": 1.1209, "lr": 7.008477123264849e-06, "epoch": 0.46142754145638065, "percentage": 46.51, "elapsed_time": "0:05:03", "remaining_time": "0:05:48"}
{"current_steps": 21, "total_steps": 43, "loss": 1.1877, "lr": 6.6234973460234184e-06, "epoch": 0.4844989185291997, "percentage": 48.84, "elapsed_time": "0:05:18", "remaining_time": "0:05:33"}
{"current_steps": 22, "total_steps": 43, "loss": 1.0835, "lr": 6.227427435703997e-06, "epoch": 0.5075702956020187, "percentage": 51.16, "elapsed_time": "0:05:33", "remaining_time": "0:05:18"}
{"current_steps": 23, "total_steps": 43, "loss": 1.0847, "lr": 5.82297295140367e-06, "epoch": 0.5306416726748377, "percentage": 53.49, "elapsed_time": "0:05:48", "remaining_time": "0:05:03"}
{"current_steps": 24, "total_steps": 43, "loss": 1.1755, "lr": 5.412896727361663e-06, "epoch": 0.5537130497476568, "percentage": 55.81, "elapsed_time": "0:06:04", "remaining_time": "0:04:48"}
{"current_steps": 25, "total_steps": 43, "loss": 1.1454, "lr": 5e-06, "epoch": 0.5767844268204758, "percentage": 58.14, "elapsed_time": "0:06:18", "remaining_time": "0:04:32"}
{"current_steps": 26, "total_steps": 43, "loss": 1.0624, "lr": 4.587103272638339e-06, "epoch": 0.5998558038932948, "percentage": 60.47, "elapsed_time": "0:06:34", "remaining_time": "0:04:17"}
{"current_steps": 27, "total_steps": 43, "loss": 1.1401, "lr": 4.17702704859633e-06, "epoch": 0.6229271809661139, "percentage": 62.79, "elapsed_time": "0:06:49", "remaining_time": "0:04:02"}
{"current_steps": 28, "total_steps": 43, "loss": 1.0402, "lr": 3.7725725642960047e-06, "epoch": 0.6459985580389329, "percentage": 65.12, "elapsed_time": "0:07:03", "remaining_time": "0:03:47"}
{"current_steps": 29, "total_steps": 43, "loss": 1.1484, "lr": 3.3765026539765832e-06, "epoch": 0.669069935111752, "percentage": 67.44, "elapsed_time": "0:07:18", "remaining_time": "0:03:31"}
{"current_steps": 30, "total_steps": 43, "loss": 1.0909, "lr": 2.991522876735154e-06, "epoch": 0.692141312184571, "percentage": 69.77, "elapsed_time": "0:07:33", "remaining_time": "0:03:16"}
{"current_steps": 31, "total_steps": 43, "loss": 1.118, "lr": 2.6202630348146323e-06, "epoch": 0.71521268925739, "percentage": 72.09, "elapsed_time": "0:07:49", "remaining_time": "0:03:01"}
{"current_steps": 32, "total_steps": 43, "loss": 1.0666, "lr": 2.265259209387867e-06, "epoch": 0.738284066330209, "percentage": 74.42, "elapsed_time": "0:08:04", "remaining_time": "0:02:46"}
{"current_steps": 33, "total_steps": 43, "loss": 1.086, "lr": 1.928936436551661e-06, "epoch": 0.7613554434030281, "percentage": 76.74, "elapsed_time": "0:08:19", "remaining_time": "0:02:31"}
{"current_steps": 34, "total_steps": 43, "loss": 1.0922, "lr": 1.6135921418712959e-06, "epoch": 0.7844268204758471, "percentage": 79.07, "elapsed_time": "0:08:34", "remaining_time": "0:02:16"}
{"current_steps": 35, "total_steps": 43, "loss": 1.0186, "lr": 1.321380446634342e-06, "epoch": 0.8074981975486661, "percentage": 81.4, "elapsed_time": "0:08:50", "remaining_time": "0:02:01"}
{"current_steps": 36, "total_steps": 43, "loss": 1.131, "lr": 1.0542974530180327e-06, "epoch": 0.8305695746214852, "percentage": 83.72, "elapsed_time": "0:09:04", "remaining_time": "0:01:45"}
{"current_steps": 37, "total_steps": 43, "loss": 1.0346, "lr": 8.141676086873574e-07, "epoch": 0.8536409516943042, "percentage": 86.05, "elapsed_time": "0:09:19", "remaining_time": "0:01:30"}
{"current_steps": 38, "total_steps": 43, "loss": 1.0757, "lr": 6.026312439675553e-07, "epoch": 0.8767123287671232, "percentage": 88.37, "elapsed_time": "0:09:34", "remaining_time": "0:01:15"}
{"current_steps": 39, "total_steps": 43, "loss": 1.1638, "lr": 4.211333667247125e-07, "epoch": 0.8997837058399423, "percentage": 90.7, "elapsed_time": "0:09:50", "remaining_time": "0:01:00"}
{"current_steps": 40, "total_steps": 43, "loss": 1.0145, "lr": 2.7091379149682683e-07, "epoch": 0.9228550829127613, "percentage": 93.02, "elapsed_time": "0:10:06", "remaining_time": "0:00:45"}
{"current_steps": 41, "total_steps": 43, "loss": 1.0958, "lr": 1.5299867030334815e-07, "epoch": 0.9459264599855803, "percentage": 95.35, "elapsed_time": "0:10:21", "remaining_time": "0:00:30"}
{"current_steps": 42, "total_steps": 43, "loss": 1.0899, "lr": 6.819348298638839e-08, "epoch": 0.9689978370583994, "percentage": 97.67, "elapsed_time": "0:10:36", "remaining_time": "0:00:15"}
{"current_steps": 43, "total_steps": 43, "loss": 1.0737, "lr": 1.7077534966650767e-08, "epoch": 0.9920692141312184, "percentage": 100.0, "elapsed_time": "0:10:52", "remaining_time": "0:00:00"}
{"current_steps": 43, "total_steps": 43, "epoch": 0.9920692141312184, "percentage": 100.0, "elapsed_time": "0:11:19", "remaining_time": "0:00:00"}