Light-R1-SFTData / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
7223987 verified
{"current_steps": 1, "total_steps": 183, "loss": 0.7971, "lr": 4.210526315789474e-06, "epoch": 0.016243654822335026, "percentage": 0.55, "elapsed_time": "0:04:34", "remaining_time": "13:52:26"}
{"current_steps": 2, "total_steps": 183, "loss": 0.8013, "lr": 8.421052631578948e-06, "epoch": 0.03248730964467005, "percentage": 1.09, "elapsed_time": "0:08:14", "remaining_time": "12:26:08"}
{"current_steps": 3, "total_steps": 183, "loss": 0.7483, "lr": 1.263157894736842e-05, "epoch": 0.048730964467005075, "percentage": 1.64, "elapsed_time": "0:11:54", "remaining_time": "11:54:39"}
{"current_steps": 4, "total_steps": 183, "loss": 0.696, "lr": 1.6842105263157896e-05, "epoch": 0.0649746192893401, "percentage": 2.19, "elapsed_time": "0:15:34", "remaining_time": "11:37:10"}
{"current_steps": 5, "total_steps": 183, "loss": 0.7237, "lr": 2.105263157894737e-05, "epoch": 0.08121827411167512, "percentage": 2.73, "elapsed_time": "0:19:14", "remaining_time": "11:25:06"}
{"current_steps": 6, "total_steps": 183, "loss": 0.7683, "lr": 2.526315789473684e-05, "epoch": 0.09746192893401015, "percentage": 3.28, "elapsed_time": "0:22:54", "remaining_time": "11:15:48"}
{"current_steps": 7, "total_steps": 183, "loss": 0.7212, "lr": 2.9473684210526317e-05, "epoch": 0.11370558375634518, "percentage": 3.83, "elapsed_time": "0:26:34", "remaining_time": "11:08:16"}
{"current_steps": 8, "total_steps": 183, "loss": 0.6675, "lr": 3.368421052631579e-05, "epoch": 0.1299492385786802, "percentage": 4.37, "elapsed_time": "0:30:15", "remaining_time": "11:01:47"}
{"current_steps": 9, "total_steps": 183, "loss": 0.6339, "lr": 3.789473684210526e-05, "epoch": 0.14619289340101524, "percentage": 4.92, "elapsed_time": "0:33:55", "remaining_time": "10:55:55"}
{"current_steps": 10, "total_steps": 183, "loss": 0.6086, "lr": 4.210526315789474e-05, "epoch": 0.16243654822335024, "percentage": 5.46, "elapsed_time": "0:37:35", "remaining_time": "10:50:27"}
{"current_steps": 11, "total_steps": 183, "loss": 0.5825, "lr": 4.6315789473684214e-05, "epoch": 0.17868020304568527, "percentage": 6.01, "elapsed_time": "0:41:16", "remaining_time": "10:45:23"}
{"current_steps": 12, "total_steps": 183, "loss": 0.5701, "lr": 5.052631578947368e-05, "epoch": 0.1949238578680203, "percentage": 6.56, "elapsed_time": "0:44:57", "remaining_time": "10:40:34"}
{"current_steps": 13, "total_steps": 183, "loss": 0.5649, "lr": 5.4736842105263165e-05, "epoch": 0.21116751269035533, "percentage": 7.1, "elapsed_time": "0:48:37", "remaining_time": "10:35:47"}
{"current_steps": 14, "total_steps": 183, "loss": 0.5556, "lr": 5.8947368421052634e-05, "epoch": 0.22741116751269036, "percentage": 7.65, "elapsed_time": "0:52:17", "remaining_time": "10:31:09"}
{"current_steps": 15, "total_steps": 183, "loss": 0.5472, "lr": 6.315789473684212e-05, "epoch": 0.2436548223350254, "percentage": 8.2, "elapsed_time": "0:55:57", "remaining_time": "10:26:41"}
{"current_steps": 16, "total_steps": 183, "loss": 0.5383, "lr": 6.736842105263159e-05, "epoch": 0.2598984771573604, "percentage": 8.74, "elapsed_time": "0:59:36", "remaining_time": "10:22:13"}
{"current_steps": 17, "total_steps": 183, "loss": 0.5259, "lr": 7.157894736842105e-05, "epoch": 0.27614213197969545, "percentage": 9.29, "elapsed_time": "1:03:17", "remaining_time": "10:17:59"}
{"current_steps": 18, "total_steps": 183, "loss": 0.5215, "lr": 7.578947368421052e-05, "epoch": 0.2923857868020305, "percentage": 9.84, "elapsed_time": "1:06:57", "remaining_time": "10:13:44"}
{"current_steps": 19, "total_steps": 183, "loss": 0.5219, "lr": 8e-05, "epoch": 0.3086294416243655, "percentage": 10.38, "elapsed_time": "1:10:37", "remaining_time": "10:09:37"}
{"current_steps": 20, "total_steps": 183, "loss": 0.5159, "lr": 7.999266113727178e-05, "epoch": 0.3248730964467005, "percentage": 10.93, "elapsed_time": "1:14:17", "remaining_time": "10:05:27"}
{"current_steps": 21, "total_steps": 183, "loss": 0.5082, "lr": 7.99706472420324e-05, "epoch": 0.3411167512690355, "percentage": 11.48, "elapsed_time": "1:17:57", "remaining_time": "10:01:24"}
{"current_steps": 22, "total_steps": 183, "loss": 0.5065, "lr": 7.993396639212965e-05, "epoch": 0.35736040609137054, "percentage": 12.02, "elapsed_time": "1:21:37", "remaining_time": "9:57:23"}
{"current_steps": 23, "total_steps": 183, "loss": 0.5082, "lr": 7.988263204734962e-05, "epoch": 0.37360406091370557, "percentage": 12.57, "elapsed_time": "1:25:17", "remaining_time": "9:53:19"}
{"current_steps": 24, "total_steps": 183, "loss": 0.5009, "lr": 7.98166630444778e-05, "epoch": 0.3898477157360406, "percentage": 13.11, "elapsed_time": "1:28:58", "remaining_time": "9:49:24"}
{"current_steps": 25, "total_steps": 183, "loss": 0.4935, "lr": 7.973608359038701e-05, "epoch": 0.40609137055837563, "percentage": 13.66, "elapsed_time": "1:32:38", "remaining_time": "9:45:27"}
{"current_steps": 26, "total_steps": 183, "loss": 0.4869, "lr": 7.964092325315485e-05, "epoch": 0.42233502538071066, "percentage": 14.21, "elapsed_time": "1:36:18", "remaining_time": "9:41:33"}
{"current_steps": 27, "total_steps": 183, "loss": 0.492, "lr": 7.953121695121395e-05, "epoch": 0.4385786802030457, "percentage": 14.75, "elapsed_time": "1:39:59", "remaining_time": "9:37:41"}
{"current_steps": 28, "total_steps": 183, "loss": 0.4773, "lr": 7.94070049405388e-05, "epoch": 0.4548223350253807, "percentage": 15.3, "elapsed_time": "1:43:39", "remaining_time": "9:33:50"}
{"current_steps": 29, "total_steps": 183, "loss": 0.4869, "lr": 7.926833279987421e-05, "epoch": 0.47106598984771575, "percentage": 15.85, "elapsed_time": "1:47:20", "remaining_time": "9:29:59"}
{"current_steps": 30, "total_steps": 183, "loss": 0.4752, "lr": 7.911525141401037e-05, "epoch": 0.4873096446700508, "percentage": 16.39, "elapsed_time": "1:51:00", "remaining_time": "9:26:07"}
{"current_steps": 31, "total_steps": 183, "loss": 0.4811, "lr": 7.894781695511117e-05, "epoch": 0.5035532994923858, "percentage": 16.94, "elapsed_time": "1:54:40", "remaining_time": "9:22:18"}
{"current_steps": 32, "total_steps": 183, "loss": 0.4832, "lr": 7.876609086210207e-05, "epoch": 0.5197969543147208, "percentage": 17.49, "elapsed_time": "1:58:21", "remaining_time": "9:18:28"}
{"current_steps": 33, "total_steps": 183, "loss": 0.4706, "lr": 7.857013981812564e-05, "epoch": 0.5360406091370559, "percentage": 18.03, "elapsed_time": "2:02:01", "remaining_time": "9:14:39"}
{"current_steps": 34, "total_steps": 183, "loss": 0.4933, "lr": 7.836003572607253e-05, "epoch": 0.5522842639593909, "percentage": 18.58, "elapsed_time": "2:05:41", "remaining_time": "9:10:51"}
{"current_steps": 35, "total_steps": 183, "loss": 0.4735, "lr": 7.813585568219723e-05, "epoch": 0.5685279187817259, "percentage": 19.13, "elapsed_time": "2:09:22", "remaining_time": "9:07:02"}
{"current_steps": 36, "total_steps": 183, "loss": 0.4795, "lr": 7.789768194782818e-05, "epoch": 0.584771573604061, "percentage": 19.67, "elapsed_time": "2:13:02", "remaining_time": "9:03:13"}
{"current_steps": 37, "total_steps": 183, "loss": 0.4739, "lr": 7.764560191918247e-05, "epoch": 0.601015228426396, "percentage": 20.22, "elapsed_time": "2:16:41", "remaining_time": "8:59:24"}
{"current_steps": 38, "total_steps": 183, "loss": 0.4665, "lr": 7.737970809529645e-05, "epoch": 0.617258883248731, "percentage": 20.77, "elapsed_time": "2:20:21", "remaining_time": "8:55:36"}
{"current_steps": 39, "total_steps": 183, "loss": 0.4616, "lr": 7.71000980440838e-05, "epoch": 0.6335025380710659, "percentage": 21.31, "elapsed_time": "2:24:01", "remaining_time": "8:51:48"}
{"current_steps": 40, "total_steps": 183, "loss": 0.4578, "lr": 7.680687436653367e-05, "epoch": 0.649746192893401, "percentage": 21.86, "elapsed_time": "2:27:41", "remaining_time": "8:48:00"}
{"current_steps": 41, "total_steps": 183, "loss": 0.4532, "lr": 7.650014465906201e-05, "epoch": 0.665989847715736, "percentage": 22.4, "elapsed_time": "2:31:21", "remaining_time": "8:44:13"}
{"current_steps": 42, "total_steps": 183, "loss": 0.4504, "lr": 7.618002147402967e-05, "epoch": 0.682233502538071, "percentage": 22.95, "elapsed_time": "2:35:02", "remaining_time": "8:40:28"}
{"current_steps": 43, "total_steps": 183, "loss": 0.4514, "lr": 7.584662227844223e-05, "epoch": 0.698477157360406, "percentage": 23.5, "elapsed_time": "2:38:42", "remaining_time": "8:36:43"}
{"current_steps": 44, "total_steps": 183, "loss": 0.4531, "lr": 7.550006941084619e-05, "epoch": 0.7147208121827411, "percentage": 24.04, "elapsed_time": "2:42:22", "remaining_time": "8:32:56"}
{"current_steps": 45, "total_steps": 183, "loss": 0.441, "lr": 7.51404900364377e-05, "epoch": 0.7309644670050761, "percentage": 24.59, "elapsed_time": "2:46:01", "remaining_time": "8:29:09"}
{"current_steps": 46, "total_steps": 183, "loss": 0.4404, "lr": 7.476801610040021e-05, "epoch": 0.7472081218274111, "percentage": 25.14, "elapsed_time": "2:49:41", "remaining_time": "8:25:23"}
{"current_steps": 47, "total_steps": 183, "loss": 0.4382, "lr": 7.438278427948805e-05, "epoch": 0.7634517766497462, "percentage": 25.68, "elapsed_time": "2:53:21", "remaining_time": "8:21:38"}
{"current_steps": 48, "total_steps": 183, "loss": 0.4373, "lr": 7.398493593187383e-05, "epoch": 0.7796954314720812, "percentage": 26.23, "elapsed_time": "2:57:01", "remaining_time": "8:17:53"}
{"current_steps": 49, "total_steps": 183, "loss": 0.4373, "lr": 7.357461704527802e-05, "epoch": 0.7959390862944162, "percentage": 26.78, "elapsed_time": "3:00:41", "remaining_time": "8:14:08"}
{"current_steps": 50, "total_steps": 183, "loss": 0.4406, "lr": 7.315197818339979e-05, "epoch": 0.8121827411167513, "percentage": 27.32, "elapsed_time": "3:04:21", "remaining_time": "8:10:23"}
{"current_steps": 51, "total_steps": 183, "loss": 0.4344, "lr": 7.271717443066871e-05, "epoch": 0.8284263959390863, "percentage": 27.87, "elapsed_time": "3:08:01", "remaining_time": "8:06:39"}
{"current_steps": 52, "total_steps": 183, "loss": 0.433, "lr": 7.227036533533753e-05, "epoch": 0.8446700507614213, "percentage": 28.42, "elapsed_time": "3:11:41", "remaining_time": "8:02:54"}
{"current_steps": 53, "total_steps": 183, "loss": 0.4304, "lr": 7.181171485093706e-05, "epoch": 0.8609137055837564, "percentage": 28.96, "elapsed_time": "3:15:21", "remaining_time": "7:59:10"}
{"current_steps": 54, "total_steps": 183, "loss": 0.4221, "lr": 7.134139127611457e-05, "epoch": 0.8771573604060914, "percentage": 29.51, "elapsed_time": "3:19:01", "remaining_time": "7:55:27"}
{"current_steps": 55, "total_steps": 183, "loss": 0.4288, "lr": 7.085956719287773e-05, "epoch": 0.8934010152284264, "percentage": 30.05, "elapsed_time": "3:22:41", "remaining_time": "7:51:43"}
{"current_steps": 56, "total_steps": 183, "loss": 0.4271, "lr": 7.036641940326682e-05, "epoch": 0.9096446700507614, "percentage": 30.6, "elapsed_time": "3:26:22", "remaining_time": "7:48:00"}
{"current_steps": 57, "total_steps": 183, "loss": 0.4313, "lr": 6.986212886447851e-05, "epoch": 0.9258883248730965, "percentage": 31.15, "elapsed_time": "3:30:01", "remaining_time": "7:44:16"}
{"current_steps": 58, "total_steps": 183, "loss": 0.4218, "lr": 6.934688062246474e-05, "epoch": 0.9421319796954315, "percentage": 31.69, "elapsed_time": "3:33:41", "remaining_time": "7:40:33"}
{"current_steps": 59, "total_steps": 183, "loss": 0.4348, "lr": 6.882086374403148e-05, "epoch": 0.9583756345177665, "percentage": 32.24, "elapsed_time": "3:37:21", "remaining_time": "7:36:49"}
{"current_steps": 60, "total_steps": 183, "loss": 0.4272, "lr": 6.828427124746191e-05, "epoch": 0.9746192893401016, "percentage": 32.79, "elapsed_time": "3:41:01", "remaining_time": "7:33:05"}
{"current_steps": 61, "total_steps": 183, "loss": 0.4279, "lr": 6.773730003168967e-05, "epoch": 0.9908629441624366, "percentage": 33.33, "elapsed_time": "3:44:41", "remaining_time": "7:29:22"}
{"current_steps": 62, "total_steps": 183, "loss": 0.691, "lr": 6.718015080404824e-05, "epoch": 1.0101522842639594, "percentage": 33.88, "elapsed_time": "3:49:44", "remaining_time": "7:28:21"}
{"current_steps": 63, "total_steps": 183, "loss": 0.4051, "lr": 6.661302800662261e-05, "epoch": 1.0263959390862945, "percentage": 34.43, "elapsed_time": "3:53:23", "remaining_time": "7:24:33"}
{"current_steps": 64, "total_steps": 183, "loss": 0.4116, "lr": 6.603613974123086e-05, "epoch": 1.0426395939086295, "percentage": 34.97, "elapsed_time": "3:57:04", "remaining_time": "7:20:47"}
{"current_steps": 65, "total_steps": 183, "loss": 0.4076, "lr": 6.54496976930624e-05, "epoch": 1.0588832487309645, "percentage": 35.52, "elapsed_time": "4:00:43", "remaining_time": "7:17:01"}
{"current_steps": 66, "total_steps": 183, "loss": 0.4069, "lr": 6.485391705300173e-05, "epoch": 1.0751269035532995, "percentage": 36.07, "elapsed_time": "4:04:23", "remaining_time": "7:13:14"}
{"current_steps": 67, "total_steps": 183, "loss": 0.4011, "lr": 6.424901643866553e-05, "epoch": 1.0913705583756346, "percentage": 36.61, "elapsed_time": "4:08:03", "remaining_time": "7:09:29"}
{"current_steps": 68, "total_steps": 183, "loss": 0.4033, "lr": 6.363521781418243e-05, "epoch": 1.1076142131979696, "percentage": 37.16, "elapsed_time": "4:11:43", "remaining_time": "7:05:43"}
{"current_steps": 69, "total_steps": 183, "loss": 0.4032, "lr": 6.301274640874483e-05, "epoch": 1.1238578680203046, "percentage": 37.7, "elapsed_time": "4:15:23", "remaining_time": "7:01:57"}
{"current_steps": 70, "total_steps": 183, "loss": 0.397, "lr": 6.238183063396257e-05, "epoch": 1.1401015228426397, "percentage": 38.25, "elapsed_time": "4:19:03", "remaining_time": "6:58:11"}
{"current_steps": 71, "total_steps": 183, "loss": 0.3919, "lr": 6.174270200004885e-05, "epoch": 1.1563451776649747, "percentage": 38.8, "elapsed_time": "4:22:43", "remaining_time": "6:54:26"}
{"current_steps": 72, "total_steps": 183, "loss": 0.4003, "lr": 6.109559503086918e-05, "epoch": 1.1725888324873097, "percentage": 39.34, "elapsed_time": "4:26:23", "remaining_time": "6:50:41"}
{"current_steps": 73, "total_steps": 183, "loss": 0.3989, "lr": 6.044074717788442e-05, "epoch": 1.1888324873096447, "percentage": 39.89, "elapsed_time": "4:30:03", "remaining_time": "6:46:56"}
{"current_steps": 74, "total_steps": 183, "loss": 0.3908, "lr": 5.9778398733019614e-05, "epoch": 1.2050761421319798, "percentage": 40.44, "elapsed_time": "4:33:43", "remaining_time": "6:43:11"}
{"current_steps": 75, "total_steps": 183, "loss": 0.3987, "lr": 5.910879274049052e-05, "epoch": 1.2213197969543148, "percentage": 40.98, "elapsed_time": "4:37:23", "remaining_time": "6:39:27"}
{"current_steps": 76, "total_steps": 183, "loss": 0.4045, "lr": 5.84321749076202e-05, "epoch": 1.2375634517766498, "percentage": 41.53, "elapsed_time": "4:41:03", "remaining_time": "6:35:41"}
{"current_steps": 77, "total_steps": 183, "loss": 0.4017, "lr": 5.7748793514678394e-05, "epoch": 1.2538071065989849, "percentage": 42.08, "elapsed_time": "4:44:43", "remaining_time": "6:31:57"}
{"current_steps": 78, "total_steps": 183, "loss": 0.3972, "lr": 5.705889932377679e-05, "epoch": 1.2700507614213197, "percentage": 42.62, "elapsed_time": "4:48:23", "remaining_time": "6:28:13"}
{"current_steps": 79, "total_steps": 183, "loss": 0.4009, "lr": 5.636274548685361e-05, "epoch": 1.286294416243655, "percentage": 43.17, "elapsed_time": "4:52:04", "remaining_time": "6:24:30"}
{"current_steps": 80, "total_steps": 183, "loss": 0.39, "lr": 5.566058745278117e-05, "epoch": 1.3025380710659897, "percentage": 43.72, "elapsed_time": "4:55:43", "remaining_time": "6:20:45"}
{"current_steps": 81, "total_steps": 183, "loss": 0.3979, "lr": 5.4952682873630755e-05, "epoch": 1.318781725888325, "percentage": 44.26, "elapsed_time": "4:59:23", "remaining_time": "6:17:01"}
{"current_steps": 82, "total_steps": 183, "loss": 0.3974, "lr": 5.4239291510128936e-05, "epoch": 1.3350253807106598, "percentage": 44.81, "elapsed_time": "5:03:04", "remaining_time": "6:13:17"}
{"current_steps": 83, "total_steps": 183, "loss": 0.395, "lr": 5.352067513634011e-05, "epoch": 1.351269035532995, "percentage": 45.36, "elapsed_time": "5:06:44", "remaining_time": "6:09:34"}
{"current_steps": 84, "total_steps": 183, "loss": 0.3917, "lr": 5.279709744361036e-05, "epoch": 1.3675126903553299, "percentage": 45.9, "elapsed_time": "5:10:24", "remaining_time": "6:05:50"}
{"current_steps": 85, "total_steps": 183, "loss": 0.3897, "lr": 5.20688239438077e-05, "epoch": 1.383756345177665, "percentage": 46.45, "elapsed_time": "5:14:04", "remaining_time": "6:02:06"}
{"current_steps": 86, "total_steps": 183, "loss": 0.3958, "lr": 5.133612187189429e-05, "epoch": 1.4, "percentage": 46.99, "elapsed_time": "5:17:44", "remaining_time": "5:58:22"}
{"current_steps": 87, "total_steps": 183, "loss": 0.3885, "lr": 5.059926008786648e-05, "epoch": 1.4162436548223352, "percentage": 47.54, "elapsed_time": "5:21:23", "remaining_time": "5:54:38"}
{"current_steps": 88, "total_steps": 183, "loss": 0.3913, "lr": 4.985850897809838e-05, "epoch": 1.43248730964467, "percentage": 48.09, "elapsed_time": "5:25:04", "remaining_time": "5:50:55"}
{"current_steps": 89, "total_steps": 183, "loss": 0.3897, "lr": 4.911414035612551e-05, "epoch": 1.448730964467005, "percentage": 48.63, "elapsed_time": "5:28:44", "remaining_time": "5:47:12"}
{"current_steps": 90, "total_steps": 183, "loss": 0.3863, "lr": 4.836642736290468e-05, "epoch": 1.46497461928934, "percentage": 49.18, "elapsed_time": "5:32:24", "remaining_time": "5:43:29"}
{"current_steps": 91, "total_steps": 183, "loss": 0.3905, "lr": 4.761564436658674e-05, "epoch": 1.481218274111675, "percentage": 49.73, "elapsed_time": "5:36:04", "remaining_time": "5:39:45"}
{"current_steps": 92, "total_steps": 183, "loss": 0.3842, "lr": 4.686206686183914e-05, "epoch": 1.49746192893401, "percentage": 50.27, "elapsed_time": "5:39:44", "remaining_time": "5:36:02"}
{"current_steps": 93, "total_steps": 183, "loss": 0.3849, "lr": 4.610597136875498e-05, "epoch": 1.5137055837563453, "percentage": 50.82, "elapsed_time": "5:43:23", "remaining_time": "5:32:18"}
{"current_steps": 94, "total_steps": 183, "loss": 0.382, "lr": 4.534763533138594e-05, "epoch": 1.5299492385786801, "percentage": 51.37, "elapsed_time": "5:47:03", "remaining_time": "5:28:35"}
{"current_steps": 95, "total_steps": 183, "loss": 0.3902, "lr": 4.458733701593603e-05, "epoch": 1.5461928934010152, "percentage": 51.91, "elapsed_time": "5:50:43", "remaining_time": "5:24:53"}
{"current_steps": 96, "total_steps": 183, "loss": 0.3865, "lr": 4.3825355408653694e-05, "epoch": 1.5624365482233502, "percentage": 52.46, "elapsed_time": "5:54:24", "remaining_time": "5:21:10"}
{"current_steps": 97, "total_steps": 183, "loss": 0.3927, "lr": 4.306197011345984e-05, "epoch": 1.5786802030456852, "percentage": 53.01, "elapsed_time": "5:58:04", "remaining_time": "5:17:28"}
{"current_steps": 98, "total_steps": 183, "loss": 0.3897, "lr": 4.229746124934894e-05, "epoch": 1.5949238578680203, "percentage": 53.55, "elapsed_time": "6:01:44", "remaining_time": "5:13:45"}
{"current_steps": 99, "total_steps": 183, "loss": 0.3898, "lr": 4.153210934760142e-05, "epoch": 1.6111675126903553, "percentage": 54.1, "elapsed_time": "6:05:24", "remaining_time": "5:10:02"}
{"current_steps": 100, "total_steps": 183, "loss": 0.3915, "lr": 4.0766195248844574e-05, "epoch": 1.6274111675126903, "percentage": 54.64, "elapsed_time": "6:09:05", "remaining_time": "5:06:20"}
{"current_steps": 101, "total_steps": 183, "loss": 0.3938, "lr": 4e-05, "epoch": 1.6436548223350254, "percentage": 55.19, "elapsed_time": "6:12:44", "remaining_time": "5:02:37"}
{"current_steps": 102, "total_steps": 183, "loss": 0.3837, "lr": 3.923380475115544e-05, "epoch": 1.6598984771573604, "percentage": 55.74, "elapsed_time": "6:16:24", "remaining_time": "4:58:54"}
{"current_steps": 103, "total_steps": 183, "loss": 0.3866, "lr": 3.846789065239859e-05, "epoch": 1.6761421319796954, "percentage": 56.28, "elapsed_time": "6:20:04", "remaining_time": "4:55:12"}
{"current_steps": 104, "total_steps": 183, "loss": 0.3879, "lr": 3.770253875065107e-05, "epoch": 1.6923857868020304, "percentage": 56.83, "elapsed_time": "6:23:44", "remaining_time": "4:51:29"}
{"current_steps": 105, "total_steps": 183, "loss": 0.386, "lr": 3.6938029886540174e-05, "epoch": 1.7086294416243655, "percentage": 57.38, "elapsed_time": "6:27:23", "remaining_time": "4:47:46"}
{"current_steps": 106, "total_steps": 183, "loss": 0.382, "lr": 3.617464459134631e-05, "epoch": 1.7248730964467005, "percentage": 57.92, "elapsed_time": "6:31:03", "remaining_time": "4:44:04"}
{"current_steps": 107, "total_steps": 183, "loss": 0.3837, "lr": 3.541266298406399e-05, "epoch": 1.7411167512690355, "percentage": 58.47, "elapsed_time": "6:34:44", "remaining_time": "4:40:22"}
{"current_steps": 108, "total_steps": 183, "loss": 0.385, "lr": 3.4652364668614065e-05, "epoch": 1.7573604060913706, "percentage": 59.02, "elapsed_time": "6:38:24", "remaining_time": "4:36:40"}
{"current_steps": 109, "total_steps": 183, "loss": 0.388, "lr": 3.3894028631245017e-05, "epoch": 1.7736040609137056, "percentage": 59.56, "elapsed_time": "6:42:04", "remaining_time": "4:32:58"}
{"current_steps": 110, "total_steps": 183, "loss": 0.3873, "lr": 3.313793313816087e-05, "epoch": 1.7898477157360406, "percentage": 60.11, "elapsed_time": "6:45:44", "remaining_time": "4:29:15"}
{"current_steps": 111, "total_steps": 183, "loss": 0.3837, "lr": 3.238435563341326e-05, "epoch": 1.8060913705583757, "percentage": 60.66, "elapsed_time": "6:49:25", "remaining_time": "4:25:34"}
{"current_steps": 112, "total_steps": 183, "loss": 0.3819, "lr": 3.163357263709534e-05, "epoch": 1.8223350253807107, "percentage": 61.2, "elapsed_time": "6:53:05", "remaining_time": "4:21:51"}
{"current_steps": 113, "total_steps": 183, "loss": 0.3768, "lr": 3.088585964387451e-05, "epoch": 1.8385786802030457, "percentage": 61.75, "elapsed_time": "6:56:44", "remaining_time": "4:18:09"}
{"current_steps": 114, "total_steps": 183, "loss": 0.3839, "lr": 3.0141491021901644e-05, "epoch": 1.8548223350253807, "percentage": 62.3, "elapsed_time": "7:00:24", "remaining_time": "4:14:27"}
{"current_steps": 115, "total_steps": 183, "loss": 0.3797, "lr": 2.9400739912133543e-05, "epoch": 1.8710659898477158, "percentage": 62.84, "elapsed_time": "7:04:04", "remaining_time": "4:10:45"}
{"current_steps": 116, "total_steps": 183, "loss": 0.3823, "lr": 2.866387812810572e-05, "epoch": 1.8873096446700508, "percentage": 63.39, "elapsed_time": "7:07:44", "remaining_time": "4:07:03"}
{"current_steps": 117, "total_steps": 183, "loss": 0.378, "lr": 2.793117605619231e-05, "epoch": 1.9035532994923858, "percentage": 63.93, "elapsed_time": "7:11:25", "remaining_time": "4:03:21"}
{"current_steps": 118, "total_steps": 183, "loss": 0.3814, "lr": 2.7202902556389647e-05, "epoch": 1.9197969543147209, "percentage": 64.48, "elapsed_time": "7:15:05", "remaining_time": "3:59:40"}
{"current_steps": 119, "total_steps": 183, "loss": 0.3721, "lr": 2.6479324863659897e-05, "epoch": 1.936040609137056, "percentage": 65.03, "elapsed_time": "7:18:46", "remaining_time": "3:55:58"}
{"current_steps": 120, "total_steps": 183, "loss": 0.3854, "lr": 2.5760708489871077e-05, "epoch": 1.952284263959391, "percentage": 65.57, "elapsed_time": "7:22:26", "remaining_time": "3:52:17"}
{"current_steps": 121, "total_steps": 183, "loss": 0.3784, "lr": 2.504731712636925e-05, "epoch": 1.9685279187817257, "percentage": 66.12, "elapsed_time": "7:26:06", "remaining_time": "3:48:35"}
{"current_steps": 122, "total_steps": 183, "loss": 0.3809, "lr": 2.4339412547218845e-05, "epoch": 1.984771573604061, "percentage": 66.67, "elapsed_time": "7:29:49", "remaining_time": "3:44:54"}
{"current_steps": 123, "total_steps": 183, "loss": 0.606, "lr": 2.3637254513146406e-05, "epoch": 2.0040609137055836, "percentage": 67.21, "elapsed_time": "7:35:05", "remaining_time": "3:41:59"}
{"current_steps": 124, "total_steps": 183, "loss": 0.3647, "lr": 2.294110067622321e-05, "epoch": 2.020304568527919, "percentage": 67.76, "elapsed_time": "7:38:46", "remaining_time": "3:38:17"}
{"current_steps": 125, "total_steps": 183, "loss": 0.3608, "lr": 2.225120648532161e-05, "epoch": 2.0365482233502537, "percentage": 68.31, "elapsed_time": "7:42:27", "remaining_time": "3:34:34"}
{"current_steps": 126, "total_steps": 183, "loss": 0.3614, "lr": 2.1567825092379807e-05, "epoch": 2.052791878172589, "percentage": 68.85, "elapsed_time": "7:46:07", "remaining_time": "3:30:52"}
{"current_steps": 127, "total_steps": 183, "loss": 0.3682, "lr": 2.089120725950948e-05, "epoch": 2.0690355329949237, "percentage": 69.4, "elapsed_time": "7:49:48", "remaining_time": "3:27:09"}
{"current_steps": 128, "total_steps": 183, "loss": 0.3548, "lr": 2.0221601266980383e-05, "epoch": 2.085279187817259, "percentage": 69.95, "elapsed_time": "7:53:28", "remaining_time": "3:23:26"}
{"current_steps": 129, "total_steps": 183, "loss": 0.3552, "lr": 1.955925282211558e-05, "epoch": 2.1015228426395938, "percentage": 70.49, "elapsed_time": "7:57:08", "remaining_time": "3:19:44"}
{"current_steps": 130, "total_steps": 183, "loss": 0.3641, "lr": 1.890440496913083e-05, "epoch": 2.117766497461929, "percentage": 71.04, "elapsed_time": "8:00:48", "remaining_time": "3:16:01"}
{"current_steps": 131, "total_steps": 183, "loss": 0.3641, "lr": 1.825729799995116e-05, "epoch": 2.134010152284264, "percentage": 71.58, "elapsed_time": "8:04:29", "remaining_time": "3:12:19"}
{"current_steps": 132, "total_steps": 183, "loss": 0.3618, "lr": 1.761816936603744e-05, "epoch": 2.150253807106599, "percentage": 72.13, "elapsed_time": "8:08:10", "remaining_time": "3:08:36"}
{"current_steps": 133, "total_steps": 183, "loss": 0.3546, "lr": 1.6987253591255178e-05, "epoch": 2.166497461928934, "percentage": 72.68, "elapsed_time": "8:11:50", "remaining_time": "3:04:54"}
{"current_steps": 134, "total_steps": 183, "loss": 0.3549, "lr": 1.6364782185817592e-05, "epoch": 2.182741116751269, "percentage": 73.22, "elapsed_time": "8:15:30", "remaining_time": "3:01:11"}
{"current_steps": 135, "total_steps": 183, "loss": 0.3586, "lr": 1.5750983561334493e-05, "epoch": 2.198984771573604, "percentage": 73.77, "elapsed_time": "8:19:10", "remaining_time": "2:57:29"}
{"current_steps": 136, "total_steps": 183, "loss": 0.3559, "lr": 1.5146082946998286e-05, "epoch": 2.215228426395939, "percentage": 74.32, "elapsed_time": "8:22:51", "remaining_time": "2:53:46"}
{"current_steps": 137, "total_steps": 183, "loss": 0.3639, "lr": 1.4550302306937619e-05, "epoch": 2.231472081218274, "percentage": 74.86, "elapsed_time": "8:26:30", "remaining_time": "2:50:04"}
{"current_steps": 138, "total_steps": 183, "loss": 0.355, "lr": 1.396386025876916e-05, "epoch": 2.2477157360406093, "percentage": 75.41, "elapsed_time": "8:30:11", "remaining_time": "2:46:21"}
{"current_steps": 139, "total_steps": 183, "loss": 0.3549, "lr": 1.338697199337739e-05, "epoch": 2.263959390862944, "percentage": 75.96, "elapsed_time": "8:33:51", "remaining_time": "2:42:39"}
{"current_steps": 140, "total_steps": 183, "loss": 0.3586, "lr": 1.2819849195951778e-05, "epoch": 2.2802030456852793, "percentage": 76.5, "elapsed_time": "8:37:31", "remaining_time": "2:38:57"}
{"current_steps": 141, "total_steps": 183, "loss": 0.3604, "lr": 1.2262699968310336e-05, "epoch": 2.296446700507614, "percentage": 77.05, "elapsed_time": "8:41:11", "remaining_time": "2:35:14"}
{"current_steps": 142, "total_steps": 183, "loss": 0.3551, "lr": 1.1715728752538103e-05, "epoch": 2.3126903553299494, "percentage": 77.6, "elapsed_time": "8:44:51", "remaining_time": "2:31:32"}
{"current_steps": 143, "total_steps": 183, "loss": 0.3563, "lr": 1.1179136255968523e-05, "epoch": 2.328934010152284, "percentage": 78.14, "elapsed_time": "8:48:31", "remaining_time": "2:27:50"}
{"current_steps": 144, "total_steps": 183, "loss": 0.359, "lr": 1.065311937753526e-05, "epoch": 2.3451776649746194, "percentage": 78.69, "elapsed_time": "8:52:11", "remaining_time": "2:24:08"}
{"current_steps": 145, "total_steps": 183, "loss": 0.3548, "lr": 1.0137871135521493e-05, "epoch": 2.3614213197969542, "percentage": 79.23, "elapsed_time": "8:55:52", "remaining_time": "2:20:26"}
{"current_steps": 146, "total_steps": 183, "loss": 0.3523, "lr": 9.633580596733179e-06, "epoch": 2.3776649746192895, "percentage": 79.78, "elapsed_time": "8:59:32", "remaining_time": "2:16:43"}
{"current_steps": 147, "total_steps": 183, "loss": 0.359, "lr": 9.140432807122282e-06, "epoch": 2.3939086294416243, "percentage": 80.33, "elapsed_time": "9:03:12", "remaining_time": "2:13:01"}
{"current_steps": 148, "total_steps": 183, "loss": 0.3518, "lr": 8.658608723885433e-06, "epoch": 2.4101522842639596, "percentage": 80.87, "elapsed_time": "9:06:52", "remaining_time": "2:09:19"}
{"current_steps": 149, "total_steps": 183, "loss": 0.3535, "lr": 8.18828514906294e-06, "epoch": 2.4263959390862944, "percentage": 81.42, "elapsed_time": "9:10:33", "remaining_time": "2:05:37"}
{"current_steps": 150, "total_steps": 183, "loss": 0.3534, "lr": 7.729634664662469e-06, "epoch": 2.4426395939086296, "percentage": 81.97, "elapsed_time": "9:14:13", "remaining_time": "2:01:55"}
{"current_steps": 151, "total_steps": 183, "loss": 0.3596, "lr": 7.282825569331296e-06, "epoch": 2.4588832487309644, "percentage": 82.51, "elapsed_time": "9:17:54", "remaining_time": "1:58:13"}
{"current_steps": 152, "total_steps": 183, "loss": 0.361, "lr": 6.848021816600221e-06, "epoch": 2.4751269035532997, "percentage": 83.06, "elapsed_time": "9:21:35", "remaining_time": "1:54:32"}
{"current_steps": 153, "total_steps": 183, "loss": 0.3614, "lr": 6.425382954722002e-06, "epoch": 2.4913705583756345, "percentage": 83.61, "elapsed_time": "9:25:15", "remaining_time": "1:50:50"}
{"current_steps": 154, "total_steps": 183, "loss": 0.3575, "lr": 6.015064068126188e-06, "epoch": 2.5076142131979697, "percentage": 84.15, "elapsed_time": "9:28:56", "remaining_time": "1:47:08"}
{"current_steps": 155, "total_steps": 183, "loss": 0.351, "lr": 5.617215720511962e-06, "epoch": 2.5238578680203045, "percentage": 84.7, "elapsed_time": "9:32:37", "remaining_time": "1:43:26"}
{"current_steps": 156, "total_steps": 183, "loss": 0.3543, "lr": 5.231983899599798e-06, "epoch": 2.5401015228426393, "percentage": 85.25, "elapsed_time": "9:36:18", "remaining_time": "1:39:44"}
{"current_steps": 157, "total_steps": 183, "loss": 0.3646, "lr": 4.859509963562313e-06, "epoch": 2.5563451776649746, "percentage": 85.79, "elapsed_time": "9:39:58", "remaining_time": "1:36:02"}
{"current_steps": 158, "total_steps": 183, "loss": 0.3546, "lr": 4.4999305891538294e-06, "epoch": 2.57258883248731, "percentage": 86.34, "elapsed_time": "9:43:39", "remaining_time": "1:32:21"}
{"current_steps": 159, "total_steps": 183, "loss": 0.3579, "lr": 4.153377721557781e-06, "epoch": 2.5888324873096447, "percentage": 86.89, "elapsed_time": "9:47:20", "remaining_time": "1:28:39"}
{"current_steps": 160, "total_steps": 183, "loss": 0.3565, "lr": 3.819978525970336e-06, "epoch": 2.6050761421319795, "percentage": 87.43, "elapsed_time": "9:51:00", "remaining_time": "1:24:57"}
{"current_steps": 161, "total_steps": 183, "loss": 0.3553, "lr": 3.499855340938001e-06, "epoch": 2.6213197969543147, "percentage": 87.98, "elapsed_time": "9:54:40", "remaining_time": "1:21:15"}
{"current_steps": 162, "total_steps": 183, "loss": 0.3545, "lr": 3.19312563346633e-06, "epoch": 2.63756345177665, "percentage": 88.52, "elapsed_time": "9:58:21", "remaining_time": "1:17:33"}
{"current_steps": 163, "total_steps": 183, "loss": 0.3552, "lr": 2.8999019559162156e-06, "epoch": 2.6538071065989848, "percentage": 89.07, "elapsed_time": "10:02:01", "remaining_time": "1:13:52"}
{"current_steps": 164, "total_steps": 183, "loss": 0.3468, "lr": 2.6202919047035604e-06, "epoch": 2.6700507614213196, "percentage": 89.62, "elapsed_time": "10:05:41", "remaining_time": "1:10:10"}
{"current_steps": 165, "total_steps": 183, "loss": 0.3562, "lr": 2.3543980808175393e-06, "epoch": 2.686294416243655, "percentage": 90.16, "elapsed_time": "10:09:21", "remaining_time": "1:06:28"}
{"current_steps": 166, "total_steps": 183, "loss": 0.3556, "lr": 2.10231805217183e-06, "epoch": 2.70253807106599, "percentage": 90.71, "elapsed_time": "10:13:02", "remaining_time": "1:02:46"}
{"current_steps": 167, "total_steps": 183, "loss": 0.354, "lr": 1.8641443178027784e-06, "epoch": 2.718781725888325, "percentage": 91.26, "elapsed_time": "10:16:42", "remaining_time": "0:59:05"}
{"current_steps": 168, "total_steps": 183, "loss": 0.3534, "lr": 1.6399642739274791e-06, "epoch": 2.7350253807106597, "percentage": 91.8, "elapsed_time": "10:20:23", "remaining_time": "0:55:23"}
{"current_steps": 169, "total_steps": 183, "loss": 0.3585, "lr": 1.4298601818743607e-06, "epoch": 2.751269035532995, "percentage": 92.35, "elapsed_time": "10:24:03", "remaining_time": "0:51:41"}
{"current_steps": 170, "total_steps": 183, "loss": 0.3632, "lr": 1.233909137897924e-06, "epoch": 2.76751269035533, "percentage": 92.9, "elapsed_time": "10:27:43", "remaining_time": "0:48:00"}
{"current_steps": 171, "total_steps": 183, "loss": 0.3581, "lr": 1.0521830448888414e-06, "epoch": 2.783756345177665, "percentage": 93.44, "elapsed_time": "10:31:24", "remaining_time": "0:44:18"}
{"current_steps": 172, "total_steps": 183, "loss": 0.3502, "lr": 8.847485859896365e-07, "epoch": 2.8, "percentage": 93.99, "elapsed_time": "10:35:04", "remaining_time": "0:40:36"}
{"current_steps": 173, "total_steps": 183, "loss": 0.3567, "lr": 7.31667200125803e-07, "epoch": 2.816243654822335, "percentage": 94.54, "elapsed_time": "10:38:44", "remaining_time": "0:36:55"}
{"current_steps": 174, "total_steps": 183, "loss": 0.3554, "lr": 5.929950594612032e-07, "epoch": 2.8324873096446703, "percentage": 95.08, "elapsed_time": "10:42:24", "remaining_time": "0:33:13"}
{"current_steps": 175, "total_steps": 183, "loss": 0.3563, "lr": 4.687830487860634e-07, "epoch": 2.848730964467005, "percentage": 95.63, "elapsed_time": "10:46:05", "remaining_time": "0:29:32"}
{"current_steps": 176, "total_steps": 183, "loss": 0.3505, "lr": 3.590767468451528e-07, "epoch": 2.86497461928934, "percentage": 96.17, "elapsed_time": "10:49:44", "remaining_time": "0:25:50"}
{"current_steps": 177, "total_steps": 183, "loss": 0.3541, "lr": 2.639164096129987e-07, "epoch": 2.881218274111675, "percentage": 96.72, "elapsed_time": "10:53:25", "remaining_time": "0:22:08"}
{"current_steps": 178, "total_steps": 183, "loss": 0.356, "lr": 1.833369555222042e-07, "epoch": 2.89746192893401, "percentage": 97.27, "elapsed_time": "10:57:05", "remaining_time": "0:18:27"}
{"current_steps": 179, "total_steps": 183, "loss": 0.3602, "lr": 1.1736795265038237e-07, "epoch": 2.9137055837563453, "percentage": 97.81, "elapsed_time": "11:00:45", "remaining_time": "0:14:45"}
{"current_steps": 180, "total_steps": 183, "loss": 0.3592, "lr": 6.603360787035495e-08, "epoch": 2.92994923857868, "percentage": 98.36, "elapsed_time": "11:04:25", "remaining_time": "0:11:04"}
{"current_steps": 181, "total_steps": 183, "loss": 0.3495, "lr": 2.9352757967600064e-08, "epoch": 2.9461928934010153, "percentage": 98.91, "elapsed_time": "11:08:05", "remaining_time": "0:07:22"}
{"current_steps": 182, "total_steps": 183, "loss": 0.3571, "lr": 7.338862728225593e-09, "epoch": 2.96243654822335, "percentage": 99.45, "elapsed_time": "11:11:45", "remaining_time": "0:03:41"}
{"current_steps": 183, "total_steps": 183, "loss": 0.3592, "lr": 0.0, "epoch": 2.9786802030456854, "percentage": 100.0, "elapsed_time": "11:15:26", "remaining_time": "0:00:00"}
{"current_steps": 183, "total_steps": 183, "epoch": 2.9786802030456854, "percentage": 100.0, "elapsed_time": "11:16:57", "remaining_time": "0:00:00"}