EmoLLM_Qwen / trainer_log.jsonl
vvEverett's picture
Upload folder using huggingface_hub
964a7e4 verified
{"current_steps": 1, "total_steps": 100, "loss": 7.1138, "lr": 2e-07, "epoch": 0.01, "percentage": 1.0, "elapsed_time": "0:00:30", "remaining_time": "0:50:08"}
{"current_steps": 2, "total_steps": 100, "loss": 6.8466, "lr": 4e-07, "epoch": 0.02, "percentage": 2.0, "elapsed_time": "0:00:56", "remaining_time": "0:45:56"}
{"current_steps": 3, "total_steps": 100, "loss": 6.8936, "lr": 6e-07, "epoch": 0.03, "percentage": 3.0, "elapsed_time": "0:01:23", "remaining_time": "0:44:58"}
{"current_steps": 4, "total_steps": 100, "loss": 7.1196, "lr": 8e-07, "epoch": 0.04, "percentage": 4.0, "elapsed_time": "0:01:50", "remaining_time": "0:44:17"}
{"current_steps": 5, "total_steps": 100, "loss": 6.7063, "lr": 1e-06, "epoch": 0.05, "percentage": 5.0, "elapsed_time": "0:02:17", "remaining_time": "0:43:40"}
{"current_steps": 6, "total_steps": 100, "loss": 6.028, "lr": 9.99726628670463e-07, "epoch": 0.06, "percentage": 6.0, "elapsed_time": "0:02:44", "remaining_time": "0:43:00"}
{"current_steps": 7, "total_steps": 100, "loss": 5.593, "lr": 9.989068136093872e-07, "epoch": 0.07, "percentage": 7.0, "elapsed_time": "0:03:10", "remaining_time": "0:42:16"}
{"current_steps": 8, "total_steps": 100, "loss": 4.1199, "lr": 9.975414512725056e-07, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:03:37", "remaining_time": "0:41:44"}
{"current_steps": 9, "total_steps": 100, "loss": 3.8539, "lr": 9.956320346634875e-07, "epoch": 0.09, "percentage": 9.0, "elapsed_time": "0:04:04", "remaining_time": "0:41:11"}
{"current_steps": 10, "total_steps": 100, "loss": 3.364, "lr": 9.931806517013612e-07, "epoch": 0.1, "percentage": 10.0, "elapsed_time": "0:04:30", "remaining_time": "0:40:35"}
{"current_steps": 11, "total_steps": 100, "loss": 3.2359, "lr": 9.901899829374047e-07, "epoch": 0.11, "percentage": 11.0, "elapsed_time": "0:04:56", "remaining_time": "0:40:01"}
{"current_steps": 12, "total_steps": 100, "loss": 2.0694, "lr": 9.866632986240029e-07, "epoch": 0.12, "percentage": 12.0, "elapsed_time": "0:05:20", "remaining_time": "0:39:12"}
{"current_steps": 13, "total_steps": 100, "loss": 1.8041, "lr": 9.826044551386742e-07, "epoch": 0.13, "percentage": 13.0, "elapsed_time": "0:05:46", "remaining_time": "0:38:36"}
{"current_steps": 14, "total_steps": 100, "loss": 1.8221, "lr": 9.780178907671788e-07, "epoch": 0.14, "percentage": 14.0, "elapsed_time": "0:06:11", "remaining_time": "0:38:03"}
{"current_steps": 15, "total_steps": 100, "loss": 1.5577, "lr": 9.729086208503173e-07, "epoch": 0.15, "percentage": 15.0, "elapsed_time": "0:06:38", "remaining_time": "0:37:39"}
{"current_steps": 16, "total_steps": 100, "loss": 1.3898, "lr": 9.672822322997304e-07, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "0:07:04", "remaining_time": "0:37:06"}
{"current_steps": 17, "total_steps": 100, "loss": 1.2839, "lr": 9.611448774886923e-07, "epoch": 0.17, "percentage": 17.0, "elapsed_time": "0:07:30", "remaining_time": "0:36:38"}
{"current_steps": 18, "total_steps": 100, "loss": 1.1126, "lr": 9.545032675245813e-07, "epoch": 0.18, "percentage": 18.0, "elapsed_time": "0:07:57", "remaining_time": "0:36:15"}
{"current_steps": 19, "total_steps": 100, "loss": 0.9637, "lr": 9.473646649103817e-07, "epoch": 0.19, "percentage": 19.0, "elapsed_time": "0:08:25", "remaining_time": "0:35:57"}
{"current_steps": 20, "total_steps": 100, "loss": 0.6976, "lr": 9.397368756032444e-07, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "0:08:51", "remaining_time": "0:35:26"}
{"current_steps": 21, "total_steps": 100, "loss": 0.6686, "lr": 9.316282404787869e-07, "epoch": 0.21, "percentage": 21.0, "elapsed_time": "0:09:18", "remaining_time": "0:34:59"}
{"current_steps": 22, "total_steps": 100, "loss": 0.6055, "lr": 9.230476262104676e-07, "epoch": 0.22, "percentage": 22.0, "elapsed_time": "0:09:47", "remaining_time": "0:34:42"}
{"current_steps": 23, "total_steps": 100, "loss": 0.5312, "lr": 9.1400441557401e-07, "epoch": 0.23, "percentage": 23.0, "elapsed_time": "0:10:12", "remaining_time": "0:34:11"}
{"current_steps": 24, "total_steps": 100, "loss": 0.5334, "lr": 9.045084971874737e-07, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "0:10:38", "remaining_time": "0:33:43"}
{"current_steps": 25, "total_steps": 100, "loss": 0.5246, "lr": 8.945702546981968e-07, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:11:04", "remaining_time": "0:33:13"}
{"current_steps": 26, "total_steps": 100, "loss": 0.4586, "lr": 8.842005554284295e-07, "epoch": 0.26, "percentage": 26.0, "elapsed_time": "0:11:30", "remaining_time": "0:32:46"}
{"current_steps": 27, "total_steps": 100, "loss": 0.514, "lr": 8.734107384920769e-07, "epoch": 0.27, "percentage": 27.0, "elapsed_time": "0:11:58", "remaining_time": "0:32:23"}
{"current_steps": 28, "total_steps": 100, "loss": 0.469, "lr": 8.622126023955445e-07, "epoch": 0.28, "percentage": 28.0, "elapsed_time": "0:12:24", "remaining_time": "0:31:55"}
{"current_steps": 29, "total_steps": 100, "loss": 0.4928, "lr": 8.506183921362442e-07, "epoch": 0.29, "percentage": 29.0, "elapsed_time": "0:12:50", "remaining_time": "0:31:27"}
{"current_steps": 30, "total_steps": 100, "loss": 0.416, "lr": 8.386407858128706e-07, "epoch": 0.3, "percentage": 30.0, "elapsed_time": "0:13:18", "remaining_time": "0:31:02"}
{"current_steps": 31, "total_steps": 100, "loss": 0.4065, "lr": 8.262928807620843e-07, "epoch": 0.31, "percentage": 31.0, "elapsed_time": "0:13:47", "remaining_time": "0:30:40"}
{"current_steps": 32, "total_steps": 100, "loss": 0.4302, "lr": 8.135881792367685e-07, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "0:14:13", "remaining_time": "0:30:14"}
{"current_steps": 33, "total_steps": 100, "loss": 0.475, "lr": 8.005405736415125e-07, "epoch": 0.33, "percentage": 33.0, "elapsed_time": "0:14:39", "remaining_time": "0:29:45"}
{"current_steps": 34, "total_steps": 100, "loss": 0.4418, "lr": 7.871643313414718e-07, "epoch": 0.34, "percentage": 34.0, "elapsed_time": "0:15:04", "remaining_time": "0:29:15"}
{"current_steps": 35, "total_steps": 100, "loss": 0.4074, "lr": 7.734740790612136e-07, "epoch": 0.35, "percentage": 35.0, "elapsed_time": "0:15:30", "remaining_time": "0:28:47"}
{"current_steps": 36, "total_steps": 100, "loss": 0.4006, "lr": 7.594847868906076e-07, "epoch": 0.36, "percentage": 36.0, "elapsed_time": "0:15:54", "remaining_time": "0:28:17"}
{"current_steps": 37, "total_steps": 100, "loss": 0.4099, "lr": 7.452117519152541e-07, "epoch": 0.37, "percentage": 37.0, "elapsed_time": "0:16:20", "remaining_time": "0:27:49"}
{"current_steps": 38, "total_steps": 100, "loss": 0.4258, "lr": 7.306705814893439e-07, "epoch": 0.38, "percentage": 38.0, "elapsed_time": "0:16:47", "remaining_time": "0:27:23"}
{"current_steps": 39, "total_steps": 100, "loss": 0.4066, "lr": 7.158771761692464e-07, "epoch": 0.39, "percentage": 39.0, "elapsed_time": "0:17:13", "remaining_time": "0:26:55"}
{"current_steps": 40, "total_steps": 100, "loss": 0.4272, "lr": 7.008477123264847e-07, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:17:37", "remaining_time": "0:26:26"}
{"current_steps": 41, "total_steps": 100, "loss": 0.4166, "lr": 6.855986244591103e-07, "epoch": 0.41, "percentage": 41.0, "elapsed_time": "0:18:05", "remaining_time": "0:26:01"}
{"current_steps": 42, "total_steps": 100, "loss": 0.3928, "lr": 6.701465872208216e-07, "epoch": 0.42, "percentage": 42.0, "elapsed_time": "0:18:30", "remaining_time": "0:25:33"}
{"current_steps": 43, "total_steps": 100, "loss": 0.4291, "lr": 6.545084971874736e-07, "epoch": 0.43, "percentage": 43.0, "elapsed_time": "0:18:56", "remaining_time": "0:25:06"}
{"current_steps": 44, "total_steps": 100, "loss": 0.3841, "lr": 6.387014543809223e-07, "epoch": 0.44, "percentage": 44.0, "elapsed_time": "0:19:20", "remaining_time": "0:24:36"}
{"current_steps": 45, "total_steps": 100, "loss": 0.3897, "lr": 6.227427435703995e-07, "epoch": 0.45, "percentage": 45.0, "elapsed_time": "0:19:46", "remaining_time": "0:24:10"}
{"current_steps": 46, "total_steps": 100, "loss": 0.3938, "lr": 6.066498153718734e-07, "epoch": 0.46, "percentage": 46.0, "elapsed_time": "0:20:12", "remaining_time": "0:23:43"}
{"current_steps": 47, "total_steps": 100, "loss": 0.3722, "lr": 5.90440267166055e-07, "epoch": 0.47, "percentage": 47.0, "elapsed_time": "0:20:40", "remaining_time": "0:23:18"}
{"current_steps": 48, "total_steps": 100, "loss": 0.4295, "lr": 5.741318238559209e-07, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "0:21:08", "remaining_time": "0:22:53"}
{"current_steps": 49, "total_steps": 100, "loss": 0.3834, "lr": 5.577423184847931e-07, "epoch": 0.49, "percentage": 49.0, "elapsed_time": "0:21:34", "remaining_time": "0:22:27"}
{"current_steps": 50, "total_steps": 100, "loss": 0.3391, "lr": 5.412896727361662e-07, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "0:21:59", "remaining_time": "0:21:59"}
{"current_steps": 51, "total_steps": 100, "loss": 0.3942, "lr": 5.247918773366111e-07, "epoch": 0.51, "percentage": 51.0, "elapsed_time": "0:22:26", "remaining_time": "0:21:33"}
{"current_steps": 52, "total_steps": 100, "loss": 0.3848, "lr": 5.082669723831793e-07, "epoch": 0.52, "percentage": 52.0, "elapsed_time": "0:22:50", "remaining_time": "0:21:05"}
{"current_steps": 53, "total_steps": 100, "loss": 0.385, "lr": 4.917330276168208e-07, "epoch": 0.53, "percentage": 53.0, "elapsed_time": "0:23:17", "remaining_time": "0:20:39"}
{"current_steps": 54, "total_steps": 100, "loss": 0.3694, "lr": 4.752081226633888e-07, "epoch": 0.54, "percentage": 54.0, "elapsed_time": "0:23:44", "remaining_time": "0:20:13"}
{"current_steps": 55, "total_steps": 100, "loss": 0.3615, "lr": 4.5871032726383385e-07, "epoch": 0.55, "percentage": 55.0, "elapsed_time": "0:24:11", "remaining_time": "0:19:47"}
{"current_steps": 56, "total_steps": 100, "loss": 0.3257, "lr": 4.4225768151520694e-07, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "0:24:38", "remaining_time": "0:19:22"}
{"current_steps": 57, "total_steps": 100, "loss": 0.351, "lr": 4.258681761440789e-07, "epoch": 0.57, "percentage": 57.0, "elapsed_time": "0:25:04", "remaining_time": "0:18:54"}
{"current_steps": 58, "total_steps": 100, "loss": 0.3964, "lr": 4.095597328339452e-07, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "0:25:30", "remaining_time": "0:18:28"}
{"current_steps": 59, "total_steps": 100, "loss": 0.3783, "lr": 3.9335018462812664e-07, "epoch": 0.59, "percentage": 59.0, "elapsed_time": "0:25:55", "remaining_time": "0:18:01"}
{"current_steps": 60, "total_steps": 100, "loss": 0.3617, "lr": 3.772572564296004e-07, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "0:26:20", "remaining_time": "0:17:33"}
{"current_steps": 61, "total_steps": 100, "loss": 0.3997, "lr": 3.612985456190778e-07, "epoch": 0.61, "percentage": 61.0, "elapsed_time": "0:26:47", "remaining_time": "0:17:08"}
{"current_steps": 62, "total_steps": 100, "loss": 0.3582, "lr": 3.454915028125263e-07, "epoch": 0.62, "percentage": 62.0, "elapsed_time": "0:27:13", "remaining_time": "0:16:41"}
{"current_steps": 63, "total_steps": 100, "loss": 0.3804, "lr": 3.2985341277917846e-07, "epoch": 0.63, "percentage": 63.0, "elapsed_time": "0:27:39", "remaining_time": "0:16:14"}
{"current_steps": 64, "total_steps": 100, "loss": 0.3646, "lr": 3.1440137554088953e-07, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "0:28:07", "remaining_time": "0:15:49"}
{"current_steps": 65, "total_steps": 100, "loss": 0.3387, "lr": 2.9915228767351535e-07, "epoch": 0.65, "percentage": 65.0, "elapsed_time": "0:28:35", "remaining_time": "0:15:23"}
{"current_steps": 66, "total_steps": 100, "loss": 0.3839, "lr": 2.841228238307536e-07, "epoch": 0.66, "percentage": 66.0, "elapsed_time": "0:29:01", "remaining_time": "0:14:57"}
{"current_steps": 67, "total_steps": 100, "loss": 0.3635, "lr": 2.6932941851065615e-07, "epoch": 0.67, "percentage": 67.0, "elapsed_time": "0:29:28", "remaining_time": "0:14:30"}
{"current_steps": 68, "total_steps": 100, "loss": 0.3905, "lr": 2.547882480847461e-07, "epoch": 0.68, "percentage": 68.0, "elapsed_time": "0:29:55", "remaining_time": "0:14:04"}
{"current_steps": 69, "total_steps": 100, "loss": 0.3666, "lr": 2.4051521310939254e-07, "epoch": 0.69, "percentage": 69.0, "elapsed_time": "0:30:21", "remaining_time": "0:13:38"}
{"current_steps": 70, "total_steps": 100, "loss": 0.3317, "lr": 2.2652592093878665e-07, "epoch": 0.7, "percentage": 70.0, "elapsed_time": "0:30:49", "remaining_time": "0:13:12"}
{"current_steps": 71, "total_steps": 100, "loss": 0.3231, "lr": 2.128356686585282e-07, "epoch": 0.71, "percentage": 71.0, "elapsed_time": "0:31:17", "remaining_time": "0:12:46"}
{"current_steps": 72, "total_steps": 100, "loss": 0.3447, "lr": 1.9945942635848745e-07, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "0:31:40", "remaining_time": "0:12:19"}
{"current_steps": 73, "total_steps": 100, "loss": 0.3284, "lr": 1.8641182076323148e-07, "epoch": 0.73, "percentage": 73.0, "elapsed_time": "0:32:08", "remaining_time": "0:11:53"}
{"current_steps": 74, "total_steps": 100, "loss": 0.3591, "lr": 1.7370711923791564e-07, "epoch": 0.74, "percentage": 74.0, "elapsed_time": "0:32:34", "remaining_time": "0:11:26"}
{"current_steps": 75, "total_steps": 100, "loss": 0.3444, "lr": 1.6135921418712955e-07, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "0:33:02", "remaining_time": "0:11:00"}
{"current_steps": 76, "total_steps": 100, "loss": 0.4039, "lr": 1.493816078637557e-07, "epoch": 0.76, "percentage": 76.0, "elapsed_time": "0:33:26", "remaining_time": "0:10:33"}
{"current_steps": 77, "total_steps": 100, "loss": 0.3203, "lr": 1.3778739760445552e-07, "epoch": 0.77, "percentage": 77.0, "elapsed_time": "0:33:50", "remaining_time": "0:10:06"}
{"current_steps": 78, "total_steps": 100, "loss": 0.3715, "lr": 1.2658926150792322e-07, "epoch": 0.78, "percentage": 78.0, "elapsed_time": "0:34:16", "remaining_time": "0:09:39"}
{"current_steps": 79, "total_steps": 100, "loss": 0.3226, "lr": 1.1579944457157059e-07, "epoch": 0.79, "percentage": 79.0, "elapsed_time": "0:34:41", "remaining_time": "0:09:13"}
{"current_steps": 80, "total_steps": 100, "loss": 0.3627, "lr": 1.0542974530180327e-07, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "0:35:06", "remaining_time": "0:08:46"}
{"current_steps": 81, "total_steps": 100, "loss": 0.3646, "lr": 9.549150281252632e-08, "epoch": 0.81, "percentage": 81.0, "elapsed_time": "0:35:35", "remaining_time": "0:08:20"}
{"current_steps": 82, "total_steps": 100, "loss": 0.3506, "lr": 8.599558442598998e-08, "epoch": 0.82, "percentage": 82.0, "elapsed_time": "0:36:00", "remaining_time": "0:07:54"}
{"current_steps": 83, "total_steps": 100, "loss": 0.3471, "lr": 7.695237378953224e-08, "epoch": 0.83, "percentage": 83.0, "elapsed_time": "0:36:29", "remaining_time": "0:07:28"}
{"current_steps": 84, "total_steps": 100, "loss": 0.3362, "lr": 6.837175952121304e-08, "epoch": 0.84, "percentage": 84.0, "elapsed_time": "0:36:57", "remaining_time": "0:07:02"}
{"current_steps": 85, "total_steps": 100, "loss": 0.354, "lr": 6.026312439675551e-08, "epoch": 0.85, "percentage": 85.0, "elapsed_time": "0:37:24", "remaining_time": "0:06:36"}
{"current_steps": 86, "total_steps": 100, "loss": 0.3589, "lr": 5.263533508961826e-08, "epoch": 0.86, "percentage": 86.0, "elapsed_time": "0:37:50", "remaining_time": "0:06:09"}
{"current_steps": 87, "total_steps": 100, "loss": 0.3209, "lr": 4.549673247541874e-08, "epoch": 0.87, "percentage": 87.0, "elapsed_time": "0:38:17", "remaining_time": "0:05:43"}
{"current_steps": 88, "total_steps": 100, "loss": 0.3707, "lr": 3.8855122511307626e-08, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "0:38:44", "remaining_time": "0:05:16"}
{"current_steps": 89, "total_steps": 100, "loss": 0.3314, "lr": 3.271776770026963e-08, "epoch": 0.89, "percentage": 89.0, "elapsed_time": "0:39:09", "remaining_time": "0:04:50"}
{"current_steps": 90, "total_steps": 100, "loss": 0.3634, "lr": 2.7091379149682682e-08, "epoch": 0.9, "percentage": 90.0, "elapsed_time": "0:39:34", "remaining_time": "0:04:23"}
{"current_steps": 91, "total_steps": 100, "loss": 0.3762, "lr": 2.1982109232821176e-08, "epoch": 0.91, "percentage": 91.0, "elapsed_time": "0:40:00", "remaining_time": "0:03:57"}
{"current_steps": 92, "total_steps": 100, "loss": 0.3393, "lr": 1.7395544861325718e-08, "epoch": 0.92, "percentage": 92.0, "elapsed_time": "0:40:26", "remaining_time": "0:03:30"}
{"current_steps": 93, "total_steps": 100, "loss": 0.3408, "lr": 1.3336701375997127e-08, "epoch": 0.93, "percentage": 93.0, "elapsed_time": "0:40:53", "remaining_time": "0:03:04"}
{"current_steps": 94, "total_steps": 100, "loss": 0.3388, "lr": 9.810017062595321e-09, "epoch": 0.94, "percentage": 94.0, "elapsed_time": "0:41:20", "remaining_time": "0:02:38"}
{"current_steps": 95, "total_steps": 100, "loss": 0.3396, "lr": 6.819348298638839e-09, "epoch": 0.95, "percentage": 95.0, "elapsed_time": "0:41:45", "remaining_time": "0:02:11"}
{"current_steps": 96, "total_steps": 100, "loss": 0.3292, "lr": 4.367965336512403e-09, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "0:42:11", "remaining_time": "0:01:45"}
{"current_steps": 97, "total_steps": 100, "loss": 0.3415, "lr": 2.458548727494292e-09, "epoch": 0.97, "percentage": 97.0, "elapsed_time": "0:42:39", "remaining_time": "0:01:19"}
{"current_steps": 98, "total_steps": 100, "loss": 0.3261, "lr": 1.0931863906127325e-09, "epoch": 0.98, "percentage": 98.0, "elapsed_time": "0:43:04", "remaining_time": "0:00:52"}
{"current_steps": 99, "total_steps": 100, "loss": 0.3191, "lr": 2.733713295369755e-10, "epoch": 0.99, "percentage": 99.0, "elapsed_time": "0:43:31", "remaining_time": "0:00:26"}
{"current_steps": 100, "total_steps": 100, "loss": 0.355, "lr": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:43:59", "remaining_time": "0:00:00"}
{"current_steps": 100, "total_steps": 100, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:44:40", "remaining_time": "0:00:00"}