Limo_qwen / trainer_log.jsonl
tongliuphysics's picture
Upload folder using huggingface_hub
21683b3 verified
{"current_steps": 2, "total_steps": 120, "loss": 0.9614, "lr": 1.3333333333333333e-05, "epoch": 0.16842105263157894, "percentage": 1.67, "elapsed_time": "0:02:43", "remaining_time": "2:40:32"}
{"current_steps": 4, "total_steps": 120, "loss": 0.9707, "lr": 4e-05, "epoch": 0.3368421052631579, "percentage": 3.33, "elapsed_time": "0:05:26", "remaining_time": "2:37:54"}
{"current_steps": 6, "total_steps": 120, "loss": 0.9543, "lr": 6.666666666666667e-05, "epoch": 0.5052631578947369, "percentage": 5.0, "elapsed_time": "0:08:08", "remaining_time": "2:34:38"}
{"current_steps": 8, "total_steps": 120, "loss": 0.865, "lr": 7.998481228099806e-05, "epoch": 0.6736842105263158, "percentage": 6.67, "elapsed_time": "0:10:45", "remaining_time": "2:30:38"}
{"current_steps": 10, "total_steps": 120, "loss": 0.8631, "lr": 7.98633797202668e-05, "epoch": 0.8421052631578947, "percentage": 8.33, "elapsed_time": "0:13:28", "remaining_time": "2:28:13"}
{"current_steps": 12, "total_steps": 120, "loss": 0.8842, "lr": 7.962088338550013e-05, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:15:57", "remaining_time": "2:23:34"}
{"current_steps": 12, "total_steps": 120, "eval_loss": 0.8996532559394836, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:16:10", "remaining_time": "2:25:30"}
{"current_steps": 14, "total_steps": 120, "loss": 0.856, "lr": 7.925805973009672e-05, "epoch": 1.168421052631579, "percentage": 11.67, "elapsed_time": "0:18:56", "remaining_time": "2:23:21"}
{"current_steps": 16, "total_steps": 120, "loss": 0.8322, "lr": 7.877601063757323e-05, "epoch": 1.3368421052631578, "percentage": 13.33, "elapsed_time": "0:21:38", "remaining_time": "2:20:39"}
{"current_steps": 18, "total_steps": 120, "loss": 0.8178, "lr": 7.81762000751803e-05, "epoch": 1.5052631578947369, "percentage": 15.0, "elapsed_time": "0:24:18", "remaining_time": "2:17:45"}
{"current_steps": 20, "total_steps": 120, "loss": 0.8212, "lr": 7.74604496478822e-05, "epoch": 1.6736842105263157, "percentage": 16.67, "elapsed_time": "0:26:56", "remaining_time": "2:14:41"}
{"current_steps": 22, "total_steps": 120, "loss": 0.798, "lr": 7.663093306620231e-05, "epoch": 1.8421052631578947, "percentage": 18.33, "elapsed_time": "0:29:33", "remaining_time": "2:11:42"}
{"current_steps": 24, "total_steps": 120, "loss": 0.8086, "lr": 7.569016954473577e-05, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:32:05", "remaining_time": "2:08:22"}
{"current_steps": 24, "total_steps": 120, "eval_loss": 0.8223039507865906, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:32:18", "remaining_time": "2:09:13"}
{"current_steps": 26, "total_steps": 120, "loss": 0.7815, "lr": 7.464101615137756e-05, "epoch": 2.168421052631579, "percentage": 21.67, "elapsed_time": "0:35:07", "remaining_time": "2:06:58"}
{"current_steps": 28, "total_steps": 120, "loss": 0.7909, "lr": 7.348665913050115e-05, "epoch": 2.336842105263158, "percentage": 23.33, "elapsed_time": "0:37:49", "remaining_time": "2:04:15"}
{"current_steps": 30, "total_steps": 120, "loss": 0.795, "lr": 7.223060422643914e-05, "epoch": 2.5052631578947366, "percentage": 25.0, "elapsed_time": "0:40:23", "remaining_time": "2:01:11"}
{"current_steps": 32, "total_steps": 120, "loss": 0.7529, "lr": 7.087666603665284e-05, "epoch": 2.6736842105263157, "percentage": 26.67, "elapsed_time": "0:43:02", "remaining_time": "1:58:22"}
{"current_steps": 34, "total_steps": 120, "loss": 0.7329, "lr": 6.942895642692527e-05, "epoch": 2.8421052631578947, "percentage": 28.33, "elapsed_time": "0:45:46", "remaining_time": "1:55:46"}
{"current_steps": 36, "total_steps": 120, "loss": 0.7502, "lr": 6.789187204375981e-05, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "0:48:16", "remaining_time": "1:52:39"}
{"current_steps": 36, "total_steps": 120, "eval_loss": 0.7780648469924927, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "0:48:29", "remaining_time": "1:53:09"}
{"current_steps": 38, "total_steps": 120, "loss": 0.7365, "lr": 6.627008096190938e-05, "epoch": 3.168421052631579, "percentage": 31.67, "elapsed_time": "0:51:20", "remaining_time": "1:50:47"}
{"current_steps": 40, "total_steps": 120, "loss": 0.7316, "lr": 6.456850850758673e-05, "epoch": 3.336842105263158, "percentage": 33.33, "elapsed_time": "0:54:01", "remaining_time": "1:48:03"}
{"current_steps": 42, "total_steps": 120, "loss": 0.742, "lr": 6.279232230041065e-05, "epoch": 3.5052631578947366, "percentage": 35.0, "elapsed_time": "0:56:45", "remaining_time": "1:45:24"}
{"current_steps": 44, "total_steps": 120, "loss": 0.7204, "lr": 6.094691655951512e-05, "epoch": 3.6736842105263157, "percentage": 36.67, "elapsed_time": "0:59:22", "remaining_time": "1:42:33"}
{"current_steps": 46, "total_steps": 120, "loss": 0.7258, "lr": 5.903789572148295e-05, "epoch": 3.8421052631578947, "percentage": 38.33, "elapsed_time": "1:02:05", "remaining_time": "1:39:52"}
{"current_steps": 48, "total_steps": 120, "loss": 0.7287, "lr": 5.707105741985615e-05, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "1:04:30", "remaining_time": "1:36:46"}
{"current_steps": 48, "total_steps": 120, "eval_loss": 0.7513701319694519, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "1:04:43", "remaining_time": "1:37:05"}
{"current_steps": 50, "total_steps": 120, "loss": 0.7132, "lr": 5.505237487791343e-05, "epoch": 4.168421052631579, "percentage": 41.67, "elapsed_time": "1:07:36", "remaining_time": "1:34:38"}
{"current_steps": 52, "total_steps": 120, "loss": 0.7349, "lr": 5.298797876818735e-05, "epoch": 4.336842105263158, "percentage": 43.33, "elapsed_time": "1:10:12", "remaining_time": "1:31:48"}
{"current_steps": 54, "total_steps": 120, "loss": 0.708, "lr": 5.088413859381341e-05, "epoch": 4.505263157894737, "percentage": 45.0, "elapsed_time": "1:12:56", "remaining_time": "1:29:08"}
{"current_steps": 56, "total_steps": 120, "loss": 0.7166, "lr": 4.874724364825504e-05, "epoch": 4.673684210526316, "percentage": 46.67, "elapsed_time": "1:15:38", "remaining_time": "1:26:26"}
{"current_steps": 58, "total_steps": 120, "loss": 0.6791, "lr": 4.658378361122936e-05, "epoch": 4.842105263157895, "percentage": 48.33, "elapsed_time": "1:18:23", "remaining_time": "1:23:47"}
{"current_steps": 60, "total_steps": 120, "loss": 0.6899, "lr": 4.440032883976318e-05, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "1:20:58", "remaining_time": "1:20:58"}
{"current_steps": 60, "total_steps": 120, "eval_loss": 0.7341214418411255, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "1:21:11", "remaining_time": "1:21:11"}
{"current_steps": 62, "total_steps": 120, "loss": 0.695, "lr": 4.220351041423462e-05, "epoch": 5.168421052631579, "percentage": 51.67, "elapsed_time": "1:24:01", "remaining_time": "1:18:36"}
{"current_steps": 64, "total_steps": 120, "loss": 0.696, "lr": 4e-05, "epoch": 5.336842105263158, "percentage": 53.33, "elapsed_time": "1:26:32", "remaining_time": "1:15:43"}
{"current_steps": 66, "total_steps": 120, "loss": 0.6842, "lr": 3.779648958576538e-05, "epoch": 5.505263157894737, "percentage": 55.0, "elapsed_time": "1:29:15", "remaining_time": "1:13:01"}
{"current_steps": 68, "total_steps": 120, "loss": 0.6967, "lr": 3.559967116023683e-05, "epoch": 5.673684210526316, "percentage": 56.67, "elapsed_time": "1:31:54", "remaining_time": "1:10:17"}
{"current_steps": 70, "total_steps": 120, "loss": 0.6816, "lr": 3.341621638877064e-05, "epoch": 5.842105263157895, "percentage": 58.33, "elapsed_time": "1:34:35", "remaining_time": "1:07:33"}
{"current_steps": 72, "total_steps": 120, "loss": 0.6934, "lr": 3.125275635174497e-05, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "1:37:08", "remaining_time": "1:04:45"}
{"current_steps": 72, "total_steps": 120, "eval_loss": 0.7228327989578247, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "1:37:21", "remaining_time": "1:04:54"}
{"current_steps": 74, "total_steps": 120, "loss": 0.6659, "lr": 2.9115861406186593e-05, "epoch": 6.168421052631579, "percentage": 61.67, "elapsed_time": "1:40:05", "remaining_time": "1:02:12"}
{"current_steps": 76, "total_steps": 120, "loss": 0.6659, "lr": 2.7012021231812666e-05, "epoch": 6.336842105263158, "percentage": 63.33, "elapsed_time": "1:42:50", "remaining_time": "0:59:32"}
{"current_steps": 78, "total_steps": 120, "loss": 0.6888, "lr": 2.4947625122086585e-05, "epoch": 6.505263157894737, "percentage": 65.0, "elapsed_time": "1:45:31", "remaining_time": "0:56:49"}
{"current_steps": 80, "total_steps": 120, "loss": 0.6868, "lr": 2.2928942580143855e-05, "epoch": 6.673684210526316, "percentage": 66.67, "elapsed_time": "1:48:06", "remaining_time": "0:54:03"}
{"current_steps": 82, "total_steps": 120, "loss": 0.7081, "lr": 2.096210427851706e-05, "epoch": 6.842105263157895, "percentage": 68.33, "elapsed_time": "1:50:48", "remaining_time": "0:51:20"}
{"current_steps": 84, "total_steps": 120, "loss": 0.6727, "lr": 1.9053083440484887e-05, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "1:53:19", "remaining_time": "0:48:34"}
{"current_steps": 84, "total_steps": 120, "eval_loss": 0.7168187499046326, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "1:53:32", "remaining_time": "0:48:39"}
{"current_steps": 86, "total_steps": 120, "loss": 0.6816, "lr": 1.7207677699589355e-05, "epoch": 7.168421052631579, "percentage": 71.67, "elapsed_time": "1:56:14", "remaining_time": "0:45:57"}
{"current_steps": 88, "total_steps": 120, "loss": 0.6642, "lr": 1.5431491492413288e-05, "epoch": 7.336842105263158, "percentage": 73.33, "elapsed_time": "1:58:59", "remaining_time": "0:43:16"}
{"current_steps": 90, "total_steps": 120, "loss": 0.6729, "lr": 1.3729919038090627e-05, "epoch": 7.505263157894737, "percentage": 75.0, "elapsed_time": "2:01:38", "remaining_time": "0:40:32"}
{"current_steps": 92, "total_steps": 120, "loss": 0.6697, "lr": 1.2108127956240186e-05, "epoch": 7.673684210526316, "percentage": 76.67, "elapsed_time": "2:04:19", "remaining_time": "0:37:50"}
{"current_steps": 94, "total_steps": 120, "loss": 0.6757, "lr": 1.0571043573074737e-05, "epoch": 7.842105263157895, "percentage": 78.33, "elapsed_time": "2:07:01", "remaining_time": "0:35:07"}
{"current_steps": 96, "total_steps": 120, "loss": 0.69, "lr": 9.123333963347166e-06, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "2:09:30", "remaining_time": "0:32:22"}
{"current_steps": 96, "total_steps": 120, "eval_loss": 0.7133689522743225, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "2:09:43", "remaining_time": "0:32:25"}
{"current_steps": 98, "total_steps": 120, "loss": 0.6674, "lr": 7.769395773560874e-06, "epoch": 8.16842105263158, "percentage": 81.67, "elapsed_time": "2:12:34", "remaining_time": "0:29:45"}
{"current_steps": 100, "total_steps": 120, "loss": 0.6833, "lr": 6.513340869498859e-06, "epoch": 8.336842105263157, "percentage": 83.33, "elapsed_time": "2:15:15", "remaining_time": "0:27:03"}
{"current_steps": 102, "total_steps": 120, "loss": 0.6743, "lr": 5.358983848622452e-06, "epoch": 8.505263157894737, "percentage": 85.0, "elapsed_time": "2:17:54", "remaining_time": "0:24:20"}
{"current_steps": 104, "total_steps": 120, "loss": 0.6636, "lr": 4.3098304552642385e-06, "epoch": 8.673684210526316, "percentage": 86.67, "elapsed_time": "2:20:36", "remaining_time": "0:21:37"}
{"current_steps": 106, "total_steps": 120, "loss": 0.6609, "lr": 3.3690669337977e-06, "epoch": 8.842105263157894, "percentage": 88.33, "elapsed_time": "2:23:15", "remaining_time": "0:18:55"}
{"current_steps": 108, "total_steps": 120, "loss": 0.6892, "lr": 2.5395503521178143e-06, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "2:25:43", "remaining_time": "0:16:11"}
{"current_steps": 108, "total_steps": 120, "eval_loss": 0.7123732566833496, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "2:25:56", "remaining_time": "0:16:12"}
{"current_steps": 110, "total_steps": 120, "loss": 0.6742, "lr": 1.8237999248197002e-06, "epoch": 9.16842105263158, "percentage": 91.67, "elapsed_time": "2:28:46", "remaining_time": "0:13:31"}
{"current_steps": 112, "total_steps": 120, "loss": 0.6949, "lr": 1.2239893624267852e-06, "epoch": 9.336842105263157, "percentage": 93.33, "elapsed_time": "2:31:21", "remaining_time": "0:10:48"}
{"current_steps": 114, "total_steps": 120, "loss": 0.6467, "lr": 7.419402699032852e-07, "epoch": 9.505263157894737, "percentage": 95.0, "elapsed_time": "2:34:00", "remaining_time": "0:08:06"}
{"current_steps": 116, "total_steps": 120, "loss": 0.6643, "lr": 3.791166144998704e-07, "epoch": 9.673684210526316, "percentage": 96.67, "elapsed_time": "2:36:43", "remaining_time": "0:05:24"}
{"current_steps": 118, "total_steps": 120, "loss": 0.6764, "lr": 1.3662027973320614e-07, "epoch": 9.842105263157894, "percentage": 98.33, "elapsed_time": "2:39:24", "remaining_time": "0:02:42"}
{"current_steps": 120, "total_steps": 120, "loss": 0.6735, "lr": 1.5187719001943378e-08, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "2:41:53", "remaining_time": "0:00:00"}
{"current_steps": 120, "total_steps": 120, "eval_loss": 0.7120494842529297, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "2:42:06", "remaining_time": "0:00:00"}
{"current_steps": 120, "total_steps": 120, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "2:42:14", "remaining_time": "0:00:00"}