QWQ-RED_DS-RED_final_model_sft / trainer_log.jsonl
yuzhounie's picture
Training in progress, step 30
ee30ab4 verified
{"current_steps": 1, "total_steps": 30, "loss": 1.1331, "lr": 0.0, "epoch": 0.06349206349206349, "percentage": 3.33, "elapsed_time": "0:00:12", "remaining_time": "0:05:58"}
{"current_steps": 2, "total_steps": 30, "loss": 0.9839, "lr": 3.3333333333333333e-06, "epoch": 0.12698412698412698, "percentage": 6.67, "elapsed_time": "0:00:23", "remaining_time": "0:05:25"}
{"current_steps": 3, "total_steps": 30, "loss": 1.1706, "lr": 6.666666666666667e-06, "epoch": 0.19047619047619047, "percentage": 10.0, "elapsed_time": "0:00:31", "remaining_time": "0:04:47"}
{"current_steps": 4, "total_steps": 30, "loss": 0.9681, "lr": 1e-05, "epoch": 0.25396825396825395, "percentage": 13.33, "elapsed_time": "0:00:40", "remaining_time": "0:04:26"}
{"current_steps": 5, "total_steps": 30, "loss": 0.8197, "lr": 9.966191788709716e-06, "epoch": 0.31746031746031744, "percentage": 16.67, "elapsed_time": "0:00:50", "remaining_time": "0:04:14"}
{"current_steps": 6, "total_steps": 30, "loss": 0.8382, "lr": 9.86522435289912e-06, "epoch": 0.38095238095238093, "percentage": 20.0, "elapsed_time": "0:00:57", "remaining_time": "0:03:51"}
{"current_steps": 7, "total_steps": 30, "loss": 0.9836, "lr": 9.698463103929542e-06, "epoch": 0.4444444444444444, "percentage": 23.33, "elapsed_time": "0:01:04", "remaining_time": "0:03:31"}
{"current_steps": 8, "total_steps": 30, "loss": 0.8731, "lr": 9.468163201617063e-06, "epoch": 0.5079365079365079, "percentage": 26.67, "elapsed_time": "0:01:11", "remaining_time": "0:03:15"}
{"current_steps": 9, "total_steps": 30, "loss": 0.8753, "lr": 9.177439057064684e-06, "epoch": 0.5714285714285714, "percentage": 30.0, "elapsed_time": "0:01:17", "remaining_time": "0:03:01"}
{"current_steps": 10, "total_steps": 30, "loss": 0.9582, "lr": 8.83022221559489e-06, "epoch": 0.6349206349206349, "percentage": 33.33, "elapsed_time": "0:01:24", "remaining_time": "0:02:49"}
{"current_steps": 11, "total_steps": 30, "loss": 0.785, "lr": 8.43120818934367e-06, "epoch": 0.6984126984126984, "percentage": 36.67, "elapsed_time": "0:01:33", "remaining_time": "0:02:41"}
{"current_steps": 12, "total_steps": 30, "loss": 0.8561, "lr": 7.985792958513932e-06, "epoch": 0.7619047619047619, "percentage": 40.0, "elapsed_time": "0:01:40", "remaining_time": "0:02:30"}
{"current_steps": 13, "total_steps": 30, "loss": 0.9083, "lr": 7.500000000000001e-06, "epoch": 0.8253968253968254, "percentage": 43.33, "elapsed_time": "0:01:51", "remaining_time": "0:02:25"}
{"current_steps": 14, "total_steps": 30, "loss": 0.8333, "lr": 6.980398830195785e-06, "epoch": 0.8888888888888888, "percentage": 46.67, "elapsed_time": "0:01:58", "remaining_time": "0:02:15"}
{"current_steps": 15, "total_steps": 30, "loss": 0.8507, "lr": 6.434016163555452e-06, "epoch": 0.9523809523809523, "percentage": 50.0, "elapsed_time": "0:02:05", "remaining_time": "0:02:05"}
{"current_steps": 16, "total_steps": 30, "loss": 0.7102, "lr": 5.8682408883346535e-06, "epoch": 1.0, "percentage": 53.33, "elapsed_time": "0:02:11", "remaining_time": "0:01:55"}
{"current_steps": 17, "total_steps": 30, "loss": 0.7307, "lr": 5.290724144552379e-06, "epoch": 1.0634920634920635, "percentage": 56.67, "elapsed_time": "0:02:19", "remaining_time": "0:01:46"}
{"current_steps": 18, "total_steps": 30, "loss": 0.6586, "lr": 4.7092758554476215e-06, "epoch": 1.126984126984127, "percentage": 60.0, "elapsed_time": "0:02:26", "remaining_time": "0:01:37"}
{"current_steps": 19, "total_steps": 30, "loss": 0.718, "lr": 4.131759111665349e-06, "epoch": 1.1904761904761905, "percentage": 63.33, "elapsed_time": "0:02:36", "remaining_time": "0:01:30"}
{"current_steps": 20, "total_steps": 30, "loss": 0.7562, "lr": 3.5659838364445505e-06, "epoch": 1.253968253968254, "percentage": 66.67, "elapsed_time": "0:02:44", "remaining_time": "0:01:22"}
{"current_steps": 21, "total_steps": 30, "loss": 0.6764, "lr": 3.019601169804216e-06, "epoch": 1.3174603174603174, "percentage": 70.0, "elapsed_time": "0:02:51", "remaining_time": "0:01:13"}
{"current_steps": 22, "total_steps": 30, "loss": 0.8151, "lr": 2.5000000000000015e-06, "epoch": 1.380952380952381, "percentage": 73.33, "elapsed_time": "0:02:59", "remaining_time": "0:01:05"}
{"current_steps": 23, "total_steps": 30, "loss": 0.6922, "lr": 2.0142070414860704e-06, "epoch": 1.4444444444444444, "percentage": 76.67, "elapsed_time": "0:03:07", "remaining_time": "0:00:56"}
{"current_steps": 24, "total_steps": 30, "loss": 0.7066, "lr": 1.5687918106563326e-06, "epoch": 1.507936507936508, "percentage": 80.0, "elapsed_time": "0:03:14", "remaining_time": "0:00:48"}
{"current_steps": 25, "total_steps": 30, "loss": 0.6978, "lr": 1.1697777844051105e-06, "epoch": 1.5714285714285714, "percentage": 83.33, "elapsed_time": "0:03:22", "remaining_time": "0:00:40"}
{"current_steps": 26, "total_steps": 30, "loss": 0.7835, "lr": 8.225609429353187e-07, "epoch": 1.6349206349206349, "percentage": 86.67, "elapsed_time": "0:03:30", "remaining_time": "0:00:32"}
{"current_steps": 27, "total_steps": 30, "loss": 0.6726, "lr": 5.318367983829393e-07, "epoch": 1.6984126984126984, "percentage": 90.0, "elapsed_time": "0:03:37", "remaining_time": "0:00:24"}
{"current_steps": 28, "total_steps": 30, "loss": 0.6786, "lr": 3.015368960704584e-07, "epoch": 1.7619047619047619, "percentage": 93.33, "elapsed_time": "0:03:45", "remaining_time": "0:00:16"}
{"current_steps": 29, "total_steps": 30, "loss": 0.647, "lr": 1.3477564710088097e-07, "epoch": 1.8253968253968254, "percentage": 96.67, "elapsed_time": "0:03:52", "remaining_time": "0:00:08"}
{"current_steps": 30, "total_steps": 30, "loss": 0.6099, "lr": 3.3808211290284886e-08, "epoch": 1.8888888888888888, "percentage": 100.0, "elapsed_time": "0:03:59", "remaining_time": "0:00:00"}
{"current_steps": 30, "total_steps": 30, "epoch": 1.8888888888888888, "percentage": 100.0, "elapsed_time": "0:05:21", "remaining_time": "0:00:00"}