sft / trainer_log.jsonl
lillian039's picture
Training in progress, step 250
3543cdf verified
{"current_steps": 10, "total_steps": 1392, "loss": 2.5556, "lr": 6.428571428571428e-07, "epoch": 0.021528525296017224, "percentage": 0.72, "elapsed_time": "0:08:01", "remaining_time": "18:28:38"}
{"current_steps": 20, "total_steps": 1392, "loss": 2.0585, "lr": 1.3571428571428572e-06, "epoch": 0.04305705059203445, "percentage": 1.44, "elapsed_time": "0:15:53", "remaining_time": "18:10:09"}
{"current_steps": 30, "total_steps": 1392, "loss": 0.6843, "lr": 2.0714285714285717e-06, "epoch": 0.06458557588805167, "percentage": 2.16, "elapsed_time": "0:23:42", "remaining_time": "17:56:09"}
{"current_steps": 40, "total_steps": 1392, "loss": 0.0841, "lr": 2.785714285714286e-06, "epoch": 0.0861141011840689, "percentage": 2.87, "elapsed_time": "0:31:34", "remaining_time": "17:47:01"}
{"current_steps": 50, "total_steps": 1392, "loss": 0.06, "lr": 3.5e-06, "epoch": 0.10764262648008611, "percentage": 3.59, "elapsed_time": "0:39:26", "remaining_time": "17:38:41"}
{"current_steps": 60, "total_steps": 1392, "loss": 0.0385, "lr": 4.2142857142857145e-06, "epoch": 0.12917115177610333, "percentage": 4.31, "elapsed_time": "0:47:30", "remaining_time": "17:34:44"}
{"current_steps": 70, "total_steps": 1392, "loss": 0.0336, "lr": 4.928571428571429e-06, "epoch": 0.15069967707212056, "percentage": 5.03, "elapsed_time": "0:55:19", "remaining_time": "17:24:44"}
{"current_steps": 80, "total_steps": 1392, "loss": 0.0302, "lr": 5.6428571428571435e-06, "epoch": 0.1722282023681378, "percentage": 5.75, "elapsed_time": "1:03:10", "remaining_time": "17:16:10"}
{"current_steps": 90, "total_steps": 1392, "loss": 0.0247, "lr": 6.357142857142858e-06, "epoch": 0.193756727664155, "percentage": 6.47, "elapsed_time": "1:10:58", "remaining_time": "17:06:47"}
{"current_steps": 100, "total_steps": 1392, "loss": 0.025, "lr": 7.0714285714285726e-06, "epoch": 0.21528525296017223, "percentage": 7.18, "elapsed_time": "1:18:49", "remaining_time": "16:58:27"}
{"current_steps": 110, "total_steps": 1392, "loss": 0.0251, "lr": 7.785714285714287e-06, "epoch": 0.23681377825618946, "percentage": 7.9, "elapsed_time": "1:26:54", "remaining_time": "16:52:54"}
{"current_steps": 120, "total_steps": 1392, "loss": 0.0232, "lr": 8.5e-06, "epoch": 0.25834230355220666, "percentage": 8.62, "elapsed_time": "1:34:48", "remaining_time": "16:44:57"}
{"current_steps": 130, "total_steps": 1392, "loss": 0.0226, "lr": 9.214285714285715e-06, "epoch": 0.2798708288482239, "percentage": 9.34, "elapsed_time": "1:42:40", "remaining_time": "16:36:46"}
{"current_steps": 140, "total_steps": 1392, "loss": 0.0209, "lr": 9.92857142857143e-06, "epoch": 0.3013993541442411, "percentage": 10.06, "elapsed_time": "1:50:31", "remaining_time": "16:28:23"}
{"current_steps": 150, "total_steps": 1392, "loss": 0.0222, "lr": 9.998725036777437e-06, "epoch": 0.32292787944025836, "percentage": 10.78, "elapsed_time": "1:58:24", "remaining_time": "16:20:25"}
{"current_steps": 160, "total_steps": 1392, "loss": 0.0212, "lr": 9.994318591270081e-06, "epoch": 0.3444564047362756, "percentage": 11.49, "elapsed_time": "2:06:29", "remaining_time": "16:13:58"}
{"current_steps": 170, "total_steps": 1392, "loss": 0.0201, "lr": 9.986767696851472e-06, "epoch": 0.36598493003229277, "percentage": 12.21, "elapsed_time": "2:14:21", "remaining_time": "16:05:50"}
{"current_steps": 180, "total_steps": 1392, "loss": 0.0206, "lr": 9.976077107603933e-06, "epoch": 0.38751345532831, "percentage": 12.93, "elapsed_time": "2:22:13", "remaining_time": "15:57:41"}
{"current_steps": 190, "total_steps": 1392, "loss": 0.017, "lr": 9.962253554377952e-06, "epoch": 0.40904198062432723, "percentage": 13.65, "elapsed_time": "2:30:05", "remaining_time": "15:49:29"}
{"current_steps": 200, "total_steps": 1392, "loss": 0.0182, "lr": 9.945305740554397e-06, "epoch": 0.43057050592034446, "percentage": 14.37, "elapsed_time": "2:37:59", "remaining_time": "15:41:35"}
{"current_steps": 210, "total_steps": 1392, "loss": 0.0197, "lr": 9.925244336564831e-06, "epoch": 0.4520990312163617, "percentage": 15.09, "elapsed_time": "2:46:04", "remaining_time": "15:34:48"}
{"current_steps": 220, "total_steps": 1392, "loss": 0.0187, "lr": 9.902081973173352e-06, "epoch": 0.4736275565123789, "percentage": 15.8, "elapsed_time": "2:53:55", "remaining_time": "15:26:35"}
{"current_steps": 230, "total_steps": 1392, "loss": 0.0154, "lr": 9.875833233524183e-06, "epoch": 0.4951560818083961, "percentage": 16.52, "elapsed_time": "3:01:45", "remaining_time": "15:18:16"}
{"current_steps": 240, "total_steps": 1392, "loss": 0.0176, "lr": 9.846514643960072e-06, "epoch": 0.5166846071044133, "percentage": 17.24, "elapsed_time": "3:09:42", "remaining_time": "15:10:34"}
{"current_steps": 250, "total_steps": 1392, "loss": 0.0182, "lr": 9.814144663617204e-06, "epoch": 0.5382131324004306, "percentage": 17.96, "elapsed_time": "3:17:32", "remaining_time": "15:02:20"}