qwen_binary_5000_sft03 / trainer_log.jsonl
jinqij's picture
Upload folder using huggingface_hub
e53275a verified
{"current_steps": 10, "total_steps": 156, "loss": 0.722, "accuracy": 0.4906249940395355, "lr": 6.249999999999999e-07, "epoch": 0.064, "percentage": 6.41, "elapsed_time": "0:06:33", "remaining_time": "1:35:46"}
{"current_steps": 20, "total_steps": 156, "loss": 0.5035, "accuracy": 0.925000011920929, "lr": 9.979871469976195e-07, "epoch": 0.128, "percentage": 12.82, "elapsed_time": "0:12:47", "remaining_time": "1:26:58"}
{"current_steps": 30, "total_steps": 156, "loss": 0.1368, "accuracy": 0.996874988079071, "lr": 9.755282581475767e-07, "epoch": 0.192, "percentage": 19.23, "elapsed_time": "0:18:54", "remaining_time": "1:19:25"}
{"current_steps": 40, "total_steps": 156, "loss": 0.0662, "accuracy": 0.9937499761581421, "lr": 9.29224396800933e-07, "epoch": 0.256, "percentage": 25.64, "elapsed_time": "0:24:58", "remaining_time": "1:12:25"}
{"current_steps": 50, "total_steps": 156, "loss": 0.0562, "accuracy": 0.9906250238418579, "lr": 8.613974319136957e-07, "epoch": 0.32, "percentage": 32.05, "elapsed_time": "0:31:04", "remaining_time": "1:05:52"}
{"current_steps": 60, "total_steps": 156, "loss": 0.051, "accuracy": 1.0, "lr": 7.754484907260512e-07, "epoch": 0.384, "percentage": 38.46, "elapsed_time": "0:37:05", "remaining_time": "0:59:21"}
{"current_steps": 70, "total_steps": 156, "loss": 0.0596, "accuracy": 0.984375, "lr": 6.756874120406714e-07, "epoch": 0.448, "percentage": 44.87, "elapsed_time": "0:43:14", "remaining_time": "0:53:07"}
{"current_steps": 80, "total_steps": 156, "loss": 0.0476, "accuracy": 1.0, "lr": 5.671166329088277e-07, "epoch": 0.512, "percentage": 51.28, "elapsed_time": "0:49:38", "remaining_time": "0:47:10"}
{"current_steps": 90, "total_steps": 156, "loss": 0.0575, "accuracy": 0.987500011920929, "lr": 4.5518034554828327e-07, "epoch": 0.576, "percentage": 57.69, "elapsed_time": "0:55:51", "remaining_time": "0:40:57"}
{"current_steps": 100, "total_steps": 156, "loss": 0.0454, "accuracy": 1.0, "lr": 3.454915028125263e-07, "epoch": 0.64, "percentage": 64.1, "elapsed_time": "1:02:12", "remaining_time": "0:34:50"}
{"current_steps": 110, "total_steps": 156, "loss": 0.0481, "accuracy": 1.0, "lr": 2.4355036129704696e-07, "epoch": 0.704, "percentage": 70.51, "elapsed_time": "1:08:28", "remaining_time": "0:28:38"}
{"current_steps": 120, "total_steps": 156, "loss": 0.0838, "accuracy": 0.984375, "lr": 1.5446867550656767e-07, "epoch": 0.768, "percentage": 76.92, "elapsed_time": "1:14:42", "remaining_time": "0:22:24"}
{"current_steps": 130, "total_steps": 156, "loss": 0.0652, "accuracy": 0.984375, "lr": 8.271337313934867e-08, "epoch": 0.832, "percentage": 83.33, "elapsed_time": "1:21:00", "remaining_time": "0:16:12"}
{"current_steps": 140, "total_steps": 156, "loss": 0.0472, "accuracy": 0.996874988079071, "lr": 3.188256468013139e-08, "epoch": 0.896, "percentage": 89.74, "elapsed_time": "1:27:30", "remaining_time": "0:10:00"}
{"current_steps": 150, "total_steps": 156, "loss": 0.0801, "accuracy": 0.987500011920929, "lr": 4.5251191160326495e-09, "epoch": 0.96, "percentage": 96.15, "elapsed_time": "1:34:00", "remaining_time": "0:03:45"}
{"current_steps": 156, "total_steps": 156, "epoch": 0.9984, "percentage": 100.0, "elapsed_time": "1:38:06", "remaining_time": "0:00:00"}