| {"current_steps": 5, "total_steps": 168, "loss": 2.9731, "lr": 5.000000000000001e-07, "epoch": 0.08888888888888889, "percentage": 2.98, "elapsed_time": "0:01:11", "remaining_time": "0:38:48", "throughput": 400.5, "total_tokens": 28608} |
| {"current_steps": 10, "total_steps": 168, "loss": 3.068, "lr": 1.0000000000000002e-06, "epoch": 0.17777777777777778, "percentage": 5.95, "elapsed_time": "0:02:26", "remaining_time": "0:38:35", "throughput": 388.29, "total_tokens": 56912} |
| {"current_steps": 15, "total_steps": 168, "loss": 2.9741, "lr": 1.5e-06, "epoch": 0.26666666666666666, "percentage": 8.93, "elapsed_time": "0:03:39", "remaining_time": "0:37:14", "throughput": 387.99, "total_tokens": 85008} |
| {"current_steps": 20, "total_steps": 168, "loss": 2.7761, "lr": 2.0000000000000003e-06, "epoch": 0.35555555555555557, "percentage": 11.9, "elapsed_time": "0:04:56", "remaining_time": "0:36:36", "throughput": 385.5, "total_tokens": 114416} |
| {"current_steps": 25, "total_steps": 168, "loss": 2.652, "lr": 2.5e-06, "epoch": 0.4444444444444444, "percentage": 14.88, "elapsed_time": "0:06:20", "remaining_time": "0:36:16", "throughput": 383.71, "total_tokens": 145984} |
| {"current_steps": 30, "total_steps": 168, "loss": 2.7979, "lr": 3e-06, "epoch": 0.5333333333333333, "percentage": 17.86, "elapsed_time": "0:07:33", "remaining_time": "0:34:47", "throughput": 380.44, "total_tokens": 172608} |
| {"current_steps": 35, "total_steps": 168, "loss": 2.5789, "lr": 3.5e-06, "epoch": 0.6222222222222222, "percentage": 20.83, "elapsed_time": "0:08:45", "remaining_time": "0:33:16", "throughput": 380.45, "total_tokens": 199888} |
| {"current_steps": 40, "total_steps": 168, "loss": 2.5007, "lr": 4.000000000000001e-06, "epoch": 0.7111111111111111, "percentage": 23.81, "elapsed_time": "0:09:57", "remaining_time": "0:31:51", "throughput": 379.52, "total_tokens": 226672} |
| {"current_steps": 45, "total_steps": 168, "loss": 2.3715, "lr": 4.5e-06, "epoch": 0.8, "percentage": 26.79, "elapsed_time": "0:11:07", "remaining_time": "0:30:24", "throughput": 379.93, "total_tokens": 253568} |
| {"current_steps": 50, "total_steps": 168, "loss": 2.2343, "lr": 5e-06, "epoch": 0.8888888888888888, "percentage": 29.76, "elapsed_time": "0:12:17", "remaining_time": "0:29:01", "throughput": 379.48, "total_tokens": 280048} |
| {"current_steps": 55, "total_steps": 168, "loss": 2.0521, "lr": 5.500000000000001e-06, "epoch": 0.9777777777777777, "percentage": 32.74, "elapsed_time": "0:13:31", "remaining_time": "0:27:47", "throughput": 378.97, "total_tokens": 307648} |
| {"current_steps": 60, "total_steps": 168, "loss": 1.9834, "lr": 6e-06, "epoch": 1.0533333333333332, "percentage": 35.71, "elapsed_time": "0:14:33", "remaining_time": "0:26:11", "throughput": 378.12, "total_tokens": 330192} |
| {"current_steps": 65, "total_steps": 168, "loss": 1.7906, "lr": 6.5000000000000004e-06, "epoch": 1.1422222222222222, "percentage": 38.69, "elapsed_time": "0:15:50", "remaining_time": "0:25:05", "throughput": 378.56, "total_tokens": 359648} |
| {"current_steps": 70, "total_steps": 168, "loss": 1.762, "lr": 7e-06, "epoch": 1.231111111111111, "percentage": 41.67, "elapsed_time": "0:17:04", "remaining_time": "0:23:53", "throughput": 377.79, "total_tokens": 386896} |
| {"current_steps": 75, "total_steps": 168, "loss": 1.6224, "lr": 7.500000000000001e-06, "epoch": 1.32, "percentage": 44.64, "elapsed_time": "0:18:31", "remaining_time": "0:22:58", "throughput": 377.85, "total_tokens": 420112} |
| {"current_steps": 80, "total_steps": 168, "loss": 1.5772, "lr": 8.000000000000001e-06, "epoch": 1.4088888888888889, "percentage": 47.62, "elapsed_time": "0:19:44", "remaining_time": "0:21:42", "throughput": 377.67, "total_tokens": 447184} |
| {"current_steps": 85, "total_steps": 168, "loss": 1.4699, "lr": 8.5e-06, "epoch": 1.4977777777777779, "percentage": 50.6, "elapsed_time": "0:20:59", "remaining_time": "0:20:30", "throughput": 377.42, "total_tokens": 475488} |
| {"current_steps": 90, "total_steps": 168, "loss": 1.3757, "lr": 9e-06, "epoch": 1.5866666666666667, "percentage": 53.57, "elapsed_time": "0:22:08", "remaining_time": "0:19:11", "throughput": 376.91, "total_tokens": 500832} |
| {"current_steps": 95, "total_steps": 168, "loss": 1.2694, "lr": 9.5e-06, "epoch": 1.6755555555555555, "percentage": 56.55, "elapsed_time": "0:23:24", "remaining_time": "0:17:59", "throughput": 376.83, "total_tokens": 529264} |
| {"current_steps": 100, "total_steps": 168, "loss": 1.2201, "lr": 1e-05, "epoch": 1.7644444444444445, "percentage": 59.52, "elapsed_time": "0:24:40", "remaining_time": "0:16:46", "throughput": 376.65, "total_tokens": 557664} |
| {"current_steps": 105, "total_steps": 168, "loss": 1.1181, "lr": 1.0500000000000001e-05, "epoch": 1.8533333333333335, "percentage": 62.5, "elapsed_time": "0:25:53", "remaining_time": "0:15:32", "throughput": 376.4, "total_tokens": 584736} |
| {"current_steps": 110, "total_steps": 168, "loss": 1.1125, "lr": 1.1000000000000001e-05, "epoch": 1.942222222222222, "percentage": 65.48, "elapsed_time": "0:27:04", "remaining_time": "0:14:16", "throughput": 376.35, "total_tokens": 611504} |
| {"current_steps": 115, "total_steps": 168, "loss": 1.0315, "lr": 1.15e-05, "epoch": 2.017777777777778, "percentage": 68.45, "elapsed_time": "0:28:06", "remaining_time": "0:12:57", "throughput": 376.18, "total_tokens": 634416} |
| {"current_steps": 120, "total_steps": 168, "loss": 0.9411, "lr": 1.2e-05, "epoch": 2.1066666666666665, "percentage": 71.43, "elapsed_time": "0:29:29", "remaining_time": "0:11:47", "throughput": 376.39, "total_tokens": 665968} |
| {"current_steps": 125, "total_steps": 168, "loss": 0.8717, "lr": 1.25e-05, "epoch": 2.1955555555555555, "percentage": 74.4, "elapsed_time": "0:30:40", "remaining_time": "0:10:33", "throughput": 376.2, "total_tokens": 692560} |
| {"current_steps": 130, "total_steps": 168, "loss": 0.8609, "lr": 1.3000000000000001e-05, "epoch": 2.2844444444444445, "percentage": 77.38, "elapsed_time": "0:31:49", "remaining_time": "0:09:18", "throughput": 375.94, "total_tokens": 717968} |
| {"current_steps": 135, "total_steps": 168, "loss": 0.8748, "lr": 1.3500000000000001e-05, "epoch": 2.3733333333333335, "percentage": 80.36, "elapsed_time": "0:33:05", "remaining_time": "0:08:05", "throughput": 375.78, "total_tokens": 746272} |
| {"current_steps": 140, "total_steps": 168, "loss": 0.8541, "lr": 1.4e-05, "epoch": 2.462222222222222, "percentage": 83.33, "elapsed_time": "0:34:28", "remaining_time": "0:06:53", "throughput": 375.53, "total_tokens": 776928} |
| {"current_steps": 145, "total_steps": 168, "loss": 0.8282, "lr": 1.45e-05, "epoch": 2.551111111111111, "percentage": 86.31, "elapsed_time": "0:35:49", "remaining_time": "0:05:40", "throughput": 375.56, "total_tokens": 807328} |
| {"current_steps": 150, "total_steps": 168, "loss": 0.8178, "lr": 1.5000000000000002e-05, "epoch": 2.64, "percentage": 89.29, "elapsed_time": "0:37:03", "remaining_time": "0:04:26", "throughput": 375.4, "total_tokens": 834608} |
| {"current_steps": 155, "total_steps": 168, "loss": 0.7387, "lr": 1.55e-05, "epoch": 2.728888888888889, "percentage": 92.26, "elapsed_time": "0:38:16", "remaining_time": "0:03:12", "throughput": 375.11, "total_tokens": 861456} |
| {"current_steps": 160, "total_steps": 168, "loss": 0.7247, "lr": 1.6000000000000003e-05, "epoch": 2.8177777777777777, "percentage": 95.24, "elapsed_time": "0:39:25", "remaining_time": "0:01:58", "throughput": 374.95, "total_tokens": 886960} |
| {"current_steps": 165, "total_steps": 168, "loss": 0.7848, "lr": 1.65e-05, "epoch": 2.9066666666666667, "percentage": 98.21, "elapsed_time": "0:40:38", "remaining_time": "0:00:44", "throughput": 374.9, "total_tokens": 914176} |
| {"current_steps": 168, "total_steps": 168, "epoch": 2.96, "percentage": 100.0, "elapsed_time": "0:41:30", "remaining_time": "0:00:00", "throughput": 374.11, "total_tokens": 931840} |
|
|