| {"current_steps": 5, "total_steps": 1140, "loss": 5.1888, "lr": 3.508771929824561e-05, "epoch": 0.08771929824561403, "percentage": 0.44, "elapsed_time": "0:00:01", "remaining_time": "0:06:28", "throughput": 1890.63, "total_tokens": 3232} | |
| {"current_steps": 10, "total_steps": 1140, "loss": 1.3169, "lr": 7.894736842105263e-05, "epoch": 0.17543859649122806, "percentage": 0.88, "elapsed_time": "0:00:02", "remaining_time": "0:05:19", "throughput": 2278.16, "total_tokens": 6432} | |
| {"current_steps": 15, "total_steps": 1140, "loss": 0.5036, "lr": 0.00012280701754385965, "epoch": 0.2631578947368421, "percentage": 1.32, "elapsed_time": "0:00:03", "remaining_time": "0:04:51", "throughput": 2414.8, "total_tokens": 9376} | |
| {"current_steps": 20, "total_steps": 1140, "loss": 0.3251, "lr": 0.00016666666666666666, "epoch": 0.3508771929824561, "percentage": 1.75, "elapsed_time": "0:00:04", "remaining_time": "0:04:37", "throughput": 2511.78, "total_tokens": 12448} | |
| {"current_steps": 25, "total_steps": 1140, "loss": 0.4105, "lr": 0.00021052631578947367, "epoch": 0.43859649122807015, "percentage": 2.19, "elapsed_time": "0:00:06", "remaining_time": "0:04:29", "throughput": 2562.15, "total_tokens": 15456} | |
| {"current_steps": 30, "total_steps": 1140, "loss": 0.6098, "lr": 0.0002543859649122807, "epoch": 0.5263157894736842, "percentage": 2.63, "elapsed_time": "0:00:07", "remaining_time": "0:04:23", "throughput": 2608.91, "total_tokens": 18592} | |
| {"current_steps": 35, "total_steps": 1140, "loss": 0.284, "lr": 0.0002982456140350877, "epoch": 0.6140350877192983, "percentage": 3.07, "elapsed_time": "0:00:08", "remaining_time": "0:04:27", "throughput": 2731.72, "total_tokens": 23136} | |
| {"current_steps": 40, "total_steps": 1140, "loss": 0.4434, "lr": 0.00034210526315789477, "epoch": 0.7017543859649122, "percentage": 3.51, "elapsed_time": "0:00:09", "remaining_time": "0:04:23", "throughput": 2761.3, "total_tokens": 26496} | |
| {"current_steps": 45, "total_steps": 1140, "loss": 0.5031, "lr": 0.00038596491228070175, "epoch": 0.7894736842105263, "percentage": 3.95, "elapsed_time": "0:00:10", "remaining_time": "0:04:20", "throughput": 2774.5, "total_tokens": 29728} | |
| {"current_steps": 50, "total_steps": 1140, "loss": 0.483, "lr": 0.0004298245614035088, "epoch": 0.8771929824561403, "percentage": 4.39, "elapsed_time": "0:00:11", "remaining_time": "0:04:18", "throughput": 2787.53, "total_tokens": 33024} | |
| {"current_steps": 55, "total_steps": 1140, "loss": 0.3463, "lr": 0.00047368421052631577, "epoch": 0.9649122807017544, "percentage": 4.82, "elapsed_time": "0:00:12", "remaining_time": "0:04:14", "throughput": 2783.39, "total_tokens": 35904} | |
| {"current_steps": 57, "total_steps": 1140, "eval_loss": 0.6230526566505432, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:00:13", "remaining_time": "0:04:25", "throughput": 2609.62, "total_tokens": 36480} | |
| {"current_steps": 60, "total_steps": 1140, "loss": 0.2954, "lr": 0.0005175438596491229, "epoch": 1.0526315789473684, "percentage": 5.26, "elapsed_time": "0:00:15", "remaining_time": "0:04:41", "throughput": 2427.37, "total_tokens": 38016} | |
| {"current_steps": 65, "total_steps": 1140, "loss": 0.3105, "lr": 0.0005614035087719298, "epoch": 1.1403508771929824, "percentage": 5.7, "elapsed_time": "0:00:16", "remaining_time": "0:04:36", "throughput": 2442.98, "total_tokens": 40800} | |
| {"current_steps": 70, "total_steps": 1140, "loss": 0.3103, "lr": 0.0006052631578947369, "epoch": 1.2280701754385965, "percentage": 6.14, "elapsed_time": "0:00:17", "remaining_time": "0:04:31", "throughput": 2458.75, "total_tokens": 43648} | |
| {"current_steps": 75, "total_steps": 1140, "loss": 0.614, "lr": 0.0006491228070175439, "epoch": 1.3157894736842106, "percentage": 6.58, "elapsed_time": "0:00:18", "remaining_time": "0:04:26", "throughput": 2461.46, "total_tokens": 46112} | |
| {"current_steps": 80, "total_steps": 1140, "loss": 0.3025, "lr": 0.0006929824561403509, "epoch": 1.4035087719298245, "percentage": 7.02, "elapsed_time": "0:00:19", "remaining_time": "0:04:23", "throughput": 2496.49, "total_tokens": 49632} | |
| {"current_steps": 85, "total_steps": 1140, "loss": 0.1801, "lr": 0.0007368421052631579, "epoch": 1.4912280701754386, "percentage": 7.46, "elapsed_time": "0:00:21", "remaining_time": "0:04:20", "throughput": 2522.96, "total_tokens": 53024} | |
| {"current_steps": 90, "total_steps": 1140, "loss": 0.2907, "lr": 0.0007807017543859649, "epoch": 1.5789473684210527, "percentage": 7.89, "elapsed_time": "0:00:22", "remaining_time": "0:04:19", "throughput": 2551.49, "total_tokens": 56672} | |
| {"current_steps": 95, "total_steps": 1140, "loss": 0.4426, "lr": 0.000824561403508772, "epoch": 1.6666666666666665, "percentage": 8.33, "elapsed_time": "0:00:23", "remaining_time": "0:04:15", "throughput": 2552.47, "total_tokens": 59296} | |
| {"current_steps": 100, "total_steps": 1140, "loss": 0.2812, "lr": 0.000868421052631579, "epoch": 1.7543859649122808, "percentage": 8.77, "elapsed_time": "0:00:24", "remaining_time": "0:04:13", "throughput": 2568.41, "total_tokens": 62528} | |
| {"current_steps": 105, "total_steps": 1140, "loss": 0.1671, "lr": 0.000912280701754386, "epoch": 1.8421052631578947, "percentage": 9.21, "elapsed_time": "0:00:25", "remaining_time": "0:04:11", "throughput": 2585.2, "total_tokens": 65856} | |
| {"current_steps": 110, "total_steps": 1140, "loss": 0.341, "lr": 0.0009561403508771929, "epoch": 1.9298245614035088, "percentage": 9.65, "elapsed_time": "0:00:26", "remaining_time": "0:04:09", "throughput": 2611.62, "total_tokens": 69664} | |
| {"current_steps": 114, "total_steps": 1140, "eval_loss": 0.3803446590900421, "epoch": 2.0, "percentage": 10.0, "elapsed_time": "0:00:28", "remaining_time": "0:04:14", "throughput": 2546.62, "total_tokens": 72112} | |
| {"current_steps": 115, "total_steps": 1140, "loss": 0.4422, "lr": 0.001, "epoch": 2.017543859649123, "percentage": 10.09, "elapsed_time": "0:00:29", "remaining_time": "0:04:22", "throughput": 2471.53, "total_tokens": 72848} | |