| {"current_steps": 5, "total_steps": 1800, "loss": 0.1508, "lr": 0.0006666666666666666, "epoch": 0.05555555555555555, "percentage": 0.28, "elapsed_time": "0:00:01", "remaining_time": "0:07:54", "throughput": 1211.63, "total_tokens": 1600} |
| {"current_steps": 10, "total_steps": 1800, "loss": 0.1225, "lr": 0.0015, "epoch": 0.1111111111111111, "percentage": 0.56, "elapsed_time": "0:00:02", "remaining_time": "0:06:14", "throughput": 1527.49, "total_tokens": 3200} |
| {"current_steps": 15, "total_steps": 1800, "loss": 0.2189, "lr": 0.002333333333333333, "epoch": 0.16666666666666666, "percentage": 0.83, "elapsed_time": "0:00:02", "remaining_time": "0:05:41", "throughput": 1663.76, "total_tokens": 4768} |
| {"current_steps": 20, "total_steps": 1800, "loss": 0.2288, "lr": 0.0031666666666666666, "epoch": 0.2222222222222222, "percentage": 1.11, "elapsed_time": "0:00:03", "remaining_time": "0:05:23", "throughput": 1742.37, "total_tokens": 6336} |
| {"current_steps": 25, "total_steps": 1800, "loss": 4.5867, "lr": 0.004, "epoch": 0.2777777777777778, "percentage": 1.39, "elapsed_time": "0:00:04", "remaining_time": "0:05:12", "throughput": 1793.47, "total_tokens": 7904} |
| {"current_steps": 30, "total_steps": 1800, "loss": 3.3424, "lr": 0.004833333333333334, "epoch": 0.3333333333333333, "percentage": 1.67, "elapsed_time": "0:00:05", "remaining_time": "0:05:05", "throughput": 1834.72, "total_tokens": 9504} |
| {"current_steps": 35, "total_steps": 1800, "loss": 1.1922, "lr": 0.005666666666666666, "epoch": 0.3888888888888889, "percentage": 1.94, "elapsed_time": "0:00:05", "remaining_time": "0:05:00", "throughput": 1860.42, "total_tokens": 11072} |
| {"current_steps": 40, "total_steps": 1800, "loss": 0.5121, "lr": 0.0065, "epoch": 0.4444444444444444, "percentage": 2.22, "elapsed_time": "0:00:06", "remaining_time": "0:04:55", "throughput": 1884.74, "total_tokens": 12672} |
| {"current_steps": 45, "total_steps": 1800, "loss": 0.2904, "lr": 0.007333333333333333, "epoch": 0.5, "percentage": 2.5, "elapsed_time": "0:00:07", "remaining_time": "0:04:52", "throughput": 1892.77, "total_tokens": 14176} |
| {"current_steps": 50, "total_steps": 1800, "loss": 0.3048, "lr": 0.008166666666666666, "epoch": 0.5555555555555556, "percentage": 2.78, "elapsed_time": "0:00:08", "remaining_time": "0:04:49", "throughput": 1909.08, "total_tokens": 15776} |
| {"current_steps": 55, "total_steps": 1800, "loss": 0.3677, "lr": 0.009, "epoch": 0.6111111111111112, "percentage": 3.06, "elapsed_time": "0:00:09", "remaining_time": "0:04:46", "throughput": 1916.57, "total_tokens": 17312} |
| {"current_steps": 60, "total_steps": 1800, "loss": 0.2604, "lr": 0.009833333333333333, "epoch": 0.6666666666666666, "percentage": 3.33, "elapsed_time": "0:00:09", "remaining_time": "0:04:44", "throughput": 1922.94, "total_tokens": 18848} |
| {"current_steps": 65, "total_steps": 1800, "loss": 0.256, "lr": 0.010666666666666666, "epoch": 0.7222222222222222, "percentage": 3.61, "elapsed_time": "0:00:10", "remaining_time": "0:04:42", "throughput": 1933.79, "total_tokens": 20448} |
| {"current_steps": 70, "total_steps": 1800, "loss": 0.5609, "lr": 0.0115, "epoch": 0.7777777777777778, "percentage": 3.89, "elapsed_time": "0:00:11", "remaining_time": "0:04:40", "throughput": 1940.71, "total_tokens": 22016} |
| {"current_steps": 75, "total_steps": 1800, "loss": 1.0653, "lr": 0.012333333333333332, "epoch": 0.8333333333333334, "percentage": 4.17, "elapsed_time": "0:00:12", "remaining_time": "0:04:38", "throughput": 1949.01, "total_tokens": 23616} |
| {"current_steps": 80, "total_steps": 1800, "loss": 0.2765, "lr": 0.013166666666666667, "epoch": 0.8888888888888888, "percentage": 4.44, "elapsed_time": "0:00:12", "remaining_time": "0:04:37", "throughput": 1951.85, "total_tokens": 25152} |
| {"current_steps": 85, "total_steps": 1800, "loss": 1.0491, "lr": 0.014, "epoch": 0.9444444444444444, "percentage": 4.72, "elapsed_time": "0:00:13", "remaining_time": "0:04:35", "throughput": 1953.7, "total_tokens": 26688} |
| {"current_steps": 90, "total_steps": 1800, "loss": 0.26, "lr": 0.014833333333333334, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:00:14", "remaining_time": "0:04:34", "throughput": 1953.06, "total_tokens": 28256} |
| {"current_steps": 90, "total_steps": 1800, "eval_loss": 0.23620998859405518, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:00:15", "remaining_time": "0:04:50", "throughput": 1849.98, "total_tokens": 28256} |
| {"current_steps": 95, "total_steps": 1800, "loss": 0.29, "lr": 0.015666666666666666, "epoch": 1.0555555555555556, "percentage": 5.28, "elapsed_time": "0:00:16", "remaining_time": "0:05:03", "throughput": 1763.95, "total_tokens": 29824} |
| {"current_steps": 100, "total_steps": 1800, "loss": 0.3073, "lr": 0.0165, "epoch": 1.1111111111111112, "percentage": 5.56, "elapsed_time": "0:00:17", "remaining_time": "0:05:00", "throughput": 1773.59, "total_tokens": 31360} |
| {"current_steps": 105, "total_steps": 1800, "loss": 0.231, "lr": 0.017333333333333333, "epoch": 1.1666666666666667, "percentage": 5.83, "elapsed_time": "0:00:18", "remaining_time": "0:04:58", "throughput": 1783.2, "total_tokens": 32960} |
| {"current_steps": 110, "total_steps": 1800, "loss": 0.2256, "lr": 0.018166666666666664, "epoch": 1.2222222222222223, "percentage": 6.11, "elapsed_time": "0:00:19", "remaining_time": "0:04:55", "throughput": 1790.16, "total_tokens": 34464} |
|
|