| {"current_steps": 5, "total_steps": 900, "loss": 0.361, "lr": 2.2222222222222225e-06, "epoch": 0.05555555555555555, "percentage": 0.56, "elapsed_time": "0:00:02", "remaining_time": "0:06:22", "throughput": 719.29, "total_tokens": 1536} |
| {"current_steps": 10, "total_steps": 900, "loss": 0.3455, "lr": 5e-06, "epoch": 0.1111111111111111, "percentage": 1.11, "elapsed_time": "0:00:03", "remaining_time": "0:04:30", "throughput": 1040.57, "total_tokens": 3168} |
| {"current_steps": 15, "total_steps": 900, "loss": 0.267, "lr": 7.777777777777777e-06, "epoch": 0.16666666666666666, "percentage": 1.67, "elapsed_time": "0:00:03", "remaining_time": "0:03:53", "throughput": 1199.12, "total_tokens": 4736} |
| {"current_steps": 20, "total_steps": 900, "loss": 0.3256, "lr": 1.0555555555555555e-05, "epoch": 0.2222222222222222, "percentage": 2.22, "elapsed_time": "0:00:04", "remaining_time": "0:03:33", "throughput": 1298.1, "total_tokens": 6304} |
| {"current_steps": 25, "total_steps": 900, "loss": 0.2055, "lr": 1.3333333333333333e-05, "epoch": 0.2777777777777778, "percentage": 2.78, "elapsed_time": "0:00:05", "remaining_time": "0:03:21", "throughput": 1360.15, "total_tokens": 7840} |
| {"current_steps": 30, "total_steps": 900, "loss": 0.1017, "lr": 1.6111111111111115e-05, "epoch": 0.3333333333333333, "percentage": 3.33, "elapsed_time": "0:00:06", "remaining_time": "0:03:13", "throughput": 1409.39, "total_tokens": 9408} |
| {"current_steps": 35, "total_steps": 900, "loss": 0.2479, "lr": 1.888888888888889e-05, "epoch": 0.3888888888888889, "percentage": 3.89, "elapsed_time": "0:00:07", "remaining_time": "0:03:07", "throughput": 1439.83, "total_tokens": 10912} |
| {"current_steps": 40, "total_steps": 900, "loss": 0.1075, "lr": 2.1666666666666667e-05, "epoch": 0.4444444444444444, "percentage": 4.44, "elapsed_time": "0:00:08", "remaining_time": "0:03:02", "throughput": 1466.83, "total_tokens": 12448} |
| {"current_steps": 45, "total_steps": 900, "loss": 0.2326, "lr": 2.4444444444444445e-05, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:00:09", "remaining_time": "0:02:58", "throughput": 1492.24, "total_tokens": 14016} |
| {"current_steps": 45, "total_steps": 900, "eval_loss": 0.21843767166137695, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:00:10", "remaining_time": "0:03:19", "throughput": 1337.6, "total_tokens": 14016} |
| {"current_steps": 50, "total_steps": 900, "loss": 0.092, "lr": 2.7222222222222223e-05, "epoch": 0.5555555555555556, "percentage": 5.56, "elapsed_time": "0:00:12", "remaining_time": "0:03:31", "throughput": 1251.42, "total_tokens": 15584} |
| {"current_steps": 55, "total_steps": 900, "loss": 0.1915, "lr": 3e-05, "epoch": 0.6111111111111112, "percentage": 6.11, "elapsed_time": "0:00:13", "remaining_time": "0:03:25", "throughput": 1285.75, "total_tokens": 17184} |
| {"current_steps": 60, "total_steps": 900, "loss": 0.1305, "lr": 3.277777777777778e-05, "epoch": 0.6666666666666666, "percentage": 6.67, "elapsed_time": "0:00:14", "remaining_time": "0:03:19", "throughput": 1313.76, "total_tokens": 18752} |
| {"current_steps": 65, "total_steps": 900, "loss": 0.2508, "lr": 3.555555555555556e-05, "epoch": 0.7222222222222222, "percentage": 7.22, "elapsed_time": "0:00:15", "remaining_time": "0:03:15", "throughput": 1340.25, "total_tokens": 20352} |
| {"current_steps": 70, "total_steps": 900, "loss": 0.0133, "lr": 3.8333333333333334e-05, "epoch": 0.7777777777777778, "percentage": 7.78, "elapsed_time": "0:00:16", "remaining_time": "0:03:10", "throughput": 1363.69, "total_tokens": 21952} |
| {"current_steps": 75, "total_steps": 900, "loss": 0.0971, "lr": 4.111111111111111e-05, "epoch": 0.8333333333333334, "percentage": 8.33, "elapsed_time": "0:00:17", "remaining_time": "0:03:07", "throughput": 1379.65, "total_tokens": 23456} |
| {"current_steps": 80, "total_steps": 900, "loss": 0.335, "lr": 4.388888888888889e-05, "epoch": 0.8888888888888888, "percentage": 8.89, "elapsed_time": "0:00:17", "remaining_time": "0:03:03", "throughput": 1398.1, "total_tokens": 25056} |
| {"current_steps": 85, "total_steps": 900, "loss": 0.0556, "lr": 4.666666666666667e-05, "epoch": 0.9444444444444444, "percentage": 9.44, "elapsed_time": "0:00:18", "remaining_time": "0:03:00", "throughput": 1410.88, "total_tokens": 26560} |
| {"current_steps": 90, "total_steps": 900, "loss": 0.2002, "lr": 4.9444444444444446e-05, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:00:19", "remaining_time": "0:02:58", "throughput": 1420.38, "total_tokens": 28096} |
| {"current_steps": 90, "total_steps": 900, "eval_loss": 0.17683683335781097, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:00:20", "remaining_time": "0:03:07", "throughput": 1350.39, "total_tokens": 28096} |
| {"current_steps": 95, "total_steps": 900, "loss": 0.1392, "lr": 4.9996991493233693e-05, "epoch": 1.0555555555555556, "percentage": 10.56, "elapsed_time": "0:00:22", "remaining_time": "0:03:14", "throughput": 1292.42, "total_tokens": 29696} |
| {"current_steps": 100, "total_steps": 900, "loss": 0.1666, "lr": 4.99847706754774e-05, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:00:23", "remaining_time": "0:03:11", "throughput": 1307.41, "total_tokens": 31232} |
|
|