| {"current_steps": 5, "total_steps": 234, "loss": 0.3795, "lr": 9.988738792578126e-07, "epoch": 0.021333333333333333, "percentage": 2.14, "elapsed_time": "0:03:41", "remaining_time": "2:48:47", "throughput": 7206.08, "total_tokens": 1593504} |
| {"current_steps": 10, "total_steps": 234, "loss": 0.368, "lr": 9.955005896229541e-07, "epoch": 0.042666666666666665, "percentage": 4.27, "elapsed_time": "0:07:04", "remaining_time": "2:38:25", "throughput": 7480.99, "total_tokens": 3174528} |
| {"current_steps": 15, "total_steps": 234, "loss": 0.3613, "lr": 9.898953260211337e-07, "epoch": 0.064, "percentage": 6.41, "elapsed_time": "0:10:26", "remaining_time": "2:32:31", "throughput": 7581.29, "total_tokens": 4751904} |
| {"current_steps": 20, "total_steps": 234, "loss": 0.3559, "lr": 9.820833372667812e-07, "epoch": 0.08533333333333333, "percentage": 8.55, "elapsed_time": "0:14:19", "remaining_time": "2:33:11", "throughput": 7483.88, "total_tokens": 6428832} |
| {"current_steps": 25, "total_steps": 234, "loss": 0.3606, "lr": 9.720998123301922e-07, "epoch": 0.10666666666666667, "percentage": 10.68, "elapsed_time": "0:17:57", "remaining_time": "2:30:06", "throughput": 7443.18, "total_tokens": 8018560} |
| {"current_steps": 30, "total_steps": 234, "loss": 0.3444, "lr": 9.599897218294121e-07, "epoch": 0.128, "percentage": 12.82, "elapsed_time": "0:21:22", "remaining_time": "2:25:18", "throughput": 7476.4, "total_tokens": 9586176} |
| {"current_steps": 35, "total_steps": 234, "loss": 0.3477, "lr": 9.458076154608515e-07, "epoch": 0.14933333333333335, "percentage": 14.96, "elapsed_time": "0:24:53", "remaining_time": "2:21:30", "throughput": 7479.65, "total_tokens": 11169056} |
| {"current_steps": 40, "total_steps": 234, "loss": 0.3555, "lr": 9.296173762811084e-07, "epoch": 0.17066666666666666, "percentage": 17.09, "elapsed_time": "0:28:27", "remaining_time": "2:18:02", "throughput": 7482.41, "total_tokens": 12777728} |
| {"current_steps": 45, "total_steps": 234, "loss": 0.348, "lr": 9.114919329468282e-07, "epoch": 0.192, "percentage": 19.23, "elapsed_time": "0:31:54", "remaining_time": "2:14:00", "throughput": 7482.66, "total_tokens": 14324480} |
| {"current_steps": 50, "total_steps": 234, "loss": 0.336, "lr": 8.915129312088112e-07, "epoch": 0.21333333333333335, "percentage": 21.37, "elapsed_time": "0:35:33", "remaining_time": "2:10:53", "throughput": 7476.17, "total_tokens": 15953952} |
| {"current_steps": 55, "total_steps": 234, "loss": 0.3461, "lr": 8.697703661401185e-07, "epoch": 0.23466666666666666, "percentage": 23.5, "elapsed_time": "0:39:21", "remaining_time": "2:08:05", "throughput": 7447.42, "total_tokens": 17587840} |
| {"current_steps": 60, "total_steps": 234, "loss": 0.344, "lr": 8.463621767547997e-07, "epoch": 0.256, "percentage": 25.64, "elapsed_time": "0:42:32", "remaining_time": "2:03:23", "throughput": 7500.43, "total_tokens": 19148064} |
| {"current_steps": 65, "total_steps": 234, "loss": 0.3407, "lr": 8.213938048432696e-07, "epoch": 0.2773333333333333, "percentage": 27.78, "elapsed_time": "0:45:55", "remaining_time": "1:59:24", "throughput": 7516.95, "total_tokens": 20713472} |
| {"current_steps": 70, "total_steps": 234, "loss": 0.3473, "lr": 7.949777200115614e-07, "epoch": 0.2986666666666667, "percentage": 29.91, "elapsed_time": "0:49:18", "remaining_time": "1:55:30", "throughput": 7544.2, "total_tokens": 22317856} |
| {"current_steps": 75, "total_steps": 234, "loss": 0.3491, "lr": 7.672329130639005e-07, "epoch": 0.32, "percentage": 32.05, "elapsed_time": "0:52:33", "remaining_time": "1:51:25", "throughput": 7569.38, "total_tokens": 23871520} |
| {"current_steps": 80, "total_steps": 234, "loss": 0.3482, "lr": 7.382843600106539e-07, "epoch": 0.3413333333333333, "percentage": 34.19, "elapsed_time": "0:56:04", "remaining_time": "1:47:56", "throughput": 7565.76, "total_tokens": 25455392} |
| {"current_steps": 85, "total_steps": 234, "loss": 0.3476, "lr": 7.0826245911602e-07, "epoch": 0.3626666666666667, "percentage": 36.32, "elapsed_time": "0:59:36", "remaining_time": "1:44:29", "throughput": 7556.23, "total_tokens": 27024576} |
| {"current_steps": 90, "total_steps": 234, "loss": 0.3439, "lr": 6.773024435212677e-07, "epoch": 0.384, "percentage": 38.46, "elapsed_time": "1:02:44", "remaining_time": "1:40:22", "throughput": 7594.62, "total_tokens": 28587680} |
| {"current_steps": 95, "total_steps": 234, "loss": 0.3385, "lr": 6.455437720893564e-07, "epoch": 0.4053333333333333, "percentage": 40.6, "elapsed_time": "1:06:27", "remaining_time": "1:37:14", "throughput": 7571.05, "total_tokens": 30189472} |
| {"current_steps": 100, "total_steps": 234, "loss": 0.3467, "lr": 6.131295012148612e-07, "epoch": 0.4266666666666667, "percentage": 42.74, "elapsed_time": "1:09:53", "remaining_time": "1:33:38", "throughput": 7570.71, "total_tokens": 31745184} |
| {"current_steps": 105, "total_steps": 234, "loss": 0.3412, "lr": 5.802056404288801e-07, "epoch": 0.448, "percentage": 44.87, "elapsed_time": "1:13:09", "remaining_time": "1:29:53", "throughput": 7591.39, "total_tokens": 33324448} |
| {"current_steps": 110, "total_steps": 234, "loss": 0.3407, "lr": 5.469204947015897e-07, "epoch": 0.4693333333333333, "percentage": 47.01, "elapsed_time": "1:16:48", "remaining_time": "1:26:34", "throughput": 7576.44, "total_tokens": 34913472} |
| {"current_steps": 115, "total_steps": 234, "loss": 0.3376, "lr": 5.134239964050307e-07, "epoch": 0.49066666666666664, "percentage": 49.15, "elapsed_time": "1:20:09", "remaining_time": "1:22:57", "throughput": 7587.81, "total_tokens": 36496928} |
| {"current_steps": 120, "total_steps": 234, "loss": 0.3451, "lr": 4.798670299452926e-07, "epoch": 0.512, "percentage": 51.28, "elapsed_time": "1:23:54", "remaining_time": "1:19:42", "throughput": 7576.52, "total_tokens": 38144288} |
| {"current_steps": 125, "total_steps": 234, "loss": 0.3363, "lr": 4.464007521062761e-07, "epoch": 0.5333333333333333, "percentage": 53.42, "elapsed_time": "1:27:17", "remaining_time": "1:16:06", "throughput": 7587.97, "total_tokens": 39740288} |
| {"current_steps": 130, "total_steps": 234, "loss": 0.3331, "lr": 4.131759111665348e-07, "epoch": 0.5546666666666666, "percentage": 55.56, "elapsed_time": "1:30:48", "remaining_time": "1:12:38", "throughput": 7595.77, "total_tokens": 41385504} |
| {"current_steps": 135, "total_steps": 234, "loss": 0.3435, "lr": 3.8034216785622125e-07, "epoch": 0.576, "percentage": 57.69, "elapsed_time": "1:34:21", "remaining_time": "1:09:11", "throughput": 7595.65, "total_tokens": 43003136} |
| {"current_steps": 140, "total_steps": 234, "loss": 0.345, "lr": 3.4804742121287654e-07, "epoch": 0.5973333333333334, "percentage": 59.83, "elapsed_time": "1:37:51", "remaining_time": "1:05:42", "throughput": 7589.72, "total_tokens": 44564448} |
| {"current_steps": 145, "total_steps": 234, "loss": 0.3477, "lr": 3.164371423727362e-07, "epoch": 0.6186666666666667, "percentage": 61.97, "elapsed_time": "1:41:14", "remaining_time": "1:02:08", "throughput": 7596.32, "total_tokens": 46143616} |
| {"current_steps": 150, "total_steps": 234, "loss": 0.3455, "lr": 2.856537192984728e-07, "epoch": 0.64, "percentage": 64.1, "elapsed_time": "1:44:31", "remaining_time": "0:58:31", "throughput": 7606.25, "total_tokens": 47701504} |
| {"current_steps": 155, "total_steps": 234, "loss": 0.3364, "lr": 2.5583581539504463e-07, "epoch": 0.6613333333333333, "percentage": 66.24, "elapsed_time": "1:47:56", "remaining_time": "0:55:00", "throughput": 7609.57, "total_tokens": 49280704} |
| {"current_steps": 160, "total_steps": 234, "loss": 0.3418, "lr": 2.2711774490274766e-07, "epoch": 0.6826666666666666, "percentage": 68.38, "elapsed_time": "1:51:20", "remaining_time": "0:51:29", "throughput": 7611.85, "total_tokens": 50851808} |
| {"current_steps": 165, "total_steps": 234, "loss": 0.3399, "lr": 1.9962886788101047e-07, "epoch": 0.704, "percentage": 70.51, "elapsed_time": "1:54:55", "remaining_time": "0:48:03", "throughput": 7602.89, "total_tokens": 52422848} |
| {"current_steps": 170, "total_steps": 234, "loss": 0.3449, "lr": 1.7349300750820757e-07, "epoch": 0.7253333333333334, "percentage": 72.65, "elapsed_time": "1:58:39", "remaining_time": "0:44:40", "throughput": 7591.95, "total_tokens": 54053664} |
| {"current_steps": 175, "total_steps": 234, "loss": 0.3356, "lr": 1.4882789232226122e-07, "epoch": 0.7466666666666667, "percentage": 74.79, "elapsed_time": "2:02:08", "remaining_time": "0:41:10", "throughput": 7593.91, "total_tokens": 55653888} |
| {"current_steps": 180, "total_steps": 234, "loss": 0.347, "lr": 1.257446259144494e-07, "epoch": 0.768, "percentage": 76.92, "elapsed_time": "2:05:29", "remaining_time": "0:37:38", "throughput": 7595.31, "total_tokens": 57190560} |
| {"current_steps": 185, "total_steps": 234, "loss": 0.3377, "lr": 1.0434718646516916e-07, "epoch": 0.7893333333333333, "percentage": 79.06, "elapsed_time": "2:08:59", "remaining_time": "0:34:10", "throughput": 7592.97, "total_tokens": 58769344} |
| {"current_steps": 190, "total_steps": 234, "loss": 0.3469, "lr": 8.473195837599417e-08, "epoch": 0.8106666666666666, "percentage": 81.2, "elapsed_time": "2:12:42", "remaining_time": "0:30:43", "throughput": 7580.57, "total_tokens": 60359232} |
| {"current_steps": 195, "total_steps": 234, "loss": 0.3466, "lr": 6.698729810778064e-08, "epoch": 0.832, "percentage": 83.33, "elapsed_time": "2:16:07", "remaining_time": "0:27:13", "throughput": 7577.04, "total_tokens": 61888640} |
| {"current_steps": 200, "total_steps": 234, "loss": 0.3514, "lr": 5.119313618049309e-08, "epoch": 0.8533333333333334, "percentage": 85.47, "elapsed_time": "2:19:33", "remaining_time": "0:23:43", "throughput": 7578.94, "total_tokens": 63459232} |
| {"current_steps": 205, "total_steps": 234, "loss": 0.3382, "lr": 3.742061712753824e-08, "epoch": 0.8746666666666667, "percentage": 87.61, "elapsed_time": "2:23:13", "remaining_time": "0:20:15", "throughput": 7573.91, "total_tokens": 65087360} |
| {"current_steps": 210, "total_steps": 234, "loss": 0.3379, "lr": 2.5731779026427257e-08, "epoch": 0.896, "percentage": 89.74, "elapsed_time": "2:27:10", "remaining_time": "0:16:49", "throughput": 7554.35, "total_tokens": 66706016} |
| {"current_steps": 215, "total_steps": 234, "loss": 0.3463, "lr": 1.6179274049310966e-08, "epoch": 0.9173333333333333, "percentage": 91.88, "elapsed_time": "2:31:02", "remaining_time": "0:13:20", "throughput": 7543.33, "total_tokens": 68361792} |
| {"current_steps": 220, "total_steps": 234, "loss": 0.3436, "lr": 8.806131292167617e-09, "epoch": 0.9386666666666666, "percentage": 94.02, "elapsed_time": "2:34:21", "remaining_time": "0:09:49", "throughput": 7550.84, "total_tokens": 69930880} |
| {"current_steps": 225, "total_steps": 234, "loss": 0.3406, "lr": 3.6455629509730135e-09, "epoch": 0.96, "percentage": 96.15, "elapsed_time": "2:37:47", "remaining_time": "0:06:18", "throughput": 7555.84, "total_tokens": 71534880} |
| {"current_steps": 230, "total_steps": 234, "loss": 0.3431, "lr": 7.208147179291191e-10, "epoch": 0.9813333333333333, "percentage": 98.29, "elapsed_time": "2:40:56", "remaining_time": "0:02:47", "throughput": 7568.22, "total_tokens": 73081376} |
| {"current_steps": 234, "total_steps": 234, "epoch": 0.9984, "percentage": 100.0, "elapsed_time": "2:44:01", "remaining_time": "0:00:00", "throughput": 7555.04, "total_tokens": 74351744} |
|
|