| {"current_steps": 100, "total_steps": 12480, "loss": 1.3897, "learning_rate": 4.006410256410257e-07, "epoch": 0.08009611533840609, "percentage": 0.8, "elapsed_time": "0:04:43", "remaining_time": "9:44:30", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 200, "total_steps": 12480, "loss": 0.0598, "learning_rate": 8.012820512820515e-07, "epoch": 0.16019223067681218, "percentage": 1.6, "elapsed_time": "0:09:16", "remaining_time": "9:29:27", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 300, "total_steps": 12480, "loss": 0.0551, "learning_rate": 1.201923076923077e-06, "epoch": 0.24028834601521826, "percentage": 2.4, "elapsed_time": "0:13:50", "remaining_time": "9:21:51", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 400, "total_steps": 12480, "loss": 0.0517, "learning_rate": 1.602564102564103e-06, "epoch": 0.32038446135362436, "percentage": 3.21, "elapsed_time": "0:18:23", "remaining_time": "9:15:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 500, "total_steps": 12480, "loss": 0.0501, "learning_rate": 2.0032051282051286e-06, "epoch": 0.4004805766920304, "percentage": 4.01, "elapsed_time": "0:22:56", "remaining_time": "9:09:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 600, "total_steps": 12480, "loss": 0.0485, "learning_rate": 2.403846153846154e-06, "epoch": 0.4805766920304365, "percentage": 4.81, "elapsed_time": "0:27:29", "remaining_time": "9:04:23", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 700, "total_steps": 12480, "loss": 0.0463, "learning_rate": 2.8044871794871797e-06, "epoch": 0.5606728073688426, "percentage": 5.61, "elapsed_time": "0:32:02", "remaining_time": "8:59:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 800, "total_steps": 12480, "loss": 0.0443, "learning_rate": 3.205128205128206e-06, "epoch": 0.6407689227072487, "percentage": 6.41, "elapsed_time": "0:36:34", "remaining_time": "8:54:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 900, "total_steps": 12480, "loss": 0.0437, "learning_rate": 3.605769230769231e-06, "epoch": 0.7208650380456548, "percentage": 7.21, "elapsed_time": "0:41:07", "remaining_time": "8:49:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1000, "total_steps": 12480, "loss": 0.042, "learning_rate": 4.006410256410257e-06, "epoch": 0.8009611533840608, "percentage": 8.01, "elapsed_time": "0:45:40", "remaining_time": "8:44:23", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1000, "total_steps": 12480, "eval_loss": 0.041240859776735306, "epoch": 0.8009611533840608, "percentage": 8.01, "elapsed_time": "0:47:18", "remaining_time": "9:03:06", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1100, "total_steps": 12480, "loss": 0.0411, "learning_rate": 4.4070512820512826e-06, "epoch": 0.8810572687224669, "percentage": 8.81, "elapsed_time": "0:52:30", "remaining_time": "9:03:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1200, "total_steps": 12480, "loss": 0.0399, "learning_rate": 4.807692307692308e-06, "epoch": 0.961153384060873, "percentage": 9.62, "elapsed_time": "0:57:03", "remaining_time": "8:56:21", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1300, "total_steps": 12480, "loss": 0.0379, "learning_rate": 4.999735579817769e-06, "epoch": 1.0412494993992791, "percentage": 10.42, "elapsed_time": "1:01:37", "remaining_time": "8:49:54", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1400, "total_steps": 12480, "loss": 0.0366, "learning_rate": 4.997740994288484e-06, "epoch": 1.1213456147376852, "percentage": 11.22, "elapsed_time": "1:06:10", "remaining_time": "8:43:47", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1500, "total_steps": 12480, "loss": 0.0359, "learning_rate": 4.993792498360407e-06, "epoch": 1.2014417300760913, "percentage": 12.02, "elapsed_time": "1:10:44", "remaining_time": "8:37:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1600, "total_steps": 12480, "loss": 0.0347, "learning_rate": 4.9878931808274796e-06, "epoch": 1.2815378454144974, "percentage": 12.82, "elapsed_time": "1:15:17", "remaining_time": "8:31:59", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1700, "total_steps": 12480, "loss": 0.0344, "learning_rate": 4.980047656554856e-06, "epoch": 1.3616339607529035, "percentage": 13.62, "elapsed_time": "1:19:51", "remaining_time": "8:26:23", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1800, "total_steps": 12480, "loss": 0.0341, "learning_rate": 4.970262062868821e-06, "epoch": 1.4417300760913097, "percentage": 14.42, "elapsed_time": "1:24:24", "remaining_time": "8:20:48", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1900, "total_steps": 12480, "loss": 0.0331, "learning_rate": 4.958544054755741e-06, "epoch": 1.5218261914297155, "percentage": 15.22, "elapsed_time": "1:28:56", "remaining_time": "8:15:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2000, "total_steps": 12480, "loss": 0.0324, "learning_rate": 4.944902798873794e-06, "epoch": 1.6019223067681216, "percentage": 16.03, "elapsed_time": "1:33:29", "remaining_time": "8:09:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2000, "total_steps": 12480, "eval_loss": 0.03307706490159035, "epoch": 1.6019223067681216, "percentage": 16.03, "elapsed_time": "1:35:07", "remaining_time": "8:18:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2100, "total_steps": 12480, "loss": 0.0318, "learning_rate": 4.92934896638215e-06, "epoch": 1.6820184221065277, "percentage": 16.83, "elapsed_time": "1:44:56", "remaining_time": "8:38:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2200, "total_steps": 12480, "loss": 0.0307, "learning_rate": 4.91189472459324e-06, "epoch": 1.7621145374449338, "percentage": 17.63, "elapsed_time": "1:49:30", "remaining_time": "8:31:40", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2300, "total_steps": 12480, "loss": 0.0309, "learning_rate": 4.892553727454616e-06, "epoch": 1.84221065278334, "percentage": 18.43, "elapsed_time": "1:54:03", "remaining_time": "8:24:49", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2400, "total_steps": 12480, "loss": 0.0301, "learning_rate": 4.8713411048678635e-06, "epoch": 1.922306768121746, "percentage": 19.23, "elapsed_time": "1:58:36", "remaining_time": "8:18:09", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2500, "total_steps": 12480, "loss": 0.0297, "learning_rate": 4.848273450852921e-06, "epoch": 2.002402883460152, "percentage": 20.03, "elapsed_time": "2:03:09", "remaining_time": "8:11:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2600, "total_steps": 12480, "loss": 0.0259, "learning_rate": 4.823368810567056e-06, "epoch": 2.0824989987985583, "percentage": 20.83, "elapsed_time": "2:07:42", "remaining_time": "8:05:18", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2700, "total_steps": 12480, "loss": 0.0259, "learning_rate": 4.796646666188663e-06, "epoch": 2.1625951141369644, "percentage": 21.63, "elapsed_time": "2:12:15", "remaining_time": "7:59:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2800, "total_steps": 12480, "loss": 0.0262, "learning_rate": 4.768127921676916e-06, "epoch": 2.2426912294753705, "percentage": 22.44, "elapsed_time": "2:16:47", "remaining_time": "7:52:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2900, "total_steps": 12480, "loss": 0.0264, "learning_rate": 4.737834886419217e-06, "epoch": 2.3227873448137766, "percentage": 23.24, "elapsed_time": "2:21:20", "remaining_time": "7:46:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3000, "total_steps": 12480, "loss": 0.0262, "learning_rate": 4.705791257779196e-06, "epoch": 2.4028834601521827, "percentage": 24.04, "elapsed_time": "2:25:52", "remaining_time": "7:40:57", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3000, "total_steps": 12480, "eval_loss": 0.028629949316382408, "epoch": 2.4028834601521827, "percentage": 24.04, "elapsed_time": "2:27:29", "remaining_time": "7:46:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3100, "total_steps": 12480, "loss": 0.0257, "learning_rate": 4.672022102558958e-06, "epoch": 2.482979575490589, "percentage": 24.84, "elapsed_time": "2:37:39", "remaining_time": "7:57:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3200, "total_steps": 12480, "loss": 0.0259, "learning_rate": 4.636553837390051e-06, "epoch": 2.563075690828995, "percentage": 25.64, "elapsed_time": "2:42:12", "remaining_time": "7:50:25", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3300, "total_steps": 12480, "loss": 0.025, "learning_rate": 4.5994142080684956e-06, "epoch": 2.643171806167401, "percentage": 26.44, "elapsed_time": "2:46:45", "remaining_time": "7:43:54", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3400, "total_steps": 12480, "loss": 0.0251, "learning_rate": 4.560632267850054e-06, "epoch": 2.723267921505807, "percentage": 27.24, "elapsed_time": "2:51:19", "remaining_time": "7:37:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3500, "total_steps": 12480, "loss": 0.0249, "learning_rate": 4.5202383547227134e-06, "epoch": 2.803364036844213, "percentage": 28.04, "elapsed_time": "2:55:51", "remaining_time": "7:31:13", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3600, "total_steps": 12480, "loss": 0.0248, "learning_rate": 4.478264067674155e-06, "epoch": 2.8834601521826193, "percentage": 28.85, "elapsed_time": "3:00:25", "remaining_time": "7:25:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3700, "total_steps": 12480, "loss": 0.0248, "learning_rate": 4.43474224197278e-06, "epoch": 2.9635562675210254, "percentage": 29.65, "elapsed_time": "3:04:58", "remaining_time": "7:18:56", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3800, "total_steps": 12480, "loss": 0.0212, "learning_rate": 4.389706923481633e-06, "epoch": 3.0436523828594315, "percentage": 30.45, "elapsed_time": "3:09:31", "remaining_time": "7:12:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3900, "total_steps": 12480, "loss": 0.0188, "learning_rate": 4.34319334202531e-06, "epoch": 3.1237484981978376, "percentage": 31.25, "elapsed_time": "3:14:04", "remaining_time": "7:06:57", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4000, "total_steps": 12480, "loss": 0.0192, "learning_rate": 4.2952378838306855e-06, "epoch": 3.2038446135362433, "percentage": 32.05, "elapsed_time": "3:18:36", "remaining_time": "7:01:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4000, "total_steps": 12480, "eval_loss": 0.02867858298122883, "epoch": 3.2038446135362433, "percentage": 32.05, "elapsed_time": "3:20:14", "remaining_time": "7:04:30", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4100, "total_steps": 12480, "loss": 0.0192, "learning_rate": 4.245878063063022e-06, "epoch": 3.28394072887465, "percentage": 32.85, "elapsed_time": "3:33:13", "remaining_time": "7:15:48", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4200, "total_steps": 12480, "loss": 0.0193, "learning_rate": 4.195152492479727e-06, "epoch": 3.3640368442130555, "percentage": 33.65, "elapsed_time": "3:37:45", "remaining_time": "7:09:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4300, "total_steps": 12480, "loss": 0.0192, "learning_rate": 4.143100853224714e-06, "epoch": 3.4441329595514616, "percentage": 34.46, "elapsed_time": "3:42:17", "remaining_time": "7:02:52", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4400, "total_steps": 12480, "loss": 0.019, "learning_rate": 4.089763863786988e-06, "epoch": 3.5242290748898677, "percentage": 35.26, "elapsed_time": "3:46:50", "remaining_time": "6:56:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4500, "total_steps": 12480, "loss": 0.0189, "learning_rate": 4.035183248147752e-06, "epoch": 3.604325190228274, "percentage": 36.06, "elapsed_time": "3:51:23", "remaining_time": "6:50:19", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4600, "total_steps": 12480, "loss": 0.0185, "learning_rate": 3.979401703140955e-06, "epoch": 3.68442130556668, "percentage": 36.86, "elapsed_time": "3:55:55", "remaining_time": "6:44:09", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4700, "total_steps": 12480, "loss": 0.0191, "learning_rate": 3.922462865052782e-06, "epoch": 3.764517420905086, "percentage": 37.66, "elapsed_time": "4:00:29", "remaining_time": "6:38:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4800, "total_steps": 12480, "loss": 0.0187, "learning_rate": 3.8644112754862614e-06, "epoch": 3.844613536243492, "percentage": 38.46, "elapsed_time": "4:05:01", "remaining_time": "6:32:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4900, "total_steps": 12480, "loss": 0.0184, "learning_rate": 3.805292346517659e-06, "epoch": 3.924709651581898, "percentage": 39.26, "elapsed_time": "4:09:34", "remaining_time": "6:26:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 5000, "total_steps": 12480, "loss": 0.0178, "learning_rate": 3.745152325171921e-06, "epoch": 4.004805766920304, "percentage": 40.06, "elapsed_time": "4:14:06", "remaining_time": "6:20:09", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 5000, "total_steps": 12480, "eval_loss": 0.031728021800518036, "epoch": 4.004805766920304, "percentage": 40.06, "elapsed_time": "4:15:44", "remaining_time": "6:22:35", "throughput": "0.00", "total_tokens": 0} | |