| {"current_steps": 5, "total_steps": 213, "loss": 0.7566, "lr": 4.99565044765711e-05, "epoch": 0.06956521739130435, "percentage": 2.35, "elapsed_time": "0:02:03", "remaining_time": "1:25:41", "throughput": 1115.81, "total_tokens": 137920} |
| {"current_steps": 10, "total_steps": 213, "loss": 0.6594, "lr": 4.978006327248537e-05, "epoch": 0.1391304347826087, "percentage": 4.69, "elapsed_time": "0:04:01", "remaining_time": "1:21:43", "throughput": 1125.42, "total_tokens": 271824} |
| {"current_steps": 15, "total_steps": 213, "loss": 0.6611, "lr": 4.946891632198452e-05, "epoch": 0.20869565217391303, "percentage": 7.04, "elapsed_time": "0:06:07", "remaining_time": "1:20:45", "throughput": 1120.29, "total_tokens": 411200} |
| {"current_steps": 20, "total_steps": 213, "loss": 0.6368, "lr": 4.9024755036496795e-05, "epoch": 0.2782608695652174, "percentage": 9.39, "elapsed_time": "0:08:04", "remaining_time": "1:17:58", "throughput": 1123.75, "total_tokens": 544816} |
| {"current_steps": 25, "total_steps": 213, "loss": 0.6475, "lr": 4.8449993900474187e-05, "epoch": 0.34782608695652173, "percentage": 11.74, "elapsed_time": "0:10:08", "remaining_time": "1:16:12", "throughput": 1122.51, "total_tokens": 682528} |
| {"current_steps": 30, "total_steps": 213, "loss": 0.6333, "lr": 4.774775734612604e-05, "epoch": 0.41739130434782606, "percentage": 14.08, "elapsed_time": "0:12:03", "remaining_time": "1:13:30", "throughput": 1125.08, "total_tokens": 813456} |
| {"current_steps": 35, "total_steps": 213, "loss": 0.581, "lr": 4.6921862768838855e-05, "epoch": 0.48695652173913045, "percentage": 16.43, "elapsed_time": "0:14:03", "remaining_time": "1:11:29", "throughput": 1125.3, "total_tokens": 949040} |
| {"current_steps": 40, "total_steps": 213, "loss": 0.5915, "lr": 4.597679977561122e-05, "epoch": 0.5565217391304348, "percentage": 18.78, "elapsed_time": "0:16:05", "remaining_time": "1:09:36", "throughput": 1124.72, "total_tokens": 1085984} |
| {"current_steps": 45, "total_steps": 213, "loss": 0.5869, "lr": 4.491770577931057e-05, "epoch": 0.6260869565217392, "percentage": 21.13, "elapsed_time": "0:18:02", "remaining_time": "1:07:19", "throughput": 1125.24, "total_tokens": 1217520} |
| {"current_steps": 50, "total_steps": 213, "loss": 0.5684, "lr": 4.375033807142267e-05, "epoch": 0.6956521739130435, "percentage": 23.47, "elapsed_time": "0:20:03", "remaining_time": "1:05:22", "throughput": 1125.33, "total_tokens": 1353968} |
| {"current_steps": 55, "total_steps": 213, "loss": 0.5967, "lr": 4.2481042525107854e-05, "epoch": 0.7652173913043478, "percentage": 25.82, "elapsed_time": "0:22:06", "remaining_time": "1:03:29", "throughput": 1124.91, "total_tokens": 1491728} |
| {"current_steps": 60, "total_steps": 213, "loss": 0.5831, "lr": 4.111671909869582e-05, "epoch": 0.8347826086956521, "percentage": 28.17, "elapsed_time": "0:24:04", "remaining_time": "1:01:22", "throughput": 1125.32, "total_tokens": 1625184} |
| {"current_steps": 65, "total_steps": 213, "loss": 0.5782, "lr": 3.9664784327143955e-05, "epoch": 0.9043478260869565, "percentage": 30.52, "elapsed_time": "0:26:02", "remaining_time": "0:59:16", "throughput": 1125.63, "total_tokens": 1758384} |
| {"current_steps": 70, "total_steps": 213, "loss": 0.5842, "lr": 3.813313100535747e-05, "epoch": 0.9739130434782609, "percentage": 32.86, "elapsed_time": "0:28:02", "remaining_time": "0:57:16", "throughput": 1125.33, "total_tokens": 1893088} |
| {"current_steps": 75, "total_steps": 213, "loss": 0.5629, "lr": 3.653008528253509e-05, "epoch": 1.0556521739130436, "percentage": 35.21, "elapsed_time": "0:30:22", "remaining_time": "0:55:53", "throughput": 1125.29, "total_tokens": 2051200} |
| {"current_steps": 80, "total_steps": 213, "loss": 0.5549, "lr": 3.486436140077764e-05, "epoch": 1.1252173913043477, "percentage": 37.56, "elapsed_time": "0:32:19", "remaining_time": "0:53:44", "throughput": 1125.75, "total_tokens": 2183136} |
| {"current_steps": 85, "total_steps": 213, "loss": 0.5263, "lr": 3.3145014324002944e-05, "epoch": 1.1947826086956521, "percentage": 39.91, "elapsed_time": "0:34:17", "remaining_time": "0:51:39", "throughput": 1126.17, "total_tokens": 2317616} |
| {"current_steps": 90, "total_steps": 213, "loss": 0.505, "lr": 3.1381390514678696e-05, "epoch": 1.2643478260869565, "percentage": 42.25, "elapsed_time": "0:36:23", "remaining_time": "0:49:43", "throughput": 1125.57, "total_tokens": 2457440} |
| {"current_steps": 95, "total_steps": 213, "loss": 0.555, "lr": 2.9583077125953716e-05, "epoch": 1.333913043478261, "percentage": 44.6, "elapsed_time": "0:38:22", "remaining_time": "0:47:40", "throughput": 1125.71, "total_tokens": 2592320} |
| {"current_steps": 100, "total_steps": 213, "loss": 0.5266, "lr": 2.775984988538175e-05, "epoch": 1.4034782608695653, "percentage": 46.95, "elapsed_time": "0:40:25", "remaining_time": "0:45:41", "throughput": 1125.37, "total_tokens": 2729856} |
| {"current_steps": 105, "total_steps": 213, "loss": 0.5364, "lr": 2.592161995354479e-05, "epoch": 1.4730434782608697, "percentage": 49.3, "elapsed_time": "0:42:27", "remaining_time": "0:43:40", "throughput": 1125.22, "total_tokens": 2866464} |
| {"current_steps": 110, "total_steps": 213, "loss": 0.5215, "lr": 2.4078380046455222e-05, "epoch": 1.542608695652174, "percentage": 51.64, "elapsed_time": "0:44:28", "remaining_time": "0:41:38", "throughput": 1125.44, "total_tokens": 3003392} |
| {"current_steps": 115, "total_steps": 213, "loss": 0.5354, "lr": 2.224015011461826e-05, "epoch": 1.6121739130434782, "percentage": 53.99, "elapsed_time": "0:46:32", "remaining_time": "0:39:39", "throughput": 1125.14, "total_tokens": 3141984} |
| {"current_steps": 120, "total_steps": 213, "loss": 0.5098, "lr": 2.0416922874046293e-05, "epoch": 1.6817391304347826, "percentage": 56.34, "elapsed_time": "0:48:37", "remaining_time": "0:37:40", "throughput": 1124.77, "total_tokens": 3281264} |
| {"current_steps": 125, "total_steps": 213, "loss": 0.4939, "lr": 1.8618609485321313e-05, "epoch": 1.7513043478260868, "percentage": 58.69, "elapsed_time": "0:50:38", "remaining_time": "0:35:39", "throughput": 1124.82, "total_tokens": 3418208} |
| {"current_steps": 130, "total_steps": 213, "loss": 0.4919, "lr": 1.6854985675997066e-05, "epoch": 1.8208695652173912, "percentage": 61.03, "elapsed_time": "0:52:37", "remaining_time": "0:33:35", "throughput": 1125.15, "total_tokens": 3552624} |
| {"current_steps": 135, "total_steps": 213, "loss": 0.5245, "lr": 1.5135638599222368e-05, "epoch": 1.8904347826086956, "percentage": 63.38, "elapsed_time": "0:54:35", "remaining_time": "0:31:32", "throughput": 1125.58, "total_tokens": 3686752} |
| {"current_steps": 140, "total_steps": 213, "loss": 0.5566, "lr": 1.3469914717464916e-05, "epoch": 1.96, "percentage": 65.73, "elapsed_time": "0:56:20", "remaining_time": "0:29:22", "throughput": 1126.7, "total_tokens": 3809216} |
| {"current_steps": 145, "total_steps": 213, "loss": 0.5672, "lr": 1.1866868994642535e-05, "epoch": 2.0417391304347827, "percentage": 68.08, "elapsed_time": "0:58:47", "remaining_time": "0:27:34", "throughput": 1125.84, "total_tokens": 3971664} |
| {"current_steps": 150, "total_steps": 213, "loss": 0.5116, "lr": 1.0335215672856046e-05, "epoch": 2.111304347826087, "percentage": 70.42, "elapsed_time": "1:00:50", "remaining_time": "0:25:33", "throughput": 1125.56, "total_tokens": 4108736} |
| {"current_steps": 155, "total_steps": 213, "loss": 0.4855, "lr": 8.883280901304187e-06, "epoch": 2.1808695652173915, "percentage": 72.77, "elapsed_time": "1:02:53", "remaining_time": "0:23:32", "throughput": 1125.32, "total_tokens": 4246544} |
| {"current_steps": 160, "total_steps": 213, "loss": 0.4634, "lr": 7.518957474892149e-06, "epoch": 2.2504347826086954, "percentage": 75.12, "elapsed_time": "1:04:58", "remaining_time": "0:21:31", "throughput": 1124.94, "total_tokens": 4385600} |
| {"current_steps": 165, "total_steps": 213, "loss": 0.4784, "lr": 6.2496619285773356e-06, "epoch": 2.32, "percentage": 77.46, "elapsed_time": "1:06:52", "remaining_time": "0:19:27", "throughput": 1125.42, "total_tokens": 4515424} |
| {"current_steps": 170, "total_steps": 213, "loss": 0.4562, "lr": 5.082294220689435e-06, "epoch": 2.3895652173913042, "percentage": 79.81, "elapsed_time": "1:08:58", "remaining_time": "0:17:26", "throughput": 1125.14, "total_tokens": 4656832} |
| {"current_steps": 175, "total_steps": 213, "loss": 0.4635, "lr": 4.023200224388787e-06, "epoch": 2.4591304347826086, "percentage": 82.16, "elapsed_time": "1:10:53", "remaining_time": "0:15:23", "throughput": 1125.44, "total_tokens": 4787584} |
| {"current_steps": 180, "total_steps": 213, "loss": 0.5231, "lr": 3.078137231161146e-06, "epoch": 2.528695652173913, "percentage": 84.51, "elapsed_time": "1:12:51", "remaining_time": "0:13:21", "throughput": 1125.53, "total_tokens": 4920640} |
| {"current_steps": 185, "total_steps": 213, "loss": 0.4908, "lr": 2.2522426538739566e-06, "epoch": 2.5982608695652174, "percentage": 86.85, "elapsed_time": "1:14:58", "remaining_time": "0:11:20", "throughput": 1125.1, "total_tokens": 5061360} |
| {"current_steps": 190, "total_steps": 213, "loss": 0.5252, "lr": 1.5500060995258137e-06, "epoch": 2.667826086956522, "percentage": 89.2, "elapsed_time": "1:17:35", "remaining_time": "0:09:23", "throughput": 1115.2, "total_tokens": 5192048} |
| {"current_steps": 195, "total_steps": 213, "loss": 0.4728, "lr": 9.75244963503205e-07, "epoch": 2.737391304347826, "percentage": 91.55, "elapsed_time": "1:19:23", "remaining_time": "0:07:19", "throughput": 1116.36, "total_tokens": 5317552} |
| {"current_steps": 200, "total_steps": 213, "loss": 0.4781, "lr": 5.310836780154899e-07, "epoch": 2.8069565217391306, "percentage": 93.9, "elapsed_time": "1:21:27", "remaining_time": "0:05:17", "throughput": 1116.39, "total_tokens": 5456864} |
| {"current_steps": 205, "total_steps": 213, "loss": 0.5074, "lr": 2.1993672751463579e-07, "epoch": 2.8765217391304345, "percentage": 96.24, "elapsed_time": "1:23:37", "remaining_time": "0:03:15", "throughput": 1114.52, "total_tokens": 5592320} |
| {"current_steps": 210, "total_steps": 213, "loss": 0.454, "lr": 4.3495523428899174e-08, "epoch": 2.9460869565217394, "percentage": 98.59, "elapsed_time": "1:26:15", "remaining_time": "0:01:13", "throughput": 1106.84, "total_tokens": 5728832} |
| {"current_steps": 213, "total_steps": 213, "epoch": 2.9878260869565216, "percentage": 100.0, "elapsed_time": "1:27:30", "remaining_time": "0:00:00", "throughput": 1107.07, "total_tokens": 5812176} |
|
|