| {"current_steps": 5, "total_steps": 5650, "loss": 0.7007, "accuracy": 0.30000001192092896, "lr": 2.0000000000000003e-06, "epoch": 0.001769363471491131, "percentage": 0.09, "elapsed_time": "0:05:41", "remaining_time": "4 days, 11:01:16", "throughput": 1209.7, "total_tokens": 412816} |
| {"current_steps": 10, "total_steps": 5650, "loss": 0.7069, "accuracy": 0.45000001788139343, "lr": 4.5e-06, "epoch": 0.003538726942982262, "percentage": 0.18, "elapsed_time": "0:11:57", "remaining_time": "4 days, 16:25:18", "throughput": 1209.05, "total_tokens": 867600} |
| {"current_steps": 15, "total_steps": 5650, "loss": 0.7222, "accuracy": 0.30000001192092896, "lr": 7.000000000000001e-06, "epoch": 0.005308090414473393, "percentage": 0.27, "elapsed_time": "0:17:53", "remaining_time": "4 days, 15:59:56", "throughput": 1210.86, "total_tokens": 1299600} |
| {"current_steps": 20, "total_steps": 5650, "loss": 0.6994, "accuracy": 0.5250000357627869, "lr": 9.5e-06, "epoch": 0.007077453885964524, "percentage": 0.35, "elapsed_time": "0:23:28", "remaining_time": "4 days, 14:07:51", "throughput": 1215.4, "total_tokens": 1711792} |
| {"current_steps": 25, "total_steps": 5650, "loss": 0.6976, "accuracy": 0.45000001788139343, "lr": 1.2e-05, "epoch": 0.008846817357455655, "percentage": 0.44, "elapsed_time": "0:29:08", "remaining_time": "4 days, 13:16:27", "throughput": 1216.78, "total_tokens": 2127408} |
| {"current_steps": 30, "total_steps": 5650, "loss": 0.7107, "accuracy": 0.375, "lr": 1.45e-05, "epoch": 0.010616180828946786, "percentage": 0.53, "elapsed_time": "0:35:07", "remaining_time": "4 days, 13:41:24", "throughput": 1213.85, "total_tokens": 2558704} |
| {"current_steps": 35, "total_steps": 5650, "loss": 0.6795, "accuracy": 0.550000011920929, "lr": 1.7000000000000003e-05, "epoch": 0.012385544300437918, "percentage": 0.62, "elapsed_time": "0:41:19", "remaining_time": "4 days, 14:29:12", "throughput": 1212.78, "total_tokens": 3006864} |
| {"current_steps": 40, "total_steps": 5650, "loss": 0.6505, "accuracy": 0.6500000357627869, "lr": 1.9500000000000003e-05, "epoch": 0.014154907771929048, "percentage": 0.71, "elapsed_time": "0:47:05", "remaining_time": "4 days, 14:04:22", "throughput": 1213.94, "total_tokens": 3429856} |
| {"current_steps": 45, "total_steps": 5650, "loss": 0.6165, "accuracy": 0.6500000357627869, "lr": 2.2000000000000003e-05, "epoch": 0.01592427124342018, "percentage": 0.8, "elapsed_time": "0:52:33", "remaining_time": "4 days, 13:05:58", "throughput": 1215.95, "total_tokens": 3834240} |
| {"current_steps": 50, "total_steps": 5650, "loss": 0.7095, "accuracy": 0.6500000357627869, "lr": 2.45e-05, "epoch": 0.01769363471491131, "percentage": 0.88, "elapsed_time": "0:58:19", "remaining_time": "4 days, 12:52:26", "throughput": 1215.07, "total_tokens": 4252160} |
| {"current_steps": 55, "total_steps": 5650, "loss": 0.5922, "accuracy": 0.625, "lr": 2.7000000000000002e-05, "epoch": 0.01946299818640244, "percentage": 0.97, "elapsed_time": "1:03:44", "remaining_time": "4 days, 12:03:49", "throughput": 1216.38, "total_tokens": 4651712} |
| {"current_steps": 60, "total_steps": 5650, "loss": 0.6177, "accuracy": 0.699999988079071, "lr": 2.95e-05, "epoch": 0.02123236165789357, "percentage": 1.06, "elapsed_time": "1:08:45", "remaining_time": "4 days, 10:46:44", "throughput": 1219.08, "total_tokens": 5029920} |
| {"current_steps": 65, "total_steps": 5650, "loss": 0.5734, "accuracy": 0.675000011920929, "lr": 3.2000000000000005e-05, "epoch": 0.023001725129384705, "percentage": 1.15, "elapsed_time": "1:14:16", "remaining_time": "4 days, 10:22:26", "throughput": 1219.61, "total_tokens": 5435632} |
| {"current_steps": 70, "total_steps": 5650, "loss": 0.6006, "accuracy": 0.699999988079071, "lr": 3.45e-05, "epoch": 0.024771088600875835, "percentage": 1.24, "elapsed_time": "1:20:25", "remaining_time": "4 days, 10:50:47", "throughput": 1218.71, "total_tokens": 5880688} |
| {"current_steps": 75, "total_steps": 5650, "loss": 0.5279, "accuracy": 0.699999988079071, "lr": 3.7e-05, "epoch": 0.026540452072366966, "percentage": 1.33, "elapsed_time": "1:26:26", "remaining_time": "4 days, 11:06:00", "throughput": 1218.34, "total_tokens": 6319408} |
| {"current_steps": 80, "total_steps": 5650, "loss": 0.4824, "accuracy": 0.7750000357627869, "lr": 3.9500000000000005e-05, "epoch": 0.028309815543858096, "percentage": 1.42, "elapsed_time": "1:31:59", "remaining_time": "4 days, 10:44:56", "throughput": 1218.55, "total_tokens": 6725776} |
| {"current_steps": 85, "total_steps": 5650, "loss": 0.6604, "accuracy": 0.675000011920929, "lr": 4.2e-05, "epoch": 0.030079179015349226, "percentage": 1.5, "elapsed_time": "1:37:48", "remaining_time": "4 days, 10:43:51", "throughput": 1218.26, "total_tokens": 7149680} |
| {"current_steps": 90, "total_steps": 5650, "loss": 0.5578, "accuracy": 0.75, "lr": 4.4500000000000004e-05, "epoch": 0.03184854248684036, "percentage": 1.59, "elapsed_time": "1:44:06", "remaining_time": "4 days, 11:11:17", "throughput": 1217.54, "total_tokens": 7605024} |
| {"current_steps": 95, "total_steps": 5650, "loss": 0.4137, "accuracy": 0.824999988079071, "lr": 4.7e-05, "epoch": 0.03361790595833149, "percentage": 1.68, "elapsed_time": "1:49:49", "remaining_time": "4 days, 11:02:13", "throughput": 1217.39, "total_tokens": 8022448} |
| {"current_steps": 100, "total_steps": 5650, "loss": 0.5827, "accuracy": 0.7250000238418579, "lr": 4.9500000000000004e-05, "epoch": 0.03538726942982262, "percentage": 1.77, "elapsed_time": "1:56:05", "remaining_time": "4 days, 11:23:32", "throughput": 1216.41, "total_tokens": 8473504} |
| {"current_steps": 105, "total_steps": 5650, "loss": 0.5244, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.037156632901313755, "percentage": 1.86, "elapsed_time": "2:02:15", "remaining_time": "4 days, 11:36:03", "throughput": 1215.94, "total_tokens": 8919072} |
| {"current_steps": 110, "total_steps": 5650, "loss": 0.5994, "accuracy": 0.6500000357627869, "lr": 5e-05, "epoch": 0.03892599637280488, "percentage": 1.95, "elapsed_time": "2:08:06", "remaining_time": "4 days, 11:32:15", "throughput": 1215.9, "total_tokens": 9346368} |
| {"current_steps": 115, "total_steps": 5650, "loss": 0.4091, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.040695359844296015, "percentage": 2.04, "elapsed_time": "2:14:16", "remaining_time": "4 days, 11:42:28", "throughput": 1215.8, "total_tokens": 9794768} |
| {"current_steps": 120, "total_steps": 5650, "loss": 0.5556, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.04246472331578714, "percentage": 2.12, "elapsed_time": "2:20:03", "remaining_time": "4 days, 11:34:18", "throughput": 1216.15, "total_tokens": 10219808} |
| {"current_steps": 125, "total_steps": 5650, "loss": 0.525, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.044234086787278276, "percentage": 2.21, "elapsed_time": "2:25:38", "remaining_time": "4 days, 11:17:35", "throughput": 1216.43, "total_tokens": 10630176} |
| {"current_steps": 130, "total_steps": 5650, "loss": 0.4138, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.04600345025876941, "percentage": 2.3, "elapsed_time": "2:31:05", "remaining_time": "4 days, 10:55:41", "throughput": 1217.03, "total_tokens": 11033168} |
| {"current_steps": 135, "total_steps": 5650, "loss": 0.6679, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.04777281373026054, "percentage": 2.39, "elapsed_time": "2:37:20", "remaining_time": "4 days, 11:07:48", "throughput": 1216.72, "total_tokens": 11486624} |
| {"current_steps": 140, "total_steps": 5650, "loss": 0.5462, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.04954217720175167, "percentage": 2.48, "elapsed_time": "2:43:24", "remaining_time": "4 days, 11:11:00", "throughput": 1216.31, "total_tokens": 11924752} |
| {"current_steps": 145, "total_steps": 5650, "loss": 0.6519, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.0513115406732428, "percentage": 2.57, "elapsed_time": "2:49:10", "remaining_time": "4 days, 11:02:34", "throughput": 1216.51, "total_tokens": 12347664} |
| {"current_steps": 150, "total_steps": 5650, "loss": 0.5751, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.05308090414473393, "percentage": 2.65, "elapsed_time": "2:55:00", "remaining_time": "4 days, 10:56:53", "throughput": 1216.54, "total_tokens": 12774112} |
| {"current_steps": 155, "total_steps": 5650, "loss": 0.4459, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.054850267616225065, "percentage": 2.74, "elapsed_time": "3:01:02", "remaining_time": "4 days, 10:57:56", "throughput": 1216.5, "total_tokens": 13213600} |
| {"current_steps": 160, "total_steps": 5650, "loss": 0.5585, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.05661963108771619, "percentage": 2.83, "elapsed_time": "3:07:09", "remaining_time": "4 days, 11:02:00", "throughput": 1216.5, "total_tokens": 13660992} |
| {"current_steps": 165, "total_steps": 5650, "loss": 0.5305, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.058388994559207326, "percentage": 2.92, "elapsed_time": "3:13:09", "remaining_time": "4 days, 11:01:04", "throughput": 1216.44, "total_tokens": 14098048} |
| {"current_steps": 170, "total_steps": 5650, "loss": 0.5502, "accuracy": 0.6000000238418579, "lr": 5e-05, "epoch": 0.06015835803069845, "percentage": 3.01, "elapsed_time": "3:19:02", "remaining_time": "4 days, 10:56:23", "throughput": 1216.48, "total_tokens": 14528272} |
| {"current_steps": 175, "total_steps": 5650, "loss": 0.3892, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.06192772150218959, "percentage": 3.1, "elapsed_time": "3:24:46", "remaining_time": "4 days, 10:46:22", "throughput": 1216.62, "total_tokens": 14947680} |
| {"current_steps": 180, "total_steps": 5650, "loss": 0.3826, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.06369708497368072, "percentage": 3.19, "elapsed_time": "3:30:32", "remaining_time": "4 days, 10:38:17", "throughput": 1216.68, "total_tokens": 15370144} |
| {"current_steps": 185, "total_steps": 5650, "loss": 0.7038, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.06546644844517185, "percentage": 3.27, "elapsed_time": "3:36:37", "remaining_time": "4 days, 10:39:14", "throughput": 1216.37, "total_tokens": 15809776} |
| {"current_steps": 190, "total_steps": 5650, "loss": 0.7389, "accuracy": 0.574999988079071, "lr": 5e-05, "epoch": 0.06723581191666297, "percentage": 3.36, "elapsed_time": "3:42:52", "remaining_time": "4 days, 10:44:47", "throughput": 1216.08, "total_tokens": 16262160} |
| {"current_steps": 195, "total_steps": 5650, "loss": 0.4602, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.06900517538815411, "percentage": 3.45, "elapsed_time": "3:48:33", "remaining_time": "4 days, 10:33:49", "throughput": 1216.16, "total_tokens": 16677888} |
| {"current_steps": 200, "total_steps": 5650, "loss": 0.5559, "accuracy": 0.625, "lr": 5e-05, "epoch": 0.07077453885964524, "percentage": 3.54, "elapsed_time": "3:54:30", "remaining_time": "4 days, 10:30:31", "throughput": 1216.25, "total_tokens": 17113744} |
| {"current_steps": 205, "total_steps": 5650, "loss": 0.5598, "accuracy": 0.6500000357627869, "lr": 5e-05, "epoch": 0.07254390233113638, "percentage": 3.63, "elapsed_time": "4:00:22", "remaining_time": "4 days, 10:24:33", "throughput": 1216.37, "total_tokens": 17542960} |
| {"current_steps": 210, "total_steps": 5650, "loss": 0.3538, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.07431326580262751, "percentage": 3.72, "elapsed_time": "4:06:17", "remaining_time": "4 days, 10:20:06", "throughput": 1216.32, "total_tokens": 17974176} |
| {"current_steps": 215, "total_steps": 5650, "loss": 0.6008, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.07608262927411863, "percentage": 3.81, "elapsed_time": "4:12:18", "remaining_time": "4 days, 10:18:15", "throughput": 1216.03, "total_tokens": 18409216} |
| {"current_steps": 220, "total_steps": 5650, "loss": 0.4245, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.07785199274560976, "percentage": 3.89, "elapsed_time": "4:18:05", "remaining_time": "4 days, 10:10:06", "throughput": 1216.13, "total_tokens": 18832224} |
| {"current_steps": 225, "total_steps": 5650, "loss": 0.3894, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.0796213562171009, "percentage": 3.98, "elapsed_time": "4:24:07", "remaining_time": "4 days, 10:08:20", "throughput": 1216.03, "total_tokens": 19270960} |
| {"current_steps": 230, "total_steps": 5650, "loss": 0.5075, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.08139071968859203, "percentage": 4.07, "elapsed_time": "4:30:15", "remaining_time": "4 days, 10:08:36", "throughput": 1215.81, "total_tokens": 19714624} |
| {"current_steps": 235, "total_steps": 5650, "loss": 0.5245, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.08316008316008316, "percentage": 4.16, "elapsed_time": "4:36:04", "remaining_time": "4 days, 10:01:35", "throughput": 1215.87, "total_tokens": 20140592} |
| {"current_steps": 240, "total_steps": 5650, "loss": 0.3702, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.08492944663157428, "percentage": 4.25, "elapsed_time": "4:42:10", "remaining_time": "4 days, 10:00:35", "throughput": 1215.79, "total_tokens": 20583600} |
| {"current_steps": 245, "total_steps": 5650, "loss": 0.9015, "accuracy": 0.625, "lr": 5e-05, "epoch": 0.08669881010306542, "percentage": 4.34, "elapsed_time": "4:48:13", "remaining_time": "4 days, 9:58:40", "throughput": 1215.65, "total_tokens": 21023104} |
| {"current_steps": 250, "total_steps": 5650, "loss": 0.4629, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.08846817357455655, "percentage": 4.42, "elapsed_time": "4:54:00", "remaining_time": "4 days, 9:50:24", "throughput": 1215.92, "total_tokens": 21448880} |
| {"current_steps": 255, "total_steps": 5650, "loss": 0.6402, "accuracy": 0.6500000357627869, "lr": 5e-05, "epoch": 0.09023753704604769, "percentage": 4.51, "elapsed_time": "4:59:57", "remaining_time": "4 days, 9:46:18", "throughput": 1215.87, "total_tokens": 21883104} |
| {"current_steps": 260, "total_steps": 5650, "loss": 0.4876, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.09200690051753882, "percentage": 4.6, "elapsed_time": "5:05:55", "remaining_time": "4 days, 9:42:06", "throughput": 1215.83, "total_tokens": 22317296} |
| {"current_steps": 265, "total_steps": 5650, "loss": 0.4873, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.09377626398902994, "percentage": 4.69, "elapsed_time": "5:12:11", "remaining_time": "4 days, 9:43:52", "throughput": 1215.59, "total_tokens": 22769520} |
| {"current_steps": 270, "total_steps": 5650, "loss": 0.5793, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.09554562746052107, "percentage": 4.78, "elapsed_time": "5:17:34", "remaining_time": "4 days, 9:28:05", "throughput": 1215.93, "total_tokens": 23169472} |
| {"current_steps": 275, "total_steps": 5650, "loss": 0.4828, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.09731499093201221, "percentage": 4.87, "elapsed_time": "5:23:27", "remaining_time": "4 days, 9:22:02", "throughput": 1215.92, "total_tokens": 23597584} |
| {"current_steps": 280, "total_steps": 5650, "loss": 0.6516, "accuracy": 0.6500000357627869, "lr": 5e-05, "epoch": 0.09908435440350334, "percentage": 4.96, "elapsed_time": "5:28:50", "remaining_time": "4 days, 9:06:37", "throughput": 1216.15, "total_tokens": 23994848} |
| {"current_steps": 285, "total_steps": 5650, "loss": 0.5529, "accuracy": 0.6500000357627869, "lr": 5e-05, "epoch": 0.10085371787499448, "percentage": 5.04, "elapsed_time": "5:34:26", "remaining_time": "4 days, 8:55:52", "throughput": 1216.43, "total_tokens": 24410112} |
| {"current_steps": 290, "total_steps": 5650, "loss": 0.538, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.1026230813464856, "percentage": 5.13, "elapsed_time": "5:40:30", "remaining_time": "4 days, 8:53:37", "throughput": 1216.29, "total_tokens": 24849760} |
| {"current_steps": 295, "total_steps": 5650, "loss": 0.6213, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.10439244481797673, "percentage": 5.22, "elapsed_time": "5:46:15", "remaining_time": "4 days, 8:45:30", "throughput": 1216.38, "total_tokens": 25271120} |
| {"current_steps": 300, "total_steps": 5650, "loss": 0.6277, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.10616180828946786, "percentage": 5.31, "elapsed_time": "5:52:17", "remaining_time": "4 days, 8:42:35", "throughput": 1216.37, "total_tokens": 25711264} |
| {"current_steps": 305, "total_steps": 5650, "loss": 0.4608, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.107931171760959, "percentage": 5.4, "elapsed_time": "5:58:04", "remaining_time": "4 days, 8:35:10", "throughput": 1216.39, "total_tokens": 26133856} |
| {"current_steps": 310, "total_steps": 5650, "loss": 0.6676, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.10970053523245013, "percentage": 5.49, "elapsed_time": "6:03:59", "remaining_time": "4 days, 8:30:08", "throughput": 1216.42, "total_tokens": 26566464} |
| {"current_steps": 315, "total_steps": 5650, "loss": 0.391, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.11146989870394125, "percentage": 5.58, "elapsed_time": "6:09:41", "remaining_time": "4 days, 8:21:24", "throughput": 1216.65, "total_tokens": 26987696} |
| {"current_steps": 320, "total_steps": 5650, "loss": 0.519, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.11323926217543238, "percentage": 5.66, "elapsed_time": "6:15:41", "remaining_time": "4 days, 8:17:36", "throughput": 1216.54, "total_tokens": 27422736} |
| {"current_steps": 325, "total_steps": 5650, "loss": 0.638, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.11500862564692352, "percentage": 5.75, "elapsed_time": "6:21:29", "remaining_time": "4 days, 8:10:28", "throughput": 1216.6, "total_tokens": 27846896} |
| {"current_steps": 330, "total_steps": 5650, "loss": 0.5461, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.11677798911841465, "percentage": 5.84, "elapsed_time": "6:27:22", "remaining_time": "4 days, 8:05:00", "throughput": 1216.35, "total_tokens": 28271120} |
| {"current_steps": 335, "total_steps": 5650, "loss": 0.5056, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.11854735258990579, "percentage": 5.93, "elapsed_time": "6:33:17", "remaining_time": "4 days, 7:59:47", "throughput": 1216.39, "total_tokens": 28703424} |
| {"current_steps": 340, "total_steps": 5650, "loss": 0.4629, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.1203167160613969, "percentage": 6.02, "elapsed_time": "6:39:22", "remaining_time": "4 days, 7:57:25", "throughput": 1216.23, "total_tokens": 29144368} |
| {"current_steps": 345, "total_steps": 5650, "loss": 0.4835, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.12208607953288804, "percentage": 6.11, "elapsed_time": "6:45:28", "remaining_time": "4 days, 7:54:59", "throughput": 1216.02, "total_tokens": 29584352} |
| {"current_steps": 350, "total_steps": 5650, "loss": 0.3763, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.12385544300437917, "percentage": 6.19, "elapsed_time": "6:51:03", "remaining_time": "4 days, 7:44:35", "throughput": 1216.14, "total_tokens": 29994288} |
| {"current_steps": 355, "total_steps": 5650, "loss": 0.5416, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.1256248064758703, "percentage": 6.28, "elapsed_time": "6:57:10", "remaining_time": "4 days, 7:42:16", "throughput": 1216.13, "total_tokens": 30439920} |
| {"current_steps": 360, "total_steps": 5650, "loss": 0.3773, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.12739416994736144, "percentage": 6.37, "elapsed_time": "7:02:44", "remaining_time": "4 days, 7:31:50", "throughput": 1216.32, "total_tokens": 30850784} |
| {"current_steps": 365, "total_steps": 5650, "loss": 0.4021, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.12916353341885256, "percentage": 6.46, "elapsed_time": "7:08:33", "remaining_time": "4 days, 7:25:10", "throughput": 1216.37, "total_tokens": 31276512} |
| {"current_steps": 370, "total_steps": 5650, "loss": 0.4368, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.1309328968903437, "percentage": 6.55, "elapsed_time": "7:14:29", "remaining_time": "4 days, 7:20:17", "throughput": 1216.35, "total_tokens": 31709488} |
| {"current_steps": 375, "total_steps": 5650, "loss": 0.7189, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.13270226036183483, "percentage": 6.64, "elapsed_time": "7:20:20", "remaining_time": "4 days, 7:14:09", "throughput": 1216.45, "total_tokens": 32139280} |
| {"current_steps": 380, "total_steps": 5650, "loss": 0.6274, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.13447162383332595, "percentage": 6.73, "elapsed_time": "7:26:30", "remaining_time": "4 days, 7:12:21", "throughput": 1216.31, "total_tokens": 32585488} |
| {"current_steps": 385, "total_steps": 5650, "loss": 0.4543, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.1362409873048171, "percentage": 6.81, "elapsed_time": "7:32:18", "remaining_time": "4 days, 7:05:33", "throughput": 1216.31, "total_tokens": 33009248} |
| {"current_steps": 390, "total_steps": 5650, "loss": 0.5678, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.13801035077630822, "percentage": 6.9, "elapsed_time": "7:37:54", "remaining_time": "4 days, 6:55:55", "throughput": 1216.4, "total_tokens": 33420096} |
| {"current_steps": 395, "total_steps": 5650, "loss": 0.4672, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.13977971424779936, "percentage": 6.99, "elapsed_time": "7:43:41", "remaining_time": "4 days, 6:48:47", "throughput": 1216.38, "total_tokens": 33841152} |
| {"current_steps": 400, "total_steps": 5650, "loss": 0.5062, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.14154907771929048, "percentage": 7.08, "elapsed_time": "7:49:38", "remaining_time": "4 days, 6:44:02", "throughput": 1216.34, "total_tokens": 34274576} |
| {"current_steps": 405, "total_steps": 5650, "loss": 0.3181, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.1433184411907816, "percentage": 7.17, "elapsed_time": "7:55:23", "remaining_time": "4 days, 6:36:36", "throughput": 1216.42, "total_tokens": 34696512} |
| {"current_steps": 410, "total_steps": 5650, "loss": 0.5775, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.14508780466227275, "percentage": 7.26, "elapsed_time": "8:00:55", "remaining_time": "4 days, 6:26:31", "throughput": 1216.58, "total_tokens": 35105520} |
| {"current_steps": 415, "total_steps": 5650, "loss": 0.5774, "accuracy": 0.675000011920929, "lr": 5e-05, "epoch": 0.14685716813376387, "percentage": 7.35, "elapsed_time": "8:06:58", "remaining_time": "4 days, 6:22:57", "throughput": 1216.48, "total_tokens": 35543808} |
| {"current_steps": 420, "total_steps": 5650, "loss": 0.4911, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.14862653160525502, "percentage": 7.43, "elapsed_time": "8:12:38", "remaining_time": "4 days, 6:14:31", "throughput": 1216.58, "total_tokens": 35960080} |
| {"current_steps": 425, "total_steps": 5650, "loss": 0.4225, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.15039589507674614, "percentage": 7.52, "elapsed_time": "8:18:36", "remaining_time": "4 days, 6:09:58", "throughput": 1216.5, "total_tokens": 36393728} |
| {"current_steps": 430, "total_steps": 5650, "loss": 0.3742, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.15216525854823726, "percentage": 7.61, "elapsed_time": "8:23:53", "remaining_time": "4 days, 5:57:03", "throughput": 1216.7, "total_tokens": 36785408} |
| {"current_steps": 435, "total_steps": 5650, "loss": 0.6809, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.1539346220197284, "percentage": 7.7, "elapsed_time": "8:29:41", "remaining_time": "4 days, 5:50:31", "throughput": 1216.69, "total_tokens": 37208592} |
| {"current_steps": 440, "total_steps": 5650, "loss": 0.4763, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.15570398549121953, "percentage": 7.79, "elapsed_time": "8:35:46", "remaining_time": "4 days, 5:47:13", "throughput": 1216.66, "total_tokens": 37651264} |
| {"current_steps": 445, "total_steps": 5650, "loss": 0.2061, "accuracy": 0.925000011920929, "lr": 5e-05, "epoch": 0.15747334896271067, "percentage": 7.88, "elapsed_time": "8:41:32", "remaining_time": "4 days, 5:40:11", "throughput": 1216.69, "total_tokens": 38072752} |
| {"current_steps": 450, "total_steps": 5650, "loss": 0.5319, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.1592427124342018, "percentage": 7.96, "elapsed_time": "8:47:10", "remaining_time": "4 days, 5:31:45", "throughput": 1216.68, "total_tokens": 38484032} |
| {"current_steps": 455, "total_steps": 5650, "loss": 0.2169, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.16101207590569291, "percentage": 8.05, "elapsed_time": "8:52:55", "remaining_time": "4 days, 5:24:42", "throughput": 1216.73, "total_tokens": 38905632} |
| {"current_steps": 460, "total_steps": 5650, "loss": 0.6762, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.16278143937718406, "percentage": 8.14, "elapsed_time": "8:58:41", "remaining_time": "4 days, 5:17:51", "throughput": 1216.81, "total_tokens": 39329168} |
| {"current_steps": 465, "total_steps": 5650, "loss": 0.4977, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.16455080284867518, "percentage": 8.23, "elapsed_time": "9:04:27", "remaining_time": "4 days, 5:10:59", "throughput": 1216.83, "total_tokens": 39750912} |
| {"current_steps": 470, "total_steps": 5650, "loss": 0.5154, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.16632016632016633, "percentage": 8.32, "elapsed_time": "9:10:23", "remaining_time": "4 days, 5:05:58", "throughput": 1216.85, "total_tokens": 40184384} |
| {"current_steps": 475, "total_steps": 5650, "loss": 0.7516, "accuracy": 0.625, "lr": 5e-05, "epoch": 0.16808952979165745, "percentage": 8.41, "elapsed_time": "9:16:08", "remaining_time": "4 days, 4:58:58", "throughput": 1216.87, "total_tokens": 40604896} |
| {"current_steps": 480, "total_steps": 5650, "loss": 0.4826, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.16985889326314857, "percentage": 8.5, "elapsed_time": "9:22:09", "remaining_time": "4 days, 4:54:59", "throughput": 1216.8, "total_tokens": 41042464} |
| {"current_steps": 485, "total_steps": 5650, "loss": 0.468, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.17162825673463972, "percentage": 8.58, "elapsed_time": "9:27:24", "remaining_time": "4 days, 4:42:39", "throughput": 1216.99, "total_tokens": 41432176} |
| {"current_steps": 490, "total_steps": 5650, "loss": 0.4554, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.17339762020613084, "percentage": 8.67, "elapsed_time": "9:33:21", "remaining_time": "4 days, 4:37:52", "throughput": 1216.99, "total_tokens": 41866832} |
| {"current_steps": 495, "total_steps": 5650, "loss": 0.3794, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.17516698367762198, "percentage": 8.76, "elapsed_time": "9:39:30", "remaining_time": "4 days, 4:35:00", "throughput": 1216.92, "total_tokens": 42312256} |
| {"current_steps": 500, "total_steps": 5650, "loss": 0.6173, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.1769363471491131, "percentage": 8.85, "elapsed_time": "9:45:29", "remaining_time": "4 days, 4:30:29", "throughput": 1216.82, "total_tokens": 42745920} |
| {"current_steps": 505, "total_steps": 5650, "loss": 0.3998, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.17870571062060422, "percentage": 8.94, "elapsed_time": "9:51:40", "remaining_time": "4 days, 4:28:05", "throughput": 1216.75, "total_tokens": 43195520} |
| {"current_steps": 510, "total_steps": 5650, "loss": 0.289, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.18047507409209537, "percentage": 9.03, "elapsed_time": "9:57:39", "remaining_time": "4 days, 4:23:24", "throughput": 1216.73, "total_tokens": 43630816} |
| {"current_steps": 515, "total_steps": 5650, "loss": 0.367, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.1822444375635865, "percentage": 9.12, "elapsed_time": "10:03:32", "remaining_time": "4 days, 4:17:53", "throughput": 1216.74, "total_tokens": 44061616} |
| {"current_steps": 520, "total_steps": 5650, "loss": 0.3997, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.18401380103507764, "percentage": 9.2, "elapsed_time": "10:09:33", "remaining_time": "4 days, 4:13:30", "throughput": 1216.77, "total_tokens": 44501264} |
| {"current_steps": 525, "total_steps": 5650, "loss": 0.3655, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.18578316450656876, "percentage": 9.29, "elapsed_time": "10:15:43", "remaining_time": "4 days, 4:10:43", "throughput": 1216.69, "total_tokens": 44949280} |
| {"current_steps": 530, "total_steps": 5650, "loss": 0.5736, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.18755252797805988, "percentage": 9.38, "elapsed_time": "10:21:39", "remaining_time": "4 days, 4:05:24", "throughput": 1216.61, "total_tokens": 45378432} |
| {"current_steps": 535, "total_steps": 5650, "loss": 0.6538, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.18932189144955103, "percentage": 9.47, "elapsed_time": "10:27:44", "remaining_time": "4 days, 4:01:43", "throughput": 1216.48, "total_tokens": 45818368} |
| {"current_steps": 540, "total_steps": 5650, "loss": 0.6261, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.19109125492104215, "percentage": 9.56, "elapsed_time": "10:34:04", "remaining_time": "4 days, 4:00:15", "throughput": 1216.38, "total_tokens": 46276768} |
| {"current_steps": 545, "total_steps": 5650, "loss": 0.4122, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.1928606183925333, "percentage": 9.65, "elapsed_time": "10:39:39", "remaining_time": "4 days, 3:51:42", "throughput": 1216.44, "total_tokens": 46686592} |
| {"current_steps": 550, "total_steps": 5650, "loss": 0.6515, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.19462998186402442, "percentage": 9.73, "elapsed_time": "10:45:40", "remaining_time": "4 days, 3:47:09", "throughput": 1216.37, "total_tokens": 47122912} |
| {"current_steps": 555, "total_steps": 5650, "loss": 0.5666, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.19639934533551553, "percentage": 9.82, "elapsed_time": "10:51:54", "remaining_time": "4 days, 3:44:37", "throughput": 1216.25, "total_tokens": 47573008} |
| {"current_steps": 560, "total_steps": 5650, "loss": 0.3994, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.19816870880700668, "percentage": 9.91, "elapsed_time": "10:57:43", "remaining_time": "4 days, 3:38:11", "throughput": 1216.27, "total_tokens": 47997904} |
| {"current_steps": 565, "total_steps": 5650, "loss": 0.5355, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.1999380722784978, "percentage": 10.0, "elapsed_time": "11:03:37", "remaining_time": "4 days, 3:32:34", "throughput": 1216.29, "total_tokens": 48429200} |
| {"current_steps": 570, "total_steps": 5650, "loss": 0.484, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.20170743574998895, "percentage": 10.09, "elapsed_time": "11:09:50", "remaining_time": "4 days, 3:29:50", "throughput": 1216.18, "total_tokens": 48878960} |
| {"current_steps": 575, "total_steps": 5650, "loss": 0.5568, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.20347679922148007, "percentage": 10.18, "elapsed_time": "11:15:29", "remaining_time": "4 days, 3:21:59", "throughput": 1216.26, "total_tokens": 49294800} |
| {"current_steps": 580, "total_steps": 5650, "loss": 0.4609, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.2052461626929712, "percentage": 10.27, "elapsed_time": "11:21:10", "remaining_time": "4 days, 3:14:22", "throughput": 1216.33, "total_tokens": 49711712} |
| {"current_steps": 585, "total_steps": 5650, "loss": 0.9046, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.20701552616446234, "percentage": 10.35, "elapsed_time": "11:27:06", "remaining_time": "4 days, 3:09:02", "throughput": 1216.27, "total_tokens": 50142368} |
| {"current_steps": 590, "total_steps": 5650, "loss": 0.5276, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.20878488963595346, "percentage": 10.44, "elapsed_time": "11:33:18", "remaining_time": "4 days, 3:05:57", "throughput": 1216.23, "total_tokens": 50593120} |
| {"current_steps": 595, "total_steps": 5650, "loss": 0.701, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.2105542531074446, "percentage": 10.53, "elapsed_time": "11:38:54", "remaining_time": "4 days, 2:57:48", "throughput": 1216.34, "total_tokens": 51006832} |
| {"current_steps": 600, "total_steps": 5650, "loss": 0.6403, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.21232361657893573, "percentage": 10.62, "elapsed_time": "11:44:47", "remaining_time": "4 days, 2:51:57", "throughput": 1216.31, "total_tokens": 51434480} |
| {"current_steps": 605, "total_steps": 5650, "loss": 0.5286, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.21409298005042685, "percentage": 10.71, "elapsed_time": "11:50:47", "remaining_time": "4 days, 2:47:07", "throughput": 1216.34, "total_tokens": 51873200} |
| {"current_steps": 610, "total_steps": 5650, "loss": 0.3787, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.215862343521918, "percentage": 10.8, "elapsed_time": "11:56:15", "remaining_time": "4 days, 2:38:00", "throughput": 1216.47, "total_tokens": 52279168} |
| {"current_steps": 615, "total_steps": 5650, "loss": 0.3953, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.2176317069934091, "percentage": 10.88, "elapsed_time": "12:01:59", "remaining_time": "4 days, 2:30:52", "throughput": 1216.54, "total_tokens": 52699424} |
| {"current_steps": 620, "total_steps": 5650, "loss": 0.387, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.21940107046490026, "percentage": 10.97, "elapsed_time": "12:07:46", "remaining_time": "4 days, 2:24:18", "throughput": 1216.48, "total_tokens": 53119104} |
| {"current_steps": 625, "total_steps": 5650, "loss": 0.3241, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.22117043393639138, "percentage": 11.06, "elapsed_time": "12:14:06", "remaining_time": "4 days, 2:22:10", "throughput": 1216.32, "total_tokens": 53574080} |
| {"current_steps": 630, "total_steps": 5650, "loss": 0.5328, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.2229397974078825, "percentage": 11.15, "elapsed_time": "12:19:32", "remaining_time": "4 days, 2:12:51", "throughput": 1216.48, "total_tokens": 53978416} |
| {"current_steps": 635, "total_steps": 5650, "loss": 0.345, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.22470916087937365, "percentage": 11.24, "elapsed_time": "12:26:25", "remaining_time": "4 days, 2:15:02", "throughput": 1216.09, "total_tokens": 54463632} |
| {"current_steps": 640, "total_steps": 5650, "loss": 0.3271, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.22647852435086477, "percentage": 11.33, "elapsed_time": "12:32:18", "remaining_time": "4 days, 2:09:11", "throughput": 1216.09, "total_tokens": 54892560} |
| {"current_steps": 645, "total_steps": 5650, "loss": 0.372, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.22824788782235592, "percentage": 11.42, "elapsed_time": "12:38:33", "remaining_time": "4 days, 2:06:07", "throughput": 1216.03, "total_tokens": 55345584} |
| {"current_steps": 650, "total_steps": 5650, "loss": 0.6258, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.23001725129384704, "percentage": 11.5, "elapsed_time": "12:44:13", "remaining_time": "4 days, 1:58:38", "throughput": 1216.11, "total_tokens": 55762704} |
| {"current_steps": 655, "total_steps": 5650, "loss": 0.5042, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.23178661476533816, "percentage": 11.59, "elapsed_time": "12:49:51", "remaining_time": "4 days, 1:50:57", "throughput": 1216.14, "total_tokens": 56175680} |
| {"current_steps": 660, "total_steps": 5650, "loss": 0.527, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.2335559782368293, "percentage": 11.68, "elapsed_time": "12:55:43", "remaining_time": "4 days, 1:44:59", "throughput": 1216.13, "total_tokens": 56603424} |
| {"current_steps": 665, "total_steps": 5650, "loss": 0.5832, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.23532534170832042, "percentage": 11.77, "elapsed_time": "13:01:46", "remaining_time": "4 days, 1:40:22", "throughput": 1216.14, "total_tokens": 57045024} |
| {"current_steps": 670, "total_steps": 5650, "loss": 0.1878, "accuracy": 0.925000011920929, "lr": 5e-05, "epoch": 0.23709470517981157, "percentage": 11.86, "elapsed_time": "13:07:22", "remaining_time": "4 days, 1:32:29", "throughput": 1216.22, "total_tokens": 57457936} |
| {"current_steps": 675, "total_steps": 5650, "loss": 0.5784, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.2388640686513027, "percentage": 11.95, "elapsed_time": "13:13:25", "remaining_time": "4 days, 1:27:52", "throughput": 1216.17, "total_tokens": 57896768} |
| {"current_steps": 680, "total_steps": 5650, "loss": 0.4625, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.2406334321227938, "percentage": 12.04, "elapsed_time": "13:19:28", "remaining_time": "4 days, 1:23:11", "throughput": 1216.13, "total_tokens": 58335520} |
| {"current_steps": 685, "total_steps": 5650, "loss": 0.3701, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.24240279559428496, "percentage": 12.12, "elapsed_time": "13:25:19", "remaining_time": "4 days, 1:17:06", "throughput": 1216.14, "total_tokens": 58762928} |
| {"current_steps": 690, "total_steps": 5650, "loss": 0.3422, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.24417215906577608, "percentage": 12.21, "elapsed_time": "13:31:23", "remaining_time": "4 days, 1:12:38", "throughput": 1216.09, "total_tokens": 59203888} |
| {"current_steps": 695, "total_steps": 5650, "loss": 0.2533, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.24594152253726723, "percentage": 12.3, "elapsed_time": "13:36:53", "remaining_time": "4 days, 1:04:02", "throughput": 1216.18, "total_tokens": 59609616} |
| {"current_steps": 700, "total_steps": 5650, "loss": 0.2436, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.24771088600875835, "percentage": 12.39, "elapsed_time": "13:42:44", "remaining_time": "4 days, 0:57:59", "throughput": 1216.19, "total_tokens": 60037040} |
| {"current_steps": 705, "total_steps": 5650, "loss": 0.3803, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.2494802494802495, "percentage": 12.48, "elapsed_time": "13:48:49", "remaining_time": "4 days, 0:53:28", "throughput": 1216.13, "total_tokens": 60476768} |
| {"current_steps": 710, "total_steps": 5650, "loss": 0.4185, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.2512496129517406, "percentage": 12.57, "elapsed_time": "13:55:06", "remaining_time": "4 days, 0:50:27", "throughput": 1216.0, "total_tokens": 60929392} |
| {"current_steps": 715, "total_steps": 5650, "loss": 0.4909, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.25301897642323173, "percentage": 12.65, "elapsed_time": "14:01:00", "remaining_time": "4 days, 0:44:42", "throughput": 1216.02, "total_tokens": 61361088} |
| {"current_steps": 720, "total_steps": 5650, "loss": 0.4257, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.2547883398947229, "percentage": 12.74, "elapsed_time": "14:06:13", "remaining_time": "4 days, 0:34:17", "throughput": 1216.09, "total_tokens": 61745280} |
| {"current_steps": 725, "total_steps": 5650, "loss": 0.4216, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.25655770336621403, "percentage": 12.83, "elapsed_time": "14:12:26", "remaining_time": "4 days, 0:30:44", "throughput": 1216.0, "total_tokens": 62194208} |
| {"current_steps": 730, "total_steps": 5650, "loss": 0.4921, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.2583270668377051, "percentage": 12.92, "elapsed_time": "14:18:11", "remaining_time": "4 days, 0:23:56", "throughput": 1216.05, "total_tokens": 62616000} |
| {"current_steps": 735, "total_steps": 5650, "loss": 0.5456, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.26009643030919627, "percentage": 13.01, "elapsed_time": "14:24:01", "remaining_time": "4 days, 0:17:50", "throughput": 1216.05, "total_tokens": 63042272} |
| {"current_steps": 740, "total_steps": 5650, "loss": 0.3492, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.2618657937806874, "percentage": 13.1, "elapsed_time": "14:29:50", "remaining_time": "4 days, 0:11:31", "throughput": 1216.06, "total_tokens": 63466752} |
| {"current_steps": 745, "total_steps": 5650, "loss": 0.2846, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.2636351572521785, "percentage": 13.19, "elapsed_time": "14:35:46", "remaining_time": "4 days, 0:05:59", "throughput": 1216.03, "total_tokens": 63898224} |
| {"current_steps": 750, "total_steps": 5650, "loss": 0.5799, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.26540452072366966, "percentage": 13.27, "elapsed_time": "14:41:54", "remaining_time": "4 days, 0:01:47", "throughput": 1215.99, "total_tokens": 64343376} |
| {"current_steps": 755, "total_steps": 5650, "loss": 0.7227, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.2671738841951608, "percentage": 13.36, "elapsed_time": "14:47:57", "remaining_time": "3 days, 23:56:58", "throughput": 1215.96, "total_tokens": 64782496} |
| {"current_steps": 760, "total_steps": 5650, "loss": 0.5296, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.2689432476666519, "percentage": 13.45, "elapsed_time": "14:53:43", "remaining_time": "3 days, 23:50:26", "throughput": 1215.92, "total_tokens": 65202528} |
| {"current_steps": 765, "total_steps": 5650, "loss": 0.3434, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.27071261113814304, "percentage": 13.54, "elapsed_time": "14:59:42", "remaining_time": "3 days, 23:45:14", "throughput": 1215.91, "total_tokens": 65638112} |
| {"current_steps": 770, "total_steps": 5650, "loss": 0.3618, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.2724819746096342, "percentage": 13.63, "elapsed_time": "15:05:21", "remaining_time": "3 days, 23:37:49", "throughput": 1215.95, "total_tokens": 66051936} |
| {"current_steps": 775, "total_steps": 5650, "loss": 0.2786, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.27425133808112534, "percentage": 13.72, "elapsed_time": "15:10:23", "remaining_time": "3 days, 23:26:37", "throughput": 1216.15, "total_tokens": 66430048} |
| {"current_steps": 780, "total_steps": 5650, "loss": 0.4517, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.27602070155261643, "percentage": 13.81, "elapsed_time": "15:16:25", "remaining_time": "3 days, 23:21:45", "throughput": 1216.1, "total_tokens": 66867392} |
| {"current_steps": 785, "total_steps": 5650, "loss": 0.5228, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.2777900650241076, "percentage": 13.89, "elapsed_time": "15:22:21", "remaining_time": "3 days, 23:16:16", "throughput": 1216.13, "total_tokens": 67302704} |
| {"current_steps": 790, "total_steps": 5650, "loss": 0.6936, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.2795594284955987, "percentage": 13.98, "elapsed_time": "15:28:38", "remaining_time": "3 days, 23:12:53", "throughput": 1216.09, "total_tokens": 67758592} |
| {"current_steps": 795, "total_steps": 5650, "loss": 0.305, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.2813287919670898, "percentage": 14.07, "elapsed_time": "15:34:32", "remaining_time": "3 days, 23:07:12", "throughput": 1216.06, "total_tokens": 68187872} |
| {"current_steps": 800, "total_steps": 5650, "loss": 0.2953, "accuracy": 0.925000011920929, "lr": 5e-05, "epoch": 0.28309815543858097, "percentage": 14.16, "elapsed_time": "15:40:44", "remaining_time": "3 days, 23:03:16", "throughput": 1216.01, "total_tokens": 68637280} |
| {"current_steps": 805, "total_steps": 5650, "loss": 0.7255, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.2848675189100721, "percentage": 14.25, "elapsed_time": "15:46:48", "remaining_time": "3 days, 22:58:29", "throughput": 1215.96, "total_tokens": 69077024} |
| {"current_steps": 810, "total_steps": 5650, "loss": 0.4705, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.2866368823815632, "percentage": 14.34, "elapsed_time": "15:52:59", "remaining_time": "3 days, 22:54:26", "throughput": 1215.89, "total_tokens": 69524112} |
| {"current_steps": 815, "total_steps": 5650, "loss": 0.5801, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.28840624585305435, "percentage": 14.42, "elapsed_time": "15:59:01", "remaining_time": "3 days, 22:49:27", "throughput": 1215.91, "total_tokens": 69965824} |
| {"current_steps": 820, "total_steps": 5650, "loss": 0.4369, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.2901756093245455, "percentage": 14.51, "elapsed_time": "16:05:12", "remaining_time": "3 days, 22:45:18", "throughput": 1215.85, "total_tokens": 70412688} |
| {"current_steps": 825, "total_steps": 5650, "loss": 0.4453, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.29194497279603665, "percentage": 14.6, "elapsed_time": "16:10:46", "remaining_time": "3 days, 22:37:35", "throughput": 1215.85, "total_tokens": 70819184} |
| {"current_steps": 830, "total_steps": 5650, "loss": 0.2737, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.29371433626752774, "percentage": 14.69, "elapsed_time": "16:17:00", "remaining_time": "3 days, 22:33:44", "throughput": 1215.76, "total_tokens": 71269008} |
| {"current_steps": 835, "total_steps": 5650, "loss": 0.23, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.2954836997390189, "percentage": 14.78, "elapsed_time": "16:22:55", "remaining_time": "3 days, 22:28:00", "throughput": 1215.79, "total_tokens": 71701728} |
| {"current_steps": 840, "total_steps": 5650, "loss": 0.263, "accuracy": 0.925000011920929, "lr": 5e-05, "epoch": 0.29725306321051004, "percentage": 14.87, "elapsed_time": "16:29:03", "remaining_time": "3 days, 22:23:30", "throughput": 1215.75, "total_tokens": 72146848} |
| {"current_steps": 845, "total_steps": 5650, "loss": 0.7728, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.29902242668200113, "percentage": 14.96, "elapsed_time": "16:34:42", "remaining_time": "3 days, 22:16:19", "throughput": 1215.79, "total_tokens": 72561872} |
| {"current_steps": 850, "total_steps": 5650, "loss": 0.31, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.3007917901534923, "percentage": 15.04, "elapsed_time": "16:40:28", "remaining_time": "3 days, 22:09:43", "throughput": 1215.82, "total_tokens": 72983456} |
| {"current_steps": 855, "total_steps": 5650, "loss": 0.3231, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.3025611536249834, "percentage": 15.13, "elapsed_time": "16:46:38", "remaining_time": "3 days, 22:05:27", "throughput": 1215.79, "total_tokens": 73432112} |
| {"current_steps": 860, "total_steps": 5650, "loss": 0.2965, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3043305170964745, "percentage": 15.22, "elapsed_time": "16:52:37", "remaining_time": "3 days, 22:00:05", "throughput": 1215.78, "total_tokens": 73867616} |
| {"current_steps": 865, "total_steps": 5650, "loss": 0.6317, "accuracy": 0.7250000238418579, "lr": 5e-05, "epoch": 0.30609988056796567, "percentage": 15.31, "elapsed_time": "16:58:30", "remaining_time": "3 days, 21:54:10", "throughput": 1215.77, "total_tokens": 74296384} |
| {"current_steps": 870, "total_steps": 5650, "loss": 0.3742, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3078692440394568, "percentage": 15.4, "elapsed_time": "17:04:16", "remaining_time": "3 days, 21:47:38", "throughput": 1215.8, "total_tokens": 74719152} |
| {"current_steps": 875, "total_steps": 5650, "loss": 0.7317, "accuracy": 0.699999988079071, "lr": 5e-05, "epoch": 0.30963860751094796, "percentage": 15.49, "elapsed_time": "17:10:07", "remaining_time": "3 days, 21:41:30", "throughput": 1215.84, "total_tokens": 75147360} |
| {"current_steps": 880, "total_steps": 5650, "loss": 0.4742, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.31140797098243905, "percentage": 15.58, "elapsed_time": "17:16:13", "remaining_time": "3 days, 21:36:47", "throughput": 1215.77, "total_tokens": 75588640} |
| {"current_steps": 885, "total_steps": 5650, "loss": 0.4411, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.3131773344539302, "percentage": 15.66, "elapsed_time": "17:22:16", "remaining_time": "3 days, 21:31:45", "throughput": 1215.75, "total_tokens": 76028464} |
| {"current_steps": 890, "total_steps": 5650, "loss": 0.3603, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.31494669792542135, "percentage": 15.75, "elapsed_time": "17:28:18", "remaining_time": "3 days, 21:26:39", "throughput": 1215.72, "total_tokens": 76466512} |
| {"current_steps": 895, "total_steps": 5650, "loss": 0.4708, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.31671606139691244, "percentage": 15.84, "elapsed_time": "17:34:15", "remaining_time": "3 days, 21:21:08", "throughput": 1215.67, "total_tokens": 76897952} |
| {"current_steps": 900, "total_steps": 5650, "loss": 0.5458, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3184854248684036, "percentage": 15.93, "elapsed_time": "17:40:07", "remaining_time": "3 days, 21:15:08", "throughput": 1215.66, "total_tokens": 77325616} |
| {"current_steps": 905, "total_steps": 5650, "loss": 0.3873, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.32025478833989474, "percentage": 16.02, "elapsed_time": "17:45:38", "remaining_time": "3 days, 21:07:18", "throughput": 1215.72, "total_tokens": 77732032} |
| {"current_steps": 910, "total_steps": 5650, "loss": 0.4705, "accuracy": 0.7750000357627869, "lr": 5e-05, "epoch": 0.32202415181138583, "percentage": 16.11, "elapsed_time": "17:51:41", "remaining_time": "3 days, 21:02:12", "throughput": 1215.7, "total_tokens": 78171152} |
| {"current_steps": 915, "total_steps": 5650, "loss": 0.4214, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.323793515282877, "percentage": 16.19, "elapsed_time": "17:57:38", "remaining_time": "3 days, 20:56:38", "throughput": 1215.72, "total_tokens": 78606736} |
| {"current_steps": 920, "total_steps": 5650, "loss": 0.4696, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.3255628787543681, "percentage": 16.28, "elapsed_time": "18:03:49", "remaining_time": "3 days, 20:52:16", "throughput": 1215.67, "total_tokens": 79054704} |
| {"current_steps": 925, "total_steps": 5650, "loss": 0.5645, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.32733224222585927, "percentage": 16.37, "elapsed_time": "18:09:56", "remaining_time": "3 days, 20:47:31", "throughput": 1215.62, "total_tokens": 79497344} |
| {"current_steps": 930, "total_steps": 5650, "loss": 0.4224, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.32910160569735036, "percentage": 16.46, "elapsed_time": "18:15:59", "remaining_time": "3 days, 20:42:25", "throughput": 1215.6, "total_tokens": 79937104} |
| {"current_steps": 935, "total_steps": 5650, "loss": 0.1669, "accuracy": 0.925000011920929, "lr": 5e-05, "epoch": 0.3308709691688415, "percentage": 16.55, "elapsed_time": "18:22:08", "remaining_time": "3 days, 20:37:52", "throughput": 1215.56, "total_tokens": 80383424} |
| {"current_steps": 940, "total_steps": 5650, "loss": 0.3363, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.33264033264033266, "percentage": 16.64, "elapsed_time": "18:28:05", "remaining_time": "3 days, 20:32:13", "throughput": 1215.55, "total_tokens": 80816144} |
| {"current_steps": 945, "total_steps": 5650, "loss": 0.5649, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.33440969611182375, "percentage": 16.73, "elapsed_time": "18:34:04", "remaining_time": "3 days, 20:26:46", "throughput": 1215.56, "total_tokens": 81253168} |
| {"current_steps": 950, "total_steps": 5650, "loss": 0.1902, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.3361790595833149, "percentage": 16.81, "elapsed_time": "18:39:41", "remaining_time": "3 days, 20:19:30", "throughput": 1215.61, "total_tokens": 81666336} |
| {"current_steps": 955, "total_steps": 5650, "loss": 0.3939, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.33794842305480605, "percentage": 16.9, "elapsed_time": "18:45:27", "remaining_time": "3 days, 20:13:00", "throughput": 1215.62, "total_tokens": 82087904} |
| {"current_steps": 960, "total_steps": 5650, "loss": 0.4545, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.33971778652629714, "percentage": 16.99, "elapsed_time": "18:51:43", "remaining_time": "3 days, 20:08:58", "throughput": 1215.57, "total_tokens": 82541648} |
| {"current_steps": 965, "total_steps": 5650, "loss": 0.301, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.3414871499977883, "percentage": 17.08, "elapsed_time": "18:57:30", "remaining_time": "3 days, 20:02:28", "throughput": 1215.59, "total_tokens": 82963968} |
| {"current_steps": 970, "total_steps": 5650, "loss": 0.3444, "accuracy": 0.800000011920929, "lr": 5e-05, "epoch": 0.34325651346927943, "percentage": 17.17, "elapsed_time": "19:03:28", "remaining_time": "3 days, 19:56:57", "throughput": 1215.55, "total_tokens": 83396720} |
| {"current_steps": 975, "total_steps": 5650, "loss": 0.4458, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.3450258769407706, "percentage": 17.26, "elapsed_time": "19:09:10", "remaining_time": "3 days, 19:50:07", "throughput": 1215.58, "total_tokens": 83814640} |
| {"current_steps": 980, "total_steps": 5650, "loss": 0.3216, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3467952404122617, "percentage": 17.35, "elapsed_time": "19:15:05", "remaining_time": "3 days, 19:44:21", "throughput": 1215.57, "total_tokens": 84245888} |
| {"current_steps": 985, "total_steps": 5650, "loss": 0.2563, "accuracy": 0.875, "lr": 5e-05, "epoch": 0.3485646038837528, "percentage": 17.43, "elapsed_time": "19:20:59", "remaining_time": "3 days, 19:38:31", "throughput": 1215.6, "total_tokens": 84678784} |
| {"current_steps": 990, "total_steps": 5650, "loss": 0.4849, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.35033396735524397, "percentage": 17.52, "elapsed_time": "19:27:02", "remaining_time": "3 days, 19:33:19", "throughput": 1215.59, "total_tokens": 85118464} |
| {"current_steps": 995, "total_steps": 5650, "loss": 0.5631, "accuracy": 0.9000000357627869, "lr": 5e-05, "epoch": 0.35210333082673506, "percentage": 17.61, "elapsed_time": "19:33:07", "remaining_time": "3 days, 19:28:20", "throughput": 1215.54, "total_tokens": 85559040} |
| {"current_steps": 1000, "total_steps": 5650, "loss": 0.3912, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3538726942982262, "percentage": 17.7, "elapsed_time": "19:38:57", "remaining_time": "3 days, 19:22:07", "throughput": 1215.55, "total_tokens": 85984288} |
| {"current_steps": 1005, "total_steps": 5650, "loss": 0.2859, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.35564205776971736, "percentage": 17.79, "elapsed_time": "19:45:08", "remaining_time": "3 days, 19:17:37", "throughput": 1215.4, "total_tokens": 86425696} |
| {"current_steps": 1010, "total_steps": 5650, "loss": 0.3711, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.35741142124120845, "percentage": 17.88, "elapsed_time": "19:51:17", "remaining_time": "3 days, 19:12:51", "throughput": 1215.38, "total_tokens": 86871840} |
| {"current_steps": 1015, "total_steps": 5650, "loss": 0.5815, "accuracy": 0.75, "lr": 5e-05, "epoch": 0.3591807847126996, "percentage": 17.96, "elapsed_time": "19:57:02", "remaining_time": "3 days, 19:06:16", "throughput": 1215.4, "total_tokens": 87292992} |
| {"current_steps": 1020, "total_steps": 5650, "loss": 0.3729, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.36095014818419074, "percentage": 18.05, "elapsed_time": "20:02:57", "remaining_time": "3 days, 19:00:27", "throughput": 1215.4, "total_tokens": 87723920} |
| {"current_steps": 1025, "total_steps": 5650, "loss": 0.2932, "accuracy": 0.8500000238418579, "lr": 5e-05, "epoch": 0.3627195116556819, "percentage": 18.14, "elapsed_time": "20:08:46", "remaining_time": "3 days, 18:54:15", "throughput": 1215.39, "total_tokens": 88148800} |
| {"current_steps": 1030, "total_steps": 5650, "loss": 0.4418, "accuracy": 0.824999988079071, "lr": 5e-05, "epoch": 0.364488875127173, "percentage": 18.23, "elapsed_time": "20:14:40", "remaining_time": "3 days, 18:48:21", "throughput": 1215.43, "total_tokens": 88581088} |
|
|