| {"current_steps": 1, "total_steps": 45, "loss": 1.8295, "lr": 9.987820251299122e-05, "epoch": 0.10191082802547771, "percentage": 2.22, "elapsed_time": "0:02:55", "remaining_time": "2:08:59", "throughput": 1490.41, "total_tokens": 262144} |
| {"current_steps": 2, "total_steps": 45, "loss": 1.7519, "lr": 9.951340343707852e-05, "epoch": 0.20382165605095542, "percentage": 4.44, "elapsed_time": "0:05:50", "remaining_time": "2:05:28", "throughput": 1497.36, "total_tokens": 524288} |
| {"current_steps": 3, "total_steps": 45, "loss": 1.548, "lr": 9.890738003669029e-05, "epoch": 0.3057324840764331, "percentage": 6.67, "elapsed_time": "0:08:44", "remaining_time": "2:02:23", "throughput": 1499.25, "total_tokens": 786432} |
| {"current_steps": 4, "total_steps": 45, "loss": 1.4192, "lr": 9.806308479691595e-05, "epoch": 0.40764331210191085, "percentage": 8.89, "elapsed_time": "0:11:38", "remaining_time": "1:59:21", "throughput": 1500.78, "total_tokens": 1048576} |
| {"current_steps": 5, "total_steps": 45, "loss": 1.3309, "lr": 9.698463103929542e-05, "epoch": 0.5095541401273885, "percentage": 11.11, "elapsed_time": "0:14:33", "remaining_time": "1:56:25", "throughput": 1501.18, "total_tokens": 1310720} |
| {"current_steps": 6, "total_steps": 45, "loss": 1.2174, "lr": 9.567727288213005e-05, "epoch": 0.6114649681528662, "percentage": 13.33, "elapsed_time": "0:17:27", "remaining_time": "1:53:28", "throughput": 1501.6, "total_tokens": 1572864} |
| {"current_steps": 7, "total_steps": 45, "loss": 1.1651, "lr": 9.414737964294636e-05, "epoch": 0.7133757961783439, "percentage": 15.56, "elapsed_time": "0:20:22", "remaining_time": "1:50:34", "throughput": 1501.56, "total_tokens": 1835008} |
| {"current_steps": 8, "total_steps": 45, "loss": 1.1265, "lr": 9.24024048078213e-05, "epoch": 0.8152866242038217, "percentage": 17.78, "elapsed_time": "0:23:16", "remaining_time": "1:47:40", "throughput": 1501.25, "total_tokens": 2097152} |
| {"current_steps": 9, "total_steps": 45, "loss": 1.0418, "lr": 9.045084971874738e-05, "epoch": 0.9171974522292994, "percentage": 20.0, "elapsed_time": "0:26:11", "remaining_time": "1:44:47", "throughput": 1501.0, "total_tokens": 2359296} |
| {"current_steps": 10, "total_steps": 45, "loss": 1.8242, "lr": 8.83022221559489e-05, "epoch": 1.1019108280254777, "percentage": 22.22, "elapsed_time": "0:30:23", "remaining_time": "1:46:20", "throughput": 1500.84, "total_tokens": 2736128} |
| {"current_steps": 11, "total_steps": 45, "loss": 0.7817, "lr": 8.596699001693255e-05, "epoch": 1.2038216560509554, "percentage": 24.44, "elapsed_time": "0:33:17", "remaining_time": "1:42:54", "throughput": 1500.98, "total_tokens": 2998272} |
| {"current_steps": 12, "total_steps": 45, "loss": 0.7755, "lr": 8.345653031794292e-05, "epoch": 1.305732484076433, "percentage": 26.67, "elapsed_time": "0:36:12", "remaining_time": "1:39:33", "throughput": 1501.01, "total_tokens": 3260416} |
| {"current_steps": 13, "total_steps": 45, "loss": 0.7461, "lr": 8.07830737662829e-05, "epoch": 1.4076433121019107, "percentage": 28.89, "elapsed_time": "0:39:06", "remaining_time": "1:36:15", "throughput": 1501.23, "total_tokens": 3522560} |
| {"current_steps": 14, "total_steps": 45, "loss": 0.7051, "lr": 7.795964517353735e-05, "epoch": 1.5095541401273884, "percentage": 31.11, "elapsed_time": "0:42:00", "remaining_time": "1:33:01", "throughput": 1501.43, "total_tokens": 3784704} |
| {"current_steps": 15, "total_steps": 45, "loss": 0.7105, "lr": 7.500000000000001e-05, "epoch": 1.611464968152866, "percentage": 33.33, "elapsed_time": "0:44:55", "remaining_time": "1:29:50", "throughput": 1501.5, "total_tokens": 4046848} |
| {"current_steps": 16, "total_steps": 45, "loss": 0.6743, "lr": 7.191855733945387e-05, "epoch": 1.7133757961783438, "percentage": 35.56, "elapsed_time": "0:47:49", "remaining_time": "1:26:41", "throughput": 1501.54, "total_tokens": 4308992} |
| {"current_steps": 17, "total_steps": 45, "loss": 0.6563, "lr": 6.873032967079561e-05, "epoch": 1.8152866242038217, "percentage": 37.78, "elapsed_time": "0:50:44", "remaining_time": "1:23:34", "throughput": 1501.49, "total_tokens": 4571136} |
| {"current_steps": 18, "total_steps": 45, "loss": 0.6639, "lr": 6.545084971874738e-05, "epoch": 1.9171974522292994, "percentage": 40.0, "elapsed_time": "0:53:38", "remaining_time": "1:20:28", "throughput": 1501.57, "total_tokens": 4833280} |
| {"current_steps": 19, "total_steps": 45, "loss": 1.1352, "lr": 6.209609477998338e-05, "epoch": 2.1019108280254777, "percentage": 42.22, "elapsed_time": "0:57:49", "remaining_time": "1:19:07", "throughput": 1501.78, "total_tokens": 5210112} |
| {"current_steps": 20, "total_steps": 45, "loss": 0.4333, "lr": 5.868240888334653e-05, "epoch": 2.2038216560509554, "percentage": 44.44, "elapsed_time": "1:00:43", "remaining_time": "1:15:54", "throughput": 1501.85, "total_tokens": 5472256} |
| {"current_steps": 21, "total_steps": 45, "loss": 0.4481, "lr": 5.522642316338268e-05, "epoch": 2.305732484076433, "percentage": 46.67, "elapsed_time": "1:03:37", "remaining_time": "1:12:43", "throughput": 1501.98, "total_tokens": 5734400} |
| {"current_steps": 22, "total_steps": 45, "loss": 0.4308, "lr": 5.174497483512506e-05, "epoch": 2.4076433121019107, "percentage": 48.89, "elapsed_time": "1:06:32", "remaining_time": "1:09:33", "throughput": 1502.13, "total_tokens": 5996544} |
| {"current_steps": 23, "total_steps": 45, "loss": 0.4263, "lr": 4.825502516487497e-05, "epoch": 2.5095541401273884, "percentage": 51.11, "elapsed_time": "1:09:26", "remaining_time": "1:06:25", "throughput": 1502.15, "total_tokens": 6258688} |
| {"current_steps": 24, "total_steps": 45, "loss": 0.4325, "lr": 4.477357683661734e-05, "epoch": 2.611464968152866, "percentage": 53.33, "elapsed_time": "1:12:20", "remaining_time": "1:03:18", "throughput": 1502.2, "total_tokens": 6520832} |
| {"current_steps": 25, "total_steps": 45, "loss": 0.4288, "lr": 4.131759111665349e-05, "epoch": 2.713375796178344, "percentage": 55.56, "elapsed_time": "1:15:15", "remaining_time": "1:00:12", "throughput": 1502.18, "total_tokens": 6782976} |
| {"current_steps": 26, "total_steps": 45, "loss": 0.4328, "lr": 3.790390522001662e-05, "epoch": 2.8152866242038215, "percentage": 57.78, "elapsed_time": "1:18:10", "remaining_time": "0:57:07", "throughput": 1502.06, "total_tokens": 7045120} |
| {"current_steps": 27, "total_steps": 45, "loss": 0.4079, "lr": 3.4549150281252636e-05, "epoch": 2.917197452229299, "percentage": 60.0, "elapsed_time": "1:21:04", "remaining_time": "0:54:03", "throughput": 1502.03, "total_tokens": 7307264} |
| {"current_steps": 28, "total_steps": 45, "loss": 0.682, "lr": 3.12696703292044e-05, "epoch": 3.1019108280254777, "percentage": 62.22, "elapsed_time": "1:25:16", "remaining_time": "0:51:46", "throughput": 1501.96, "total_tokens": 7684096} |
| {"current_steps": 29, "total_steps": 45, "loss": 0.2745, "lr": 2.8081442660546125e-05, "epoch": 3.2038216560509554, "percentage": 64.44, "elapsed_time": "1:28:10", "remaining_time": "0:48:38", "throughput": 1502.03, "total_tokens": 7946240} |
| {"current_steps": 30, "total_steps": 45, "loss": 0.2449, "lr": 2.500000000000001e-05, "epoch": 3.305732484076433, "percentage": 66.67, "elapsed_time": "1:31:04", "remaining_time": "0:45:32", "throughput": 1502.0, "total_tokens": 8208384} |
| {"current_steps": 31, "total_steps": 45, "loss": 0.2599, "lr": 2.2040354826462668e-05, "epoch": 3.4076433121019107, "percentage": 68.89, "elapsed_time": "1:33:59", "remaining_time": "0:42:26", "throughput": 1501.97, "total_tokens": 8470528} |
| {"current_steps": 32, "total_steps": 45, "loss": 0.2269, "lr": 1.9216926233717085e-05, "epoch": 3.5095541401273884, "percentage": 71.11, "elapsed_time": "1:36:54", "remaining_time": "0:39:21", "throughput": 1501.99, "total_tokens": 8732672} |
| {"current_steps": 33, "total_steps": 45, "loss": 0.2438, "lr": 1.6543469682057106e-05, "epoch": 3.611464968152866, "percentage": 73.33, "elapsed_time": "1:39:48", "remaining_time": "0:36:17", "throughput": 1502.0, "total_tokens": 8994816} |
| {"current_steps": 34, "total_steps": 45, "loss": 0.2341, "lr": 1.4033009983067452e-05, "epoch": 3.713375796178344, "percentage": 75.56, "elapsed_time": "1:42:43", "remaining_time": "0:33:13", "throughput": 1502.0, "total_tokens": 9256960} |
| {"current_steps": 35, "total_steps": 45, "loss": 0.2269, "lr": 1.1697777844051105e-05, "epoch": 3.8152866242038215, "percentage": 77.78, "elapsed_time": "1:45:37", "remaining_time": "0:30:10", "throughput": 1502.02, "total_tokens": 9519104} |
| {"current_steps": 36, "total_steps": 45, "loss": 0.2346, "lr": 9.549150281252633e-06, "epoch": 3.917197452229299, "percentage": 80.0, "elapsed_time": "1:48:32", "remaining_time": "0:27:08", "throughput": 1502.0, "total_tokens": 9781248} |
| {"current_steps": 37, "total_steps": 45, "loss": 0.4042, "lr": 7.597595192178702e-06, "epoch": 4.101910828025478, "percentage": 82.22, "elapsed_time": "1:52:42", "remaining_time": "0:24:22", "throughput": 1502.01, "total_tokens": 10158080} |
| {"current_steps": 38, "total_steps": 45, "loss": 0.1847, "lr": 5.852620357053651e-06, "epoch": 4.203821656050955, "percentage": 84.44, "elapsed_time": "1:55:37", "remaining_time": "0:21:17", "throughput": 1502.01, "total_tokens": 10420224} |
| {"current_steps": 39, "total_steps": 45, "loss": 0.167, "lr": 4.322727117869951e-06, "epoch": 4.305732484076433, "percentage": 86.67, "elapsed_time": "1:58:32", "remaining_time": "0:18:14", "throughput": 1501.91, "total_tokens": 10682368} |
| {"current_steps": 40, "total_steps": 45, "loss": 0.1547, "lr": 3.0153689607045845e-06, "epoch": 4.407643312101911, "percentage": 88.89, "elapsed_time": "2:01:27", "remaining_time": "0:15:10", "throughput": 1501.91, "total_tokens": 10944512} |
| {"current_steps": 41, "total_steps": 45, "loss": 0.1575, "lr": 1.9369152030840556e-06, "epoch": 4.509554140127388, "percentage": 91.11, "elapsed_time": "2:04:21", "remaining_time": "0:12:07", "throughput": 1501.94, "total_tokens": 11206656} |
| {"current_steps": 42, "total_steps": 45, "loss": 0.1593, "lr": 1.0926199633097157e-06, "epoch": 4.611464968152866, "percentage": 93.33, "elapsed_time": "2:07:16", "remaining_time": "0:09:05", "throughput": 1501.82, "total_tokens": 11468800} |
| {"current_steps": 43, "total_steps": 45, "loss": 0.1497, "lr": 4.865965629214819e-07, "epoch": 4.713375796178344, "percentage": 95.56, "elapsed_time": "2:10:10", "remaining_time": "0:06:03", "throughput": 1501.89, "total_tokens": 11730944} |
| {"current_steps": 44, "total_steps": 45, "loss": 0.1543, "lr": 1.2179748700879012e-07, "epoch": 4.8152866242038215, "percentage": 97.78, "elapsed_time": "2:13:05", "remaining_time": "0:03:01", "throughput": 1501.94, "total_tokens": 11993088} |
| {"current_steps": 45, "total_steps": 45, "loss": 0.1539, "lr": 0.0, "epoch": 4.917197452229299, "percentage": 100.0, "elapsed_time": "2:15:59", "remaining_time": "0:00:00", "throughput": 1501.97, "total_tokens": 12255232} |
| {"current_steps": 45, "total_steps": 45, "epoch": 4.917197452229299, "percentage": 100.0, "elapsed_time": "2:19:20", "remaining_time": "0:00:00", "throughput": 1465.81, "total_tokens": 12255232} |
|
|