File size: 9,337 Bytes
f0a3978 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 | {"current_steps": 10, "total_steps": 381, "loss": 1.1348, "lr": 2.564102564102564e-06, "epoch": 0.07858546168958742, "percentage": 2.62, "elapsed_time": "0:01:19", "remaining_time": "0:49:17", "throughput": 3586.98, "total_tokens": 285944}
{"current_steps": 20, "total_steps": 381, "loss": 0.9328, "lr": 5.128205128205128e-06, "epoch": 0.15717092337917485, "percentage": 5.25, "elapsed_time": "0:02:35", "remaining_time": "0:46:44", "throughput": 3561.25, "total_tokens": 553248}
{"current_steps": 30, "total_steps": 381, "loss": 0.8484, "lr": 7.692307692307694e-06, "epoch": 0.2357563850687623, "percentage": 7.87, "elapsed_time": "0:03:51", "remaining_time": "0:45:10", "throughput": 3550.6, "total_tokens": 822480}
{"current_steps": 40, "total_steps": 381, "loss": 0.758, "lr": 9.999789047591563e-06, "epoch": 0.3143418467583497, "percentage": 10.5, "elapsed_time": "0:05:06", "remaining_time": "0:43:35", "throughput": 3540.03, "total_tokens": 1085968}
{"current_steps": 50, "total_steps": 381, "loss": 0.7506, "lr": 9.974496289936769e-06, "epoch": 0.3929273084479371, "percentage": 13.12, "elapsed_time": "0:06:21", "remaining_time": "0:42:07", "throughput": 3490.27, "total_tokens": 1332664}
{"current_steps": 60, "total_steps": 381, "loss": 0.7311, "lr": 9.90725746626209e-06, "epoch": 0.4715127701375246, "percentage": 15.75, "elapsed_time": "0:07:38", "remaining_time": "0:40:54", "throughput": 3500.07, "total_tokens": 1605712}
{"current_steps": 70, "total_steps": 381, "loss": 0.6815, "lr": 9.798639549376946e-06, "epoch": 0.550098231827112, "percentage": 18.37, "elapsed_time": "0:08:57", "remaining_time": "0:39:49", "throughput": 3525.5, "total_tokens": 1896456}
{"current_steps": 80, "total_steps": 381, "loss": 0.7245, "lr": 9.64955842986544e-06, "epoch": 0.6286836935166994, "percentage": 21.0, "elapsed_time": "0:10:15", "remaining_time": "0:38:34", "throughput": 3513.82, "total_tokens": 2161224}
{"current_steps": 90, "total_steps": 381, "loss": 0.6255, "lr": 9.461271193091971e-06, "epoch": 0.7072691552062869, "percentage": 23.62, "elapsed_time": "0:11:35", "remaining_time": "0:37:28", "throughput": 3547.83, "total_tokens": 2467224}
{"current_steps": 100, "total_steps": 381, "loss": 0.6309, "lr": 9.23536551917611e-06, "epoch": 0.7858546168958742, "percentage": 26.25, "elapsed_time": "0:12:52", "remaining_time": "0:36:11", "throughput": 3550.65, "total_tokens": 2743848}
{"current_steps": 110, "total_steps": 381, "loss": 0.6661, "lr": 8.973746295318499e-06, "epoch": 0.8644400785854617, "percentage": 28.87, "elapsed_time": "0:14:10", "remaining_time": "0:34:54", "throughput": 3546.57, "total_tokens": 3015224}
{"current_steps": 120, "total_steps": 381, "loss": 0.6815, "lr": 8.67861955336566e-06, "epoch": 0.9430255402750491, "percentage": 31.5, "elapsed_time": "0:15:25", "remaining_time": "0:33:33", "throughput": 3536.24, "total_tokens": 3274408}
{"current_steps": 130, "total_steps": 381, "loss": 0.6733, "lr": 8.352473868055746e-06, "epoch": 1.0216110019646365, "percentage": 34.12, "elapsed_time": "0:16:43", "remaining_time": "0:32:17", "throughput": 3539.58, "total_tokens": 3552384}
{"current_steps": 140, "total_steps": 381, "loss": 0.545, "lr": 7.998059372799409e-06, "epoch": 1.1001964636542239, "percentage": 36.75, "elapsed_time": "0:18:01", "remaining_time": "0:31:01", "throughput": 3533.55, "total_tokens": 3820496}
{"current_steps": 150, "total_steps": 381, "loss": 0.5028, "lr": 7.61836456993939e-06, "epoch": 1.1787819253438114, "percentage": 39.37, "elapsed_time": "0:19:18", "remaining_time": "0:29:43", "throughput": 3527.85, "total_tokens": 4086592}
{"current_steps": 160, "total_steps": 381, "loss": 0.5087, "lr": 7.2165911310299305e-06, "epoch": 1.2573673870333988, "percentage": 41.99, "elapsed_time": "0:20:33", "remaining_time": "0:28:23", "throughput": 3531.64, "total_tokens": 4355776}
{"current_steps": 170, "total_steps": 381, "loss": 0.49, "lr": 6.796126899625688e-06, "epoch": 1.3359528487229864, "percentage": 44.62, "elapsed_time": "0:21:49", "remaining_time": "0:27:05", "throughput": 3538.83, "total_tokens": 4634424}
{"current_steps": 180, "total_steps": 381, "loss": 0.4941, "lr": 6.360517324226676e-06, "epoch": 1.4145383104125737, "percentage": 47.24, "elapsed_time": "0:23:09", "remaining_time": "0:25:51", "throughput": 3532.92, "total_tokens": 4909728}
{"current_steps": 190, "total_steps": 381, "loss": 0.4711, "lr": 5.913435562263036e-06, "epoch": 1.493123772102161, "percentage": 49.87, "elapsed_time": "0:24:26", "remaining_time": "0:24:34", "throughput": 3541.39, "total_tokens": 5195200}
{"current_steps": 200, "total_steps": 381, "loss": 0.497, "lr": 5.458651507209518e-06, "epoch": 1.5717092337917484, "percentage": 52.49, "elapsed_time": "0:25:42", "remaining_time": "0:23:16", "throughput": 3541.12, "total_tokens": 5462608}
{"current_steps": 210, "total_steps": 381, "loss": 0.482, "lr": 5e-06, "epoch": 1.650294695481336, "percentage": 55.12, "elapsed_time": "0:26:57", "remaining_time": "0:21:57", "throughput": 3542.76, "total_tokens": 5730248}
{"current_steps": 220, "total_steps": 381, "loss": 0.5014, "lr": 4.541348492790482e-06, "epoch": 1.7288801571709234, "percentage": 57.74, "elapsed_time": "0:28:12", "remaining_time": "0:20:38", "throughput": 3540.28, "total_tokens": 5990552}
{"current_steps": 230, "total_steps": 381, "loss": 0.4757, "lr": 4.0865644377369666e-06, "epoch": 1.807465618860511, "percentage": 60.37, "elapsed_time": "0:29:29", "remaining_time": "0:19:21", "throughput": 3545.66, "total_tokens": 6273288}
{"current_steps": 240, "total_steps": 381, "loss": 0.4583, "lr": 3.639482675773324e-06, "epoch": 1.8860510805500983, "percentage": 62.99, "elapsed_time": "0:30:47", "remaining_time": "0:18:05", "throughput": 3547.14, "total_tokens": 6553400}
{"current_steps": 250, "total_steps": 381, "loss": 0.4617, "lr": 3.203873100374314e-06, "epoch": 1.9646365422396856, "percentage": 65.62, "elapsed_time": "0:32:05", "remaining_time": "0:16:48", "throughput": 3551.1, "total_tokens": 6836072}
{"current_steps": 260, "total_steps": 381, "loss": 0.4566, "lr": 2.783408868970071e-06, "epoch": 2.043222003929273, "percentage": 68.24, "elapsed_time": "0:33:20", "remaining_time": "0:15:31", "throughput": 3545.74, "total_tokens": 7093808}
{"current_steps": 270, "total_steps": 381, "loss": 0.3637, "lr": 2.381635430060611e-06, "epoch": 2.1218074656188604, "percentage": 70.87, "elapsed_time": "0:34:37", "remaining_time": "0:14:14", "throughput": 3546.82, "total_tokens": 7368800}
{"current_steps": 280, "total_steps": 381, "loss": 0.3459, "lr": 2.0019406272005913e-06, "epoch": 2.2003929273084477, "percentage": 73.49, "elapsed_time": "0:35:56", "remaining_time": "0:12:58", "throughput": 3549.45, "total_tokens": 7655808}
{"current_steps": 290, "total_steps": 381, "loss": 0.3553, "lr": 1.6475261319442553e-06, "epoch": 2.2789783889980355, "percentage": 76.12, "elapsed_time": "0:37:12", "remaining_time": "0:11:40", "throughput": 3544.28, "total_tokens": 7911600}
{"current_steps": 300, "total_steps": 381, "loss": 0.3451, "lr": 1.321380446634342e-06, "epoch": 2.357563850687623, "percentage": 78.74, "elapsed_time": "0:38:29", "remaining_time": "0:10:23", "throughput": 3546.81, "total_tokens": 8192536}
{"current_steps": 310, "total_steps": 381, "loss": 0.3735, "lr": 1.026253704681502e-06, "epoch": 2.43614931237721, "percentage": 81.36, "elapsed_time": "0:39:46", "remaining_time": "0:09:06", "throughput": 3547.47, "total_tokens": 8465008}
{"current_steps": 320, "total_steps": 381, "loss": 0.373, "lr": 7.646344808238904e-07, "epoch": 2.5147347740667976, "percentage": 83.99, "elapsed_time": "0:41:02", "remaining_time": "0:07:49", "throughput": 3546.15, "total_tokens": 8732552}
{"current_steps": 330, "total_steps": 381, "loss": 0.3504, "lr": 5.387288069080298e-07, "epoch": 2.593320235756385, "percentage": 86.61, "elapsed_time": "0:42:20", "remaining_time": "0:06:32", "throughput": 3545.89, "total_tokens": 9006928}
{"current_steps": 340, "total_steps": 381, "loss": 0.3255, "lr": 3.504415701345615e-07, "epoch": 2.6719056974459727, "percentage": 89.24, "elapsed_time": "0:43:37", "remaining_time": "0:05:15", "throughput": 3542.31, "total_tokens": 9272760}
{"current_steps": 350, "total_steps": 381, "loss": 0.337, "lr": 2.0136045062305543e-07, "epoch": 2.75049115913556, "percentage": 91.86, "elapsed_time": "0:44:55", "remaining_time": "0:03:58", "throughput": 3539.36, "total_tokens": 9539904}
{"current_steps": 360, "total_steps": 381, "loss": 0.381, "lr": 9.274253373791064e-08, "epoch": 2.8290766208251474, "percentage": 94.49, "elapsed_time": "0:46:13", "remaining_time": "0:02:41", "throughput": 3538.83, "total_tokens": 9813344}
{"current_steps": 370, "total_steps": 381, "loss": 0.3531, "lr": 2.55037100632316e-08, "epoch": 2.907662082514735, "percentage": 97.11, "elapsed_time": "0:47:29", "remaining_time": "0:01:24", "throughput": 3541.27, "total_tokens": 10090560}
{"current_steps": 380, "total_steps": 381, "loss": 0.359, "lr": 2.1095240843815868e-10, "epoch": 2.986247544204322, "percentage": 99.74, "elapsed_time": "0:48:46", "remaining_time": "0:00:07", "throughput": 3542.56, "total_tokens": 10366800}
{"current_steps": 381, "total_steps": 381, "epoch": 2.994106090373281, "percentage": 100.0, "elapsed_time": "0:50:56", "remaining_time": "0:00:00", "throughput": 3404.23, "total_tokens": 10403944}
|